{"train/loss": 6.4331, "train/learning_rate": 2.2647779629448096e-05, "train/epoch": 0.84, "train/global_step": 3000, "_runtime": 12512, "_timestamp": 1646226791, "_step": 3004, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 19.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 30396.0, 61.0, 10.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4632.0, -4527.953125, -4423.90625, -4319.859375, -4215.8125, -4111.765625, -4007.71875, -3903.671875, -3799.625, -3695.578125, -3591.53125, -3487.484375, -3383.4375, -3279.390625, -3175.34375, -3071.296875, -2967.25, -2863.203125, -2759.15625, -2655.109375, -2551.0625, -2447.015625, -2342.96875, -2238.921875, -2134.875, -2030.828125, -1926.78125, -1822.734375, -1718.6875, -1614.640625, -1510.59375, -1406.546875, -1302.5, -1198.453125, -1094.40625, -990.359375, -886.3125, -782.265625, -678.21875, -574.171875, -470.125, -366.078125, -262.03125, -157.984375, -53.9375, 50.109375, 154.15625, 258.203125, 362.25, 466.296875, 570.34375, 674.390625, 778.4375, 882.484375, 986.53125, 1090.578125, 1194.625, 1298.671875, 1402.71875, 1506.765625, 1610.8125, 1714.859375, 1818.90625, 1922.953125, 2027.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 10.0, 4.0, 7.0, 17.0, 18.0, 56.0, 76.0, 106.0, 185.0, 162.0, 120.0, 101.0, 48.0, 30.0, 18.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2122.14208984375, -2072.442626953125, -2022.7432861328125, -1973.0438232421875, -1923.344482421875, -1873.64501953125, -1823.945556640625, -1774.2462158203125, -1724.546875, -1674.847412109375, -1625.1480712890625, -1575.4486083984375, -1525.749267578125, -1476.0498046875, -1426.350341796875, -1376.6510009765625, -1326.9515380859375, -1277.2520751953125, -1227.552734375, -1177.853271484375, -1128.1539306640625, -1078.4544677734375, -1028.755126953125, -979.0556640625, -929.3562622070312, -879.6568603515625, -829.9574584960938, -780.258056640625, -730.55859375, -680.8592529296875, -631.1597900390625, -581.4603881835938, -531.7608642578125, -482.06146240234375, -432.362060546875, -382.6626281738281, -332.9632263183594, -283.2638244628906, -233.56439208984375, -183.864990234375, -134.16558837890625, -84.46617889404297, -34.76676940917969, 14.932647705078125, 64.63204956054688, 114.33145141601562, 164.0308837890625, 213.73028564453125, 263.4296875, 313.12908935546875, 362.8284912109375, 412.5279235839844, 462.2273254394531, 511.9267272949219, 561.6261596679688, 611.3255615234375, 661.0249633789062, 710.724365234375, 760.4237670898438, 810.1231689453125, 859.8226318359375, 909.52197265625, 959.221435546875, 1008.9208374023438, 1058.6202392578125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 11.0, 6.0, 12.0, 16.0, 11.0, 14.0, 21.0, 25.0, 23.0, 16.0, 32.0, 31.0, 32.0, 43.0, 41.0, 33.0, 33.0, 51.0, 34.0, 37.0, 45.0, 51.0, 39.0, 35.0, 35.0, 29.0, 36.0, 26.0, 30.0, 19.0, 15.0, 19.0, 17.0, 15.0, 9.0, 12.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-624.51416015625, -602.9755249023438, -581.4368896484375, -559.8982543945312, -538.359619140625, -516.821044921875, -495.28240966796875, -473.7437744140625, -452.20513916015625, -430.66650390625, -409.12786865234375, -387.5892639160156, -366.0506286621094, -344.5119934082031, -322.973388671875, -301.43475341796875, -279.8961181640625, -258.35748291015625, -236.81886291503906, -215.28024291992188, -193.74160766601562, -172.20297241210938, -150.6643524169922, -129.125732421875, -107.58709716796875, -86.04846954345703, -64.50984191894531, -42.971214294433594, -21.432586669921875, 0.10604095458984375, 21.644668579101562, 43.18328857421875, 64.721923828125, 86.26055145263672, 107.79917907714844, 129.33779907226562, 150.87643432617188, 172.41506958007812, 193.9536895751953, 215.4923095703125, 237.03094482421875, 258.569580078125, 280.10821533203125, 301.6468200683594, 323.1854553222656, 344.7240905761719, 366.2626953125, 387.80133056640625, 409.3399658203125, 430.87860107421875, 452.417236328125, 473.9558410644531, 495.4944763183594, 517.0330810546875, 538.5717163085938, 560.1103515625, 581.6489868164062, 603.1876220703125, 624.7262573242188, 646.264892578125, 667.803466796875, 689.3421020507812, 710.8807373046875, 732.4193725585938, 753.9580078125]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 8.0, 11.0, 21.0, 25.0, 35.0, 56.0, 80.0, 116.0, 158.0, 218.0, 354.0, 471.0, 636.0, 992.0, 1481.0, 2059.0, 3250.0, 4707.0, 7369.0, 11341.0, 18799.0, 31169.0, 55873.0, 119648.0, 428467.0, 188229.0, 72085.0, 38592.0, 22704.0, 13722.0, 8789.0, 5686.0, 3700.0, 2464.0, 1653.0, 1068.0, 764.0, 512.0, 388.0, 265.0, 170.0, 133.0, 79.0, 59.0, 37.0, 34.0, 18.0, 11.0, 13.0, 12.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1773.0, -1718.765625, -1664.53125, -1610.296875, -1556.0625, -1501.828125, -1447.59375, -1393.359375, -1339.125, -1284.890625, -1230.65625, -1176.421875, -1122.1875, -1067.953125, -1013.71875, -959.484375, -905.25, -851.015625, -796.78125, -742.546875, -688.3125, -634.078125, -579.84375, -525.609375, -471.375, -417.140625, -362.90625, -308.671875, -254.4375, -200.203125, -145.96875, -91.734375, -37.5, 16.734375, 70.96875, 125.203125, 179.4375, 233.671875, 287.90625, 342.140625, 396.375, 450.609375, 504.84375, 559.078125, 613.3125, 667.546875, 721.78125, 776.015625, 830.25, 884.484375, 938.71875, 992.953125, 1047.1875, 1101.421875, 1155.65625, 1209.890625, 1264.125, 1318.359375, 1372.59375, 1426.828125, 1481.0625, 1535.296875, 1589.53125, 1643.765625, 1698.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 9.0, 4.0, 18.0, 13.0, 13.0, 13.0, 12.0, 20.0, 21.0, 26.0, 38.0, 33.0, 49.0, 63.0, 109.0, 151.0, 126.0, 65.0, 32.0, 26.0, 24.0, 17.0, 22.0, 14.0, 18.0, 7.0, 8.0, 14.0, 4.0, 6.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-654.0, -633.921875, -613.84375, -593.765625, -573.6875, -553.609375, -533.53125, -513.453125, -493.375, -473.296875, -453.21875, -433.140625, -413.0625, -392.984375, -372.90625, -352.828125, -332.75, -312.671875, -292.59375, -272.515625, -252.4375, -232.359375, -212.28125, -192.203125, -172.125, -152.046875, -131.96875, -111.890625, -91.8125, -71.734375, -51.65625, -31.578125, -11.5, 8.578125, 28.65625, 48.734375, 68.8125, 88.890625, 108.96875, 129.046875, 149.125, 169.203125, 189.28125, 209.359375, 229.4375, 249.515625, 269.59375, 289.671875, 309.75, 329.828125, 349.90625, 369.984375, 390.0625, 410.140625, 430.21875, 450.296875, 470.375, 490.453125, 510.53125, 530.609375, 550.6875, 570.765625, 590.84375, 610.921875, 631.0]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 6.0, 5.0, 13.0, 21.0, 29.0, 31.0, 31.0, 50.0, 57.0, 85.0, 77.0, 109.0, 76.0, 87.0, 55.0, 55.0, 36.0, 34.0, 20.0, 22.0, 14.0, 13.0, 9.0, 13.0, 6.0, 7.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-420.38818359375, -407.6455383300781, -394.90289306640625, -382.1602478027344, -369.4176025390625, -356.6749572753906, -343.93231201171875, -331.18963623046875, -318.447021484375, -305.7043762207031, -292.96173095703125, -280.2190856933594, -267.4764404296875, -254.73379516601562, -241.9911346435547, -229.2484893798828, -216.50582885742188, -203.76318359375, -191.02053833007812, -178.27789306640625, -165.53524780273438, -152.7926025390625, -140.04994201660156, -127.30729675292969, -114.56465148925781, -101.82200622558594, -89.07936096191406, -76.33670806884766, -63.59406280517578, -50.851417541503906, -38.1087646484375, -25.366119384765625, -12.62347412109375, 0.11917304992675781, 12.861820220947266, 25.604469299316406, 38.34711456298828, 51.089759826660156, 63.83241271972656, 76.57505798339844, 89.31770324707031, 102.06034851074219, 114.80299377441406, 127.54564666748047, 140.28829956054688, 153.03094482421875, 165.77359008789062, 178.5162353515625, 191.25888061523438, 204.00152587890625, 216.74417114257812, 229.48681640625, 242.22946166992188, 254.97210693359375, 267.71478271484375, 280.4573974609375, 293.2000732421875, 305.9427185058594, 318.68536376953125, 331.4280090332031, 344.170654296875, 356.9132995605469, 369.65594482421875, 382.39862060546875, 395.1412353515625]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 6.0, 8.0, 4.0, 13.0, 21.0, 15.0, 27.0, 26.0, 22.0, 35.0, 31.0, 39.0, 20.0, 33.0, 38.0, 30.0, 48.0, 41.0, 42.0, 35.0, 36.0, 39.0, 39.0, 38.0, 33.0, 30.0, 17.0, 37.0, 19.0, 17.0, 23.0, 27.0, 18.0, 8.0, 16.0, 8.0, 3.0, 9.0, 8.0, 5.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-286.638916015625, -277.99169921875, -269.3444519042969, -260.6972351074219, -252.0500030517578, -243.40277099609375, -234.75555419921875, -226.1083221435547, -217.46109008789062, -208.81385803222656, -200.1666259765625, -191.5194091796875, -182.87217712402344, -174.22494506835938, -165.57772827148438, -156.9304962158203, -148.28326416015625, -139.6360321044922, -130.98880004882812, -122.34158325195312, -113.69435119628906, -105.047119140625, -96.39989471435547, -87.75267028808594, -79.10543823242188, -70.45820617675781, -61.81098175048828, -53.163753509521484, -44.51652526855469, -35.86929702758789, -27.222068786621094, -18.574840545654297, -9.9276123046875, -1.2803840637207031, 7.366844177246094, 16.01407241821289, 24.661300659179688, 33.308528900146484, 41.95575714111328, 50.60298538208008, 59.250213623046875, 67.89744567871094, 76.54467010498047, 85.19189453125, 93.83912658691406, 102.48635864257812, 111.13358306884766, 119.78080749511719, 128.42803955078125, 137.0752716064453, 145.72250366210938, 154.36972045898438, 163.01695251464844, 171.6641845703125, 180.3114013671875, 188.95863342285156, 197.60586547851562, 206.2530975341797, 214.90032958984375, 223.54754638671875, 232.1947784423828, 240.84201049804688, 249.48922729492188, 258.136474609375, 266.78369140625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 14.0, 17.0, 22.0, 44.0, 66.0, 86.0, 158.0, 201.0, 350.0, 507.0, 699.0, 1127.0, 1719.0, 2659.0, 4404.0, 7190.0, 12280.0, 22238.0, 41837.0, 85378.0, 211375.0, 1265027.0, 1972747.0, 331615.0, 111230.0, 53185.0, 28344.0, 15908.0, 9148.0, 5366.0, 3282.0, 2111.0, 1321.0, 876.0, 574.0, 378.0, 257.0, 175.0, 106.0, 92.0, 60.0, 27.0, 23.0, 26.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-422.25, -409.12109375, -395.9921875, -382.86328125, -369.734375, -356.60546875, -343.4765625, -330.34765625, -317.21875, -304.08984375, -290.9609375, -277.83203125, -264.703125, -251.57421875, -238.4453125, -225.31640625, -212.1875, -199.05859375, -185.9296875, -172.80078125, -159.671875, -146.54296875, -133.4140625, -120.28515625, -107.15625, -94.02734375, -80.8984375, -67.76953125, -54.640625, -41.51171875, -28.3828125, -15.25390625, -2.125, 11.00390625, 24.1328125, 37.26171875, 50.390625, 63.51953125, 76.6484375, 89.77734375, 102.90625, 116.03515625, 129.1640625, 142.29296875, 155.421875, 168.55078125, 181.6796875, 194.80859375, 207.9375, 221.06640625, 234.1953125, 247.32421875, 260.453125, 273.58203125, 286.7109375, 299.83984375, 312.96875, 326.09765625, 339.2265625, 352.35546875, 365.484375, 378.61328125, 391.7421875, 404.87109375, 418.0]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 20.0, 17.0, 28.0, 20.0, 15.0, 24.0, 36.0, 24.0, 37.0, 30.0, 38.0, 42.0, 33.0, 48.0, 32.0, 40.0, 41.0, 38.0, 27.0, 33.0, 41.0, 32.0, 40.0, 13.0, 35.0, 24.0, 23.0, 23.0, 17.0, 20.0, 5.0, 10.0, 14.0, 7.0, 6.0, 7.0, 3.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-143.0, -138.802734375, -134.60546875, -130.408203125, -126.2109375, -122.013671875, -117.81640625, -113.619140625, -109.421875, -105.224609375, -101.02734375, -96.830078125, -92.6328125, -88.435546875, -84.23828125, -80.041015625, -75.84375, -71.646484375, -67.44921875, -63.251953125, -59.0546875, -54.857421875, -50.66015625, -46.462890625, -42.265625, -38.068359375, -33.87109375, -29.673828125, -25.4765625, -21.279296875, -17.08203125, -12.884765625, -8.6875, -4.490234375, -0.29296875, 3.904296875, 8.1015625, 12.298828125, 16.49609375, 20.693359375, 24.890625, 29.087890625, 33.28515625, 37.482421875, 41.6796875, 45.876953125, 50.07421875, 54.271484375, 58.46875, 62.666015625, 66.86328125, 71.060546875, 75.2578125, 79.455078125, 83.65234375, 87.849609375, 92.046875, 96.244140625, 100.44140625, 104.638671875, 108.8359375, 113.033203125, 117.23046875, 121.427734375, 125.625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 5.0, 8.0, 14.0, 18.0, 31.0, 34.0, 65.0, 68.0, 127.0, 231.0, 309.0, 427.0, 712.0, 1076.0, 1652.0, 2622.0, 4289.0, 7256.0, 12045.0, 21729.0, 40284.0, 77446.0, 164186.0, 397852.0, 1412728.0, 1338837.0, 384071.0, 159529.0, 76100.0, 39117.0, 21140.0, 12168.0, 6893.0, 4211.0, 2632.0, 1573.0, 984.0, 680.0, 384.0, 256.0, 158.0, 85.0, 79.0, 59.0, 40.0, 30.0, 17.0, 13.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-273.25, -264.96484375, -256.6796875, -248.39453125, -240.109375, -231.82421875, -223.5390625, -215.25390625, -206.96875, -198.68359375, -190.3984375, -182.11328125, -173.828125, -165.54296875, -157.2578125, -148.97265625, -140.6875, -132.40234375, -124.1171875, -115.83203125, -107.546875, -99.26171875, -90.9765625, -82.69140625, -74.40625, -66.12109375, -57.8359375, -49.55078125, -41.265625, -32.98046875, -24.6953125, -16.41015625, -8.125, 0.16015625, 8.4453125, 16.73046875, 25.015625, 33.30078125, 41.5859375, 49.87109375, 58.15625, 66.44140625, 74.7265625, 83.01171875, 91.296875, 99.58203125, 107.8671875, 116.15234375, 124.4375, 132.72265625, 141.0078125, 149.29296875, 157.578125, 165.86328125, 174.1484375, 182.43359375, 190.71875, 199.00390625, 207.2890625, 215.57421875, 223.859375, 232.14453125, 240.4296875, 248.71484375, 257.0]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 12.0, 13.0, 24.0, 21.0, 34.0, 40.0, 36.0, 60.0, 75.0, 76.0, 128.0, 165.0, 194.0, 244.0, 377.0, 525.0, 552.0, 357.0, 253.0, 209.0, 134.0, 104.0, 92.0, 73.0, 41.0, 46.0, 26.0, 37.0, 21.0, 11.0, 7.0, 20.0, 6.0, 10.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-92.5, -89.7783203125, -87.056640625, -84.3349609375, -81.61328125, -78.8916015625, -76.169921875, -73.4482421875, -70.7265625, -68.0048828125, -65.283203125, -62.5615234375, -59.83984375, -57.1181640625, -54.396484375, -51.6748046875, -48.953125, -46.2314453125, -43.509765625, -40.7880859375, -38.06640625, -35.3447265625, -32.623046875, -29.9013671875, -27.1796875, -24.4580078125, -21.736328125, -19.0146484375, -16.29296875, -13.5712890625, -10.849609375, -8.1279296875, -5.40625, -2.6845703125, 0.037109375, 2.7587890625, 5.48046875, 8.2021484375, 10.923828125, 13.6455078125, 16.3671875, 19.0888671875, 21.810546875, 24.5322265625, 27.25390625, 29.9755859375, 32.697265625, 35.4189453125, 38.140625, 40.8623046875, 43.583984375, 46.3056640625, 49.02734375, 51.7490234375, 54.470703125, 57.1923828125, 59.9140625, 62.6357421875, 65.357421875, 68.0791015625, 70.80078125, 73.5224609375, 76.244140625, 78.9658203125, 81.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 3.0, 10.0, 11.0, 18.0, 33.0, 32.0, 39.0, 49.0, 75.0, 71.0, 96.0, 98.0, 91.0, 86.0, 68.0, 56.0, 36.0, 38.0, 21.0, 14.0, 15.0, 5.0, 11.0, 5.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.8419189453125, -283.3953552246094, -274.9488220214844, -266.50225830078125, -258.05572509765625, -249.60916137695312, -241.16259765625, -232.71604919433594, -224.26950073242188, -215.8229522705078, -207.37640380859375, -198.92984008789062, -190.48329162597656, -182.0367431640625, -173.59017944335938, -165.1436309814453, -156.69708251953125, -148.2505340576172, -139.80398559570312, -131.357421875, -122.91087341308594, -114.46432495117188, -106.01776885986328, -97.57121276855469, -89.12466430664062, -80.67811584472656, -72.23155975341797, -63.78500747680664, -55.33845520019531, -46.891902923583984, -38.445350646972656, -29.998798370361328, -21.552230834960938, -13.10567855834961, -4.659126281738281, 3.787425994873047, 12.233978271484375, 20.680530548095703, 29.12708282470703, 37.57363510131836, 46.02018737792969, 54.466739654541016, 62.913291931152344, 71.35984802246094, 79.806396484375, 88.25294494628906, 96.69950103759766, 105.14605712890625, 113.59260559082031, 122.03915405273438, 130.4857177734375, 138.93226623535156, 147.37881469726562, 155.8253631591797, 164.27191162109375, 172.71847534179688, 181.16502380371094, 189.611572265625, 198.05813598632812, 206.5046844482422, 214.95123291015625, 223.3977813720703, 231.84432983398438, 240.2908935546875, 248.73744201660156]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 3.0, 3.0, 6.0, 17.0, 13.0, 18.0, 21.0, 17.0, 18.0, 18.0, 26.0, 29.0, 38.0, 25.0, 39.0, 37.0, 41.0, 33.0, 44.0, 39.0, 36.0, 30.0, 35.0, 44.0, 33.0, 38.0, 42.0, 25.0, 27.0, 18.0, 21.0, 26.0, 19.0, 16.0, 15.0, 10.0, 15.0, 13.0, 10.0, 5.0, 5.0, 5.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-172.21194458007812, -167.1827850341797, -162.15362548828125, -157.12448120117188, -152.09532165527344, -147.066162109375, -142.03700256347656, -137.00784301757812, -131.97869873046875, -126.94953918457031, -121.9203872680664, -116.89122772216797, -111.86207580566406, -106.83291625976562, -101.80375671386719, -96.77459716796875, -91.74543762207031, -86.71627807617188, -81.68712615966797, -76.65796661376953, -71.62881469726562, -66.59965515136719, -61.57049560546875, -56.54133987426758, -51.512184143066406, -46.483028411865234, -41.45387268066406, -36.424713134765625, -31.395557403564453, -26.36640167236328, -21.337244033813477, -16.308086395263672, -11.278915405273438, -6.249758720397949, -1.220602035522461, 3.8085546493530273, 8.837711334228516, 13.866867065429688, 18.896024703979492, 23.925182342529297, 28.95433807373047, 33.98349380493164, 39.01264953613281, 44.04180908203125, 49.07096481323242, 54.100120544433594, 59.12928009033203, 64.15843200683594, 69.18759155273438, 74.21675109863281, 79.24590301513672, 84.27506256103516, 89.30421447753906, 94.3333740234375, 99.36253356933594, 104.39169311523438, 109.42084503173828, 114.45000457763672, 119.47915649414062, 124.50831604003906, 129.5374755859375, 134.56661987304688, 139.5957794189453, 144.62493896484375, 149.6540985107422]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 12.0, 14.0, 21.0, 24.0, 42.0, 75.0, 129.0, 182.0, 283.0, 490.0, 713.0, 1233.0, 2112.0, 3446.0, 5930.0, 10295.0, 18581.0, 34939.0, 67290.0, 138655.0, 281288.0, 241556.0, 116213.0, 57394.0, 29473.0, 16094.0, 9133.0, 5180.0, 2956.0, 1831.0, 1116.0, 657.0, 449.0, 273.0, 158.0, 123.0, 76.0, 41.0, 34.0, 14.0, 13.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-222.0, -215.447265625, -208.89453125, -202.341796875, -195.7890625, -189.236328125, -182.68359375, -176.130859375, -169.578125, -163.025390625, -156.47265625, -149.919921875, -143.3671875, -136.814453125, -130.26171875, -123.708984375, -117.15625, -110.603515625, -104.05078125, -97.498046875, -90.9453125, -84.392578125, -77.83984375, -71.287109375, -64.734375, -58.181640625, -51.62890625, -45.076171875, -38.5234375, -31.970703125, -25.41796875, -18.865234375, -12.3125, -5.759765625, 0.79296875, 7.345703125, 13.8984375, 20.451171875, 27.00390625, 33.556640625, 40.109375, 46.662109375, 53.21484375, 59.767578125, 66.3203125, 72.873046875, 79.42578125, 85.978515625, 92.53125, 99.083984375, 105.63671875, 112.189453125, 118.7421875, 125.294921875, 131.84765625, 138.400390625, 144.953125, 151.505859375, 158.05859375, 164.611328125, 171.1640625, 177.716796875, 184.26953125, 190.822265625, 197.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 10.0, 12.0, 19.0, 15.0, 16.0, 17.0, 25.0, 28.0, 22.0, 42.0, 44.0, 23.0, 32.0, 36.0, 31.0, 34.0, 45.0, 43.0, 34.0, 40.0, 43.0, 37.0, 28.0, 34.0, 33.0, 26.0, 30.0, 22.0, 21.0, 18.0, 20.0, 15.0, 21.0, 12.0, 6.0, 10.0, 4.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.625, -139.9609375, -135.296875, -130.6328125, -125.96875, -121.3046875, -116.640625, -111.9765625, -107.3125, -102.6484375, -97.984375, -93.3203125, -88.65625, -83.9921875, -79.328125, -74.6640625, -70.0, -65.3359375, -60.671875, -56.0078125, -51.34375, -46.6796875, -42.015625, -37.3515625, -32.6875, -28.0234375, -23.359375, -18.6953125, -14.03125, -9.3671875, -4.703125, -0.0390625, 4.625, 9.2890625, 13.953125, 18.6171875, 23.28125, 27.9453125, 32.609375, 37.2734375, 41.9375, 46.6015625, 51.265625, 55.9296875, 60.59375, 65.2578125, 69.921875, 74.5859375, 79.25, 83.9140625, 88.578125, 93.2421875, 97.90625, 102.5703125, 107.234375, 111.8984375, 116.5625, 121.2265625, 125.890625, 130.5546875, 135.21875, 139.8828125, 144.546875, 149.2109375, 153.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 4.0, 9.0, 22.0, 27.0, 27.0, 52.0, 74.0, 116.0, 142.0, 250.0, 374.0, 512.0, 915.0, 1419.0, 2331.0, 4192.0, 7628.0, 13766.0, 27316.0, 62695.0, 210408.0, 495813.0, 127649.0, 46028.0, 21229.0, 11011.0, 6065.0, 3300.0, 1960.0, 1175.0, 711.0, 425.0, 279.0, 180.0, 133.0, 97.0, 68.0, 44.0, 22.0, 25.0, 16.0, 14.0, 14.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-179.25, -174.02734375, -168.8046875, -163.58203125, -158.359375, -153.13671875, -147.9140625, -142.69140625, -137.46875, -132.24609375, -127.0234375, -121.80078125, -116.578125, -111.35546875, -106.1328125, -100.91015625, -95.6875, -90.46484375, -85.2421875, -80.01953125, -74.796875, -69.57421875, -64.3515625, -59.12890625, -53.90625, -48.68359375, -43.4609375, -38.23828125, -33.015625, -27.79296875, -22.5703125, -17.34765625, -12.125, -6.90234375, -1.6796875, 3.54296875, 8.765625, 13.98828125, 19.2109375, 24.43359375, 29.65625, 34.87890625, 40.1015625, 45.32421875, 50.546875, 55.76953125, 60.9921875, 66.21484375, 71.4375, 76.66015625, 81.8828125, 87.10546875, 92.328125, 97.55078125, 102.7734375, 107.99609375, 113.21875, 118.44140625, 123.6640625, 128.88671875, 134.109375, 139.33203125, 144.5546875, 149.77734375, 155.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 10.0, 5.0, 7.0, 8.0, 16.0, 16.0, 18.0, 13.0, 21.0, 16.0, 20.0, 26.0, 22.0, 34.0, 18.0, 33.0, 35.0, 30.0, 37.0, 34.0, 28.0, 26.0, 34.0, 32.0, 33.0, 30.0, 31.0, 38.0, 33.0, 27.0, 37.0, 26.0, 33.0, 25.0, 16.0, 18.0, 12.0, 12.0, 18.0, 17.0, 7.0, 12.0, 9.0, 4.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-119.4375, -115.4423828125, -111.447265625, -107.4521484375, -103.45703125, -99.4619140625, -95.466796875, -91.4716796875, -87.4765625, -83.4814453125, -79.486328125, -75.4912109375, -71.49609375, -67.5009765625, -63.505859375, -59.5107421875, -55.515625, -51.5205078125, -47.525390625, -43.5302734375, -39.53515625, -35.5400390625, -31.544921875, -27.5498046875, -23.5546875, -19.5595703125, -15.564453125, -11.5693359375, -7.57421875, -3.5791015625, 0.416015625, 4.4111328125, 8.40625, 12.4013671875, 16.396484375, 20.3916015625, 24.38671875, 28.3818359375, 32.376953125, 36.3720703125, 40.3671875, 44.3623046875, 48.357421875, 52.3525390625, 56.34765625, 60.3427734375, 64.337890625, 68.3330078125, 72.328125, 76.3232421875, 80.318359375, 84.3134765625, 88.30859375, 92.3037109375, 96.298828125, 100.2939453125, 104.2890625, 108.2841796875, 112.279296875, 116.2744140625, 120.26953125, 124.2646484375, 128.259765625, 132.2548828125, 136.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 16.0, 15.0, 13.0, 34.0, 51.0, 37.0, 74.0, 102.0, 133.0, 222.0, 292.0, 508.0, 705.0, 1110.0, 1724.0, 3109.0, 6350.0, 15837.0, 63854.0, 758871.0, 151230.0, 25426.0, 8622.0, 4037.0, 2183.0, 1299.0, 855.0, 574.0, 375.0, 290.0, 178.0, 126.0, 84.0, 61.0, 32.0, 29.0, 12.0, 13.0, 14.0, 12.0, 9.0, 1.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-276.0, -267.29296875, -258.5859375, -249.87890625, -241.171875, -232.46484375, -223.7578125, -215.05078125, -206.34375, -197.63671875, -188.9296875, -180.22265625, -171.515625, -162.80859375, -154.1015625, -145.39453125, -136.6875, -127.98046875, -119.2734375, -110.56640625, -101.859375, -93.15234375, -84.4453125, -75.73828125, -67.03125, -58.32421875, -49.6171875, -40.91015625, -32.203125, -23.49609375, -14.7890625, -6.08203125, 2.625, 11.33203125, 20.0390625, 28.74609375, 37.453125, 46.16015625, 54.8671875, 63.57421875, 72.28125, 80.98828125, 89.6953125, 98.40234375, 107.109375, 115.81640625, 124.5234375, 133.23046875, 141.9375, 150.64453125, 159.3515625, 168.05859375, 176.765625, 185.47265625, 194.1796875, 202.88671875, 211.59375, 220.30078125, 229.0078125, 237.71484375, 246.421875, 255.12890625, 263.8359375, 272.54296875, 281.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 16.0, 13.0, 19.0, 20.0, 42.0, 71.0, 90.0, 106.0, 145.0, 148.0, 111.0, 71.0, 54.0, 41.0, 22.0, 13.0, 5.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.0193326473236084, -0.018859386444091797, -0.018386125564575195, -0.017912864685058594, -0.017439603805541992, -0.01696634292602539, -0.01649308204650879, -0.016019821166992188, -0.015546560287475586, -0.015073299407958984, -0.014600038528442383, -0.014126777648925781, -0.01365351676940918, -0.013180255889892578, -0.012706995010375977, -0.012233734130859375, -0.011760473251342773, -0.011287212371826172, -0.01081395149230957, -0.010340690612792969, -0.009867429733276367, -0.009394168853759766, -0.008920907974243164, -0.008447647094726562, -0.007974386215209961, -0.007501125335693359, -0.007027864456176758, -0.006554603576660156, -0.006081342697143555, -0.005608081817626953, -0.0051348209381103516, -0.00466156005859375, -0.0041882991790771484, -0.003715038299560547, -0.0032417774200439453, -0.0027685165405273438, -0.002295255661010742, -0.0018219947814941406, -0.001348733901977539, -0.0008754730224609375, -0.00040221214294433594, 7.104873657226562e-05, 0.0005443096160888672, 0.0010175704956054688, 0.0014908313751220703, 0.001964092254638672, 0.0024373531341552734, 0.002910614013671875, 0.0033838748931884766, 0.003857135772705078, 0.00433039665222168, 0.004803657531738281, 0.005276918411254883, 0.005750179290771484, 0.006223440170288086, 0.0066967010498046875, 0.007169961929321289, 0.007643222808837891, 0.008116483688354492, 0.008589744567871094, 0.009063005447387695, 0.009536266326904297, 0.010009527206420898, 0.0104827880859375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 17.0, 17.0, 21.0, 32.0, 38.0, 45.0, 82.0, 107.0, 154.0, 201.0, 329.0, 466.0, 838.0, 1599.0, 2947.0, 5950.0, 12867.0, 38022.0, 313260.0, 587986.0, 53003.0, 15629.0, 7002.0, 3414.0, 1797.0, 1029.0, 568.0, 355.0, 236.0, 161.0, 86.0, 86.0, 61.0, 32.0, 32.0, 28.0, 8.0, 11.0, 10.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.25, -311.546875, -300.84375, -290.140625, -279.4375, -268.734375, -258.03125, -247.328125, -236.625, -225.921875, -215.21875, -204.515625, -193.8125, -183.109375, -172.40625, -161.703125, -151.0, -140.296875, -129.59375, -118.890625, -108.1875, -97.484375, -86.78125, -76.078125, -65.375, -54.671875, -43.96875, -33.265625, -22.5625, -11.859375, -1.15625, 9.546875, 20.25, 30.953125, 41.65625, 52.359375, 63.0625, 73.765625, 84.46875, 95.171875, 105.875, 116.578125, 127.28125, 137.984375, 148.6875, 159.390625, 170.09375, 180.796875, 191.5, 202.203125, 212.90625, 223.609375, 234.3125, 245.015625, 255.71875, 266.421875, 277.125, 287.828125, 298.53125, 309.234375, 319.9375, 330.640625, 341.34375, 352.046875, 362.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 7.0, 6.0, 8.0, 12.0, 15.0, 13.0, 49.0, 115.0, 260.0, 245.0, 115.0, 52.0, 26.0, 17.0, 12.0, 9.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.25, -108.39453125, -105.5390625, -102.68359375, -99.828125, -96.97265625, -94.1171875, -91.26171875, -88.40625, -85.55078125, -82.6953125, -79.83984375, -76.984375, -74.12890625, -71.2734375, -68.41796875, -65.5625, -62.70703125, -59.8515625, -56.99609375, -54.140625, -51.28515625, -48.4296875, -45.57421875, -42.71875, -39.86328125, -37.0078125, -34.15234375, -31.296875, -28.44140625, -25.5859375, -22.73046875, -19.875, -17.01953125, -14.1640625, -11.30859375, -8.453125, -5.59765625, -2.7421875, 0.11328125, 2.96875, 5.82421875, 8.6796875, 11.53515625, 14.390625, 17.24609375, 20.1015625, 22.95703125, 25.8125, 28.66796875, 31.5234375, 34.37890625, 37.234375, 40.08984375, 42.9453125, 45.80078125, 48.65625, 51.51171875, 54.3671875, 57.22265625, 60.078125, 62.93359375, 65.7890625, 68.64453125, 71.5]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 10.0, 12.0, 18.0, 21.0, 28.0, 25.0, 34.0, 51.0, 62.0, 81.0, 98.0, 100.0, 98.0, 74.0, 54.0, 38.0, 35.0, 35.0, 30.0, 26.0, 18.0, 10.0, 12.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-258.6842346191406, -251.5355224609375, -244.3867950439453, -237.2380828857422, -230.08935546875, -222.94064331054688, -215.79193115234375, -208.64320373535156, -201.49447631835938, -194.34576416015625, -187.19703674316406, -180.04832458496094, -172.89959716796875, -165.75088500976562, -158.6021728515625, -151.4534454345703, -144.3047332763672, -137.15602111816406, -130.00729370117188, -122.85858154296875, -115.70985412597656, -108.56114196777344, -101.41242218017578, -94.26370239257812, -87.11498260498047, -79.96626281738281, -72.81754302978516, -65.6688232421875, -58.52010726928711, -51.37138748168945, -44.22267150878906, -37.073951721191406, -29.925216674804688, -22.77649688720703, -15.627779006958008, -8.479061126708984, -1.3303413391113281, 5.818378448486328, 12.967094421386719, 20.115814208984375, 27.26453399658203, 34.41325378417969, 41.561973571777344, 48.710689544677734, 55.85940933227539, 63.00812911987305, 70.15684509277344, 77.3055648803711, 84.45428466796875, 91.6030044555664, 98.75172424316406, 105.90043640136719, 113.04916381835938, 120.1978759765625, 127.34659576416016, 134.4953155517578, 141.64404296875, 148.79275512695312, 155.9414825439453, 163.09019470214844, 170.23892211914062, 177.38763427734375, 184.53634643554688, 191.68507385253906, 198.8337860107422]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 8.0, 7.0, 7.0, 13.0, 11.0, 9.0, 18.0, 17.0, 19.0, 20.0, 31.0, 33.0, 28.0, 32.0, 22.0, 29.0, 33.0, 35.0, 44.0, 39.0, 52.0, 52.0, 38.0, 39.0, 35.0, 32.0, 39.0, 28.0, 25.0, 25.0, 21.0, 28.0, 15.0, 21.0, 14.0, 11.0, 13.0, 8.0, 7.0, 8.0, 11.0, 7.0, 0.0, 0.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-153.67152404785156, -149.09848022460938, -144.52545166015625, -139.95240783691406, -135.37936401367188, -130.80633544921875, -126.23329162597656, -121.6602554321289, -117.08721923828125, -112.5141830444336, -107.9411392211914, -103.36810302734375, -98.7950668334961, -94.22203063964844, -89.64898681640625, -85.0759506225586, -80.5029067993164, -75.92987060546875, -71.35682678222656, -66.7837905883789, -62.21075439453125, -57.63771438598633, -53.064674377441406, -48.49163818359375, -43.91859817504883, -39.345558166503906, -34.77252197265625, -30.199481964111328, -25.62644386291504, -21.05340576171875, -16.480365753173828, -11.907329559326172, -7.33428955078125, -2.7612509727478027, 1.8117876052856445, 6.38482666015625, 10.957864761352539, 15.530902862548828, 20.10394287109375, 24.676979064941406, 29.250019073486328, 33.82305908203125, 38.396095275878906, 42.96913528442383, 47.54217529296875, 52.115211486816406, 56.68825149536133, 61.261287689208984, 65.8343276977539, 70.40736389160156, 74.98040771484375, 79.5534439086914, 84.12648010253906, 88.69952392578125, 93.2725601196289, 97.84559631347656, 102.41864013671875, 106.9916763305664, 111.5647201538086, 116.13775634765625, 120.7107925415039, 125.28382873535156, 129.85687255859375, 134.42990112304688, 139.00294494628906]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 3.0, 5.0, 12.0, 9.0, 22.0, 23.0, 45.0, 52.0, 85.0, 135.0, 185.0, 310.0, 550.0, 807.0, 1373.0, 2288.0, 3916.0, 6912.0, 12332.0, 21981.0, 40496.0, 79353.0, 164080.0, 282209.0, 212967.0, 103695.0, 51439.0, 27627.0, 15150.0, 8431.0, 4811.0, 2841.0, 1689.0, 988.0, 600.0, 394.0, 242.0, 138.0, 105.0, 85.0, 49.0, 29.0, 16.0, 18.0, 15.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-303.25, -293.03515625, -282.8203125, -272.60546875, -262.390625, -252.17578125, -241.9609375, -231.74609375, -221.53125, -211.31640625, -201.1015625, -190.88671875, -180.671875, -170.45703125, -160.2421875, -150.02734375, -139.8125, -129.59765625, -119.3828125, -109.16796875, -98.953125, -88.73828125, -78.5234375, -68.30859375, -58.09375, -47.87890625, -37.6640625, -27.44921875, -17.234375, -7.01953125, 3.1953125, 13.41015625, 23.625, 33.83984375, 44.0546875, 54.26953125, 64.484375, 74.69921875, 84.9140625, 95.12890625, 105.34375, 115.55859375, 125.7734375, 135.98828125, 146.203125, 156.41796875, 166.6328125, 176.84765625, 187.0625, 197.27734375, 207.4921875, 217.70703125, 227.921875, 238.13671875, 248.3515625, 258.56640625, 268.78125, 278.99609375, 289.2109375, 299.42578125, 309.640625, 319.85546875, 330.0703125, 340.28515625, 350.5]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 11.0, 6.0, 15.0, 14.0, 23.0, 21.0, 23.0, 36.0, 27.0, 37.0, 25.0, 33.0, 30.0, 34.0, 48.0, 41.0, 42.0, 50.0, 31.0, 43.0, 44.0, 45.0, 37.0, 31.0, 29.0, 25.0, 27.0, 21.0, 14.0, 16.0, 18.0, 20.0, 12.0, 13.0, 15.0, 5.0, 3.0, 5.0, 1.0, 4.0, 5.0, 0.0, 6.0, 3.0, 2.0, 2.0], "bins": [-113.375, -110.189453125, -107.00390625, -103.818359375, -100.6328125, -97.447265625, -94.26171875, -91.076171875, -87.890625, -84.705078125, -81.51953125, -78.333984375, -75.1484375, -71.962890625, -68.77734375, -65.591796875, -62.40625, -59.220703125, -56.03515625, -52.849609375, -49.6640625, -46.478515625, -43.29296875, -40.107421875, -36.921875, -33.736328125, -30.55078125, -27.365234375, -24.1796875, -20.994140625, -17.80859375, -14.623046875, -11.4375, -8.251953125, -5.06640625, -1.880859375, 1.3046875, 4.490234375, 7.67578125, 10.861328125, 14.046875, 17.232421875, 20.41796875, 23.603515625, 26.7890625, 29.974609375, 33.16015625, 36.345703125, 39.53125, 42.716796875, 45.90234375, 49.087890625, 52.2734375, 55.458984375, 58.64453125, 61.830078125, 65.015625, 68.201171875, 71.38671875, 74.572265625, 77.7578125, 80.943359375, 84.12890625, 87.314453125, 90.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 12.0, 13.0, 11.0, 17.0, 30.0, 37.0, 73.0, 92.0, 170.0, 215.0, 331.0, 549.0, 829.0, 1178.0, 1873.0, 2668.0, 4412.0, 6628.0, 10561.0, 16969.0, 26970.0, 44351.0, 75369.0, 130890.0, 211123.0, 204620.0, 124344.0, 71445.0, 42280.0, 26109.0, 15841.0, 10157.0, 6286.0, 4168.0, 2668.0, 1769.0, 1131.0, 782.0, 513.0, 361.0, 221.0, 165.0, 124.0, 68.0, 40.0, 28.0, 27.0, 17.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-211.875, -205.244140625, -198.61328125, -191.982421875, -185.3515625, -178.720703125, -172.08984375, -165.458984375, -158.828125, -152.197265625, -145.56640625, -138.935546875, -132.3046875, -125.673828125, -119.04296875, -112.412109375, -105.78125, -99.150390625, -92.51953125, -85.888671875, -79.2578125, -72.626953125, -65.99609375, -59.365234375, -52.734375, -46.103515625, -39.47265625, -32.841796875, -26.2109375, -19.580078125, -12.94921875, -6.318359375, 0.3125, 6.943359375, 13.57421875, 20.205078125, 26.8359375, 33.466796875, 40.09765625, 46.728515625, 53.359375, 59.990234375, 66.62109375, 73.251953125, 79.8828125, 86.513671875, 93.14453125, 99.775390625, 106.40625, 113.037109375, 119.66796875, 126.298828125, 132.9296875, 139.560546875, 146.19140625, 152.822265625, 159.453125, 166.083984375, 172.71484375, 179.345703125, 185.9765625, 192.607421875, 199.23828125, 205.869140625, 212.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 4.0, 9.0, 11.0, 5.0, 11.0, 8.0, 18.0, 18.0, 16.0, 18.0, 33.0, 31.0, 31.0, 31.0, 33.0, 23.0, 34.0, 34.0, 43.0, 43.0, 46.0, 41.0, 41.0, 33.0, 38.0, 35.0, 41.0, 40.0, 37.0, 29.0, 29.0, 18.0, 29.0, 18.0, 10.0, 10.0, 15.0, 10.0, 6.0, 4.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -63.9541015625, -61.470703125, -58.9873046875, -56.50390625, -54.0205078125, -51.537109375, -49.0537109375, -46.5703125, -44.0869140625, -41.603515625, -39.1201171875, -36.63671875, -34.1533203125, -31.669921875, -29.1865234375, -26.703125, -24.2197265625, -21.736328125, -19.2529296875, -16.76953125, -14.2861328125, -11.802734375, -9.3193359375, -6.8359375, -4.3525390625, -1.869140625, 0.6142578125, 3.09765625, 5.5810546875, 8.064453125, 10.5478515625, 13.03125, 15.5146484375, 17.998046875, 20.4814453125, 22.96484375, 25.4482421875, 27.931640625, 30.4150390625, 32.8984375, 35.3818359375, 37.865234375, 40.3486328125, 42.83203125, 45.3154296875, 47.798828125, 50.2822265625, 52.765625, 55.2490234375, 57.732421875, 60.2158203125, 62.69921875, 65.1826171875, 67.666015625, 70.1494140625, 72.6328125, 75.1162109375, 77.599609375, 80.0830078125, 82.56640625, 85.0498046875, 87.533203125, 90.0166015625, 92.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 5.0, 13.0, 13.0, 17.0, 20.0, 32.0, 33.0, 44.0, 62.0, 85.0, 104.0, 149.0, 202.0, 282.0, 429.0, 584.0, 825.0, 1323.0, 2047.0, 3605.0, 6665.0, 13751.0, 31118.0, 86917.0, 420840.0, 344732.0, 77394.0, 28900.0, 12526.0, 6329.0, 3453.0, 2036.0, 1272.0, 815.0, 525.0, 362.0, 251.0, 223.0, 137.0, 95.0, 91.0, 65.0, 43.0, 40.0, 26.0, 19.0, 12.0, 10.0, 12.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 3.0], "bins": [-221.125, -214.4140625, -207.703125, -200.9921875, -194.28125, -187.5703125, -180.859375, -174.1484375, -167.4375, -160.7265625, -154.015625, -147.3046875, -140.59375, -133.8828125, -127.171875, -120.4609375, -113.75, -107.0390625, -100.328125, -93.6171875, -86.90625, -80.1953125, -73.484375, -66.7734375, -60.0625, -53.3515625, -46.640625, -39.9296875, -33.21875, -26.5078125, -19.796875, -13.0859375, -6.375, 0.3359375, 7.046875, 13.7578125, 20.46875, 27.1796875, 33.890625, 40.6015625, 47.3125, 54.0234375, 60.734375, 67.4453125, 74.15625, 80.8671875, 87.578125, 94.2890625, 101.0, 107.7109375, 114.421875, 121.1328125, 127.84375, 134.5546875, 141.265625, 147.9765625, 154.6875, 161.3984375, 168.109375, 174.8203125, 181.53125, 188.2421875, 194.953125, 201.6640625, 208.375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 14.0, 27.0, 48.0, 55.0, 96.0, 168.0, 194.0, 132.0, 107.0, 45.0, 31.0, 23.0, 15.0, 7.0, 4.0, 7.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145263671875, -0.013927459716796875, -0.01332855224609375, -0.012729644775390625, -0.0121307373046875, -0.011531829833984375, -0.01093292236328125, -0.010334014892578125, -0.009735107421875, -0.009136199951171875, -0.00853729248046875, -0.007938385009765625, -0.0073394775390625, -0.006740570068359375, -0.00614166259765625, -0.005542755126953125, -0.00494384765625, -0.004344940185546875, -0.00374603271484375, -0.003147125244140625, -0.0025482177734375, -0.001949310302734375, -0.00135040283203125, -0.000751495361328125, -0.000152587890625, 0.000446319580078125, 0.00104522705078125, 0.001644134521484375, 0.0022430419921875, 0.002841949462890625, 0.00344085693359375, 0.004039764404296875, 0.004638671875, 0.005237579345703125, 0.00583648681640625, 0.006435394287109375, 0.0070343017578125, 0.007633209228515625, 0.00823211669921875, 0.008831024169921875, 0.009429931640625, 0.010028839111328125, 0.01062774658203125, 0.011226654052734375, 0.0118255615234375, 0.012424468994140625, 0.01302337646484375, 0.013622283935546875, 0.01422119140625, 0.014820098876953125, 0.01541900634765625, 0.016017913818359375, 0.0166168212890625, 0.017215728759765625, 0.01781463623046875, 0.018413543701171875, 0.019012451171875, 0.019611358642578125, 0.02021026611328125, 0.020809173583984375, 0.0214080810546875, 0.022006988525390625, 0.02260589599609375, 0.023204803466796875, 0.0238037109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 15.0, 10.0, 18.0, 31.0, 32.0, 49.0, 74.0, 92.0, 159.0, 218.0, 282.0, 459.0, 729.0, 1054.0, 1697.0, 2779.0, 5504.0, 14353.0, 63841.0, 635279.0, 266988.0, 34463.0, 9606.0, 4233.0, 2337.0, 1402.0, 929.0, 598.0, 401.0, 274.0, 196.0, 120.0, 107.0, 65.0, 39.0, 27.0, 24.0, 10.0, 10.0, 13.0, 9.0, 9.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-334.25, -323.74609375, -313.2421875, -302.73828125, -292.234375, -281.73046875, -271.2265625, -260.72265625, -250.21875, -239.71484375, -229.2109375, -218.70703125, -208.203125, -197.69921875, -187.1953125, -176.69140625, -166.1875, -155.68359375, -145.1796875, -134.67578125, -124.171875, -113.66796875, -103.1640625, -92.66015625, -82.15625, -71.65234375, -61.1484375, -50.64453125, -40.140625, -29.63671875, -19.1328125, -8.62890625, 1.875, 12.37890625, 22.8828125, 33.38671875, 43.890625, 54.39453125, 64.8984375, 75.40234375, 85.90625, 96.41015625, 106.9140625, 117.41796875, 127.921875, 138.42578125, 148.9296875, 159.43359375, 169.9375, 180.44140625, 190.9453125, 201.44921875, 211.953125, 222.45703125, 232.9609375, 243.46484375, 253.96875, 264.47265625, 274.9765625, 285.48046875, 295.984375, 306.48828125, 316.9921875, 327.49609375, 338.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 5.0, 19.0, 20.0, 41.0, 74.0, 132.0, 155.0, 190.0, 136.0, 86.0, 71.0, 31.0, 11.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.75, -84.0625, -81.375, -78.6875, -76.0, -73.3125, -70.625, -67.9375, -65.25, -62.5625, -59.875, -57.1875, -54.5, -51.8125, -49.125, -46.4375, -43.75, -41.0625, -38.375, -35.6875, -33.0, -30.3125, -27.625, -24.9375, -22.25, -19.5625, -16.875, -14.1875, -11.5, -8.8125, -6.125, -3.4375, -0.75, 1.9375, 4.625, 7.3125, 10.0, 12.6875, 15.375, 18.0625, 20.75, 23.4375, 26.125, 28.8125, 31.5, 34.1875, 36.875, 39.5625, 42.25, 44.9375, 47.625, 50.3125, 53.0, 55.6875, 58.375, 61.0625, 63.75, 66.4375, 69.125, 71.8125, 74.5, 77.1875, 79.875, 82.5625, 85.25]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 14.0, 17.0, 15.0, 35.0, 36.0, 44.0, 54.0, 67.0, 82.0, 98.0, 73.0, 76.0, 52.0, 66.0, 49.0, 31.0, 32.0, 25.0, 19.0, 22.0, 14.0, 10.0, 6.0, 6.0, 3.0, 4.0, 5.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.383544921875, -124.29437255859375, -119.20520782470703, -114.11603546142578, -109.02687072753906, -103.93769836425781, -98.84852600097656, -93.75935363769531, -88.6701889038086, -83.58101654052734, -78.49185180664062, -73.40267944335938, -68.31350708007812, -63.224342346191406, -58.135169982910156, -53.04600143432617, -47.95683288574219, -42.8676643371582, -37.77849578857422, -32.68932342529297, -27.600154876708984, -22.510986328125, -17.421815872192383, -12.332645416259766, -7.243476867675781, -2.1543073654174805, 2.9348621368408203, 8.024031639099121, 13.113201141357422, 18.202369689941406, 23.291540145874023, 28.38071060180664, 33.46986389160156, 38.55903244018555, 43.64820098876953, 48.73737335205078, 53.826541900634766, 58.91571044921875, 64.0048828125, 69.09405517578125, 74.18321990966797, 79.27239227294922, 84.36155700683594, 89.45072937011719, 94.53990173339844, 99.62906646728516, 104.7182388305664, 109.80740356445312, 114.89657592773438, 119.98574829101562, 125.07491302490234, 130.16407775878906, 135.2532501220703, 140.34242248535156, 145.4315948486328, 150.52076721191406, 155.60992431640625, 160.6990966796875, 165.78826904296875, 170.87742614746094, 175.9665985107422, 181.05577087402344, 186.1449432373047, 191.23411560058594, 196.3232879638672]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 8.0, 12.0, 11.0, 11.0, 12.0, 18.0, 19.0, 24.0, 27.0, 30.0, 24.0, 29.0, 40.0, 39.0, 40.0, 37.0, 36.0, 35.0, 41.0, 35.0, 41.0, 35.0, 36.0, 34.0, 37.0, 31.0, 28.0, 31.0, 26.0, 24.0, 17.0, 17.0, 17.0, 14.0, 15.0, 12.0, 7.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.5198974609375, -108.95657348632812, -105.39324951171875, -101.82992553710938, -98.2666015625, -94.70327758789062, -91.13995361328125, -87.5766372680664, -84.01331329345703, -80.44998931884766, -76.88666534423828, -73.3233413696289, -69.76001739501953, -66.19670104980469, -62.63337326049805, -59.07005310058594, -55.5067253112793, -51.94340133666992, -48.38007736206055, -44.81675720214844, -41.25343322753906, -37.69010925292969, -34.12678527832031, -30.56346321105957, -27.000139236450195, -23.43681526184082, -19.873493194580078, -16.310169219970703, -12.746846199035645, -9.183523178100586, -5.620199203491211, -2.0568771362304688, 1.5064468383789062, 5.069769859313965, 8.633092880249023, 12.196416854858398, 15.759739875793457, 19.323062896728516, 22.88638687133789, 26.449708938598633, 30.013032913208008, 33.57635498046875, 37.139678955078125, 40.7030029296875, 44.266326904296875, 47.82965087890625, 51.392974853515625, 54.956295013427734, 58.51961898803711, 62.082942962646484, 65.6462631225586, 69.20958709716797, 72.77291107177734, 76.33623504638672, 79.8995590209961, 83.46288299560547, 87.02620697021484, 90.58953094482422, 94.1528549194336, 97.71617889404297, 101.27950286865234, 104.84281921386719, 108.40614318847656, 111.96946716308594, 115.53279113769531]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 8.0, 7.0, 22.0, 39.0, 38.0, 73.0, 121.0, 177.0, 279.0, 456.0, 711.0, 1202.0, 1782.0, 2971.0, 4811.0, 8122.0, 13066.0, 22408.0, 37737.0, 66550.0, 124517.0, 268654.0, 992597.0, 1711674.0, 525545.0, 187313.0, 94518.0, 52291.0, 30158.0, 17909.0, 10854.0, 6661.0, 4051.0, 2664.0, 1605.0, 992.0, 627.0, 373.0, 259.0, 167.0, 96.0, 53.0, 48.0, 22.0, 21.0, 14.0, 9.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.75, -148.16015625, -143.5703125, -138.98046875, -134.390625, -129.80078125, -125.2109375, -120.62109375, -116.03125, -111.44140625, -106.8515625, -102.26171875, -97.671875, -93.08203125, -88.4921875, -83.90234375, -79.3125, -74.72265625, -70.1328125, -65.54296875, -60.953125, -56.36328125, -51.7734375, -47.18359375, -42.59375, -38.00390625, -33.4140625, -28.82421875, -24.234375, -19.64453125, -15.0546875, -10.46484375, -5.875, -1.28515625, 3.3046875, 7.89453125, 12.484375, 17.07421875, 21.6640625, 26.25390625, 30.84375, 35.43359375, 40.0234375, 44.61328125, 49.203125, 53.79296875, 58.3828125, 62.97265625, 67.5625, 72.15234375, 76.7421875, 81.33203125, 85.921875, 90.51171875, 95.1015625, 99.69140625, 104.28125, 108.87109375, 113.4609375, 118.05078125, 122.640625, 127.23046875, 131.8203125, 136.41015625, 141.0]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 0.0, 2.0, 7.0, 4.0, 4.0, 8.0, 9.0, 11.0, 10.0, 9.0, 18.0, 17.0, 25.0, 27.0, 29.0, 36.0, 31.0, 45.0, 38.0, 45.0, 46.0, 44.0, 52.0, 48.0, 40.0, 37.0, 27.0, 49.0, 44.0, 26.0, 33.0, 31.0, 21.0, 27.0, 24.0, 19.0, 17.0, 10.0, 7.0, 11.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.15625, -59.16943359375, -57.1826171875, -55.19580078125, -53.208984375, -51.22216796875, -49.2353515625, -47.24853515625, -45.26171875, -43.27490234375, -41.2880859375, -39.30126953125, -37.314453125, -35.32763671875, -33.3408203125, -31.35400390625, -29.3671875, -27.38037109375, -25.3935546875, -23.40673828125, -21.419921875, -19.43310546875, -17.4462890625, -15.45947265625, -13.47265625, -11.48583984375, -9.4990234375, -7.51220703125, -5.525390625, -3.53857421875, -1.5517578125, 0.43505859375, 2.421875, 4.40869140625, 6.3955078125, 8.38232421875, 10.369140625, 12.35595703125, 14.3427734375, 16.32958984375, 18.31640625, 20.30322265625, 22.2900390625, 24.27685546875, 26.263671875, 28.25048828125, 30.2373046875, 32.22412109375, 34.2109375, 36.19775390625, 38.1845703125, 40.17138671875, 42.158203125, 44.14501953125, 46.1318359375, 48.11865234375, 50.10546875, 52.09228515625, 54.0791015625, 56.06591796875, 58.052734375, 60.03955078125, 62.0263671875, 64.01318359375, 66.0]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 8.0, 8.0, 12.0, 13.0, 20.0, 38.0, 47.0, 49.0, 103.0, 119.0, 205.0, 284.0, 429.0, 655.0, 986.0, 1497.0, 2265.0, 3517.0, 5695.0, 9188.0, 15269.0, 26827.0, 47743.0, 90588.0, 183202.0, 417671.0, 1168668.0, 1330605.0, 464260.0, 202430.0, 99315.0, 51573.0, 28557.0, 16290.0, 9916.0, 5879.0, 3739.0, 2230.0, 1519.0, 946.0, 630.0, 389.0, 281.0, 202.0, 108.0, 98.0, 80.0, 51.0, 23.0, 16.0, 14.0, 13.0, 10.0, 7.0, 0.0, 2.0, 0.0, 4.0], "bins": [-118.9375, -115.33984375, -111.7421875, -108.14453125, -104.546875, -100.94921875, -97.3515625, -93.75390625, -90.15625, -86.55859375, -82.9609375, -79.36328125, -75.765625, -72.16796875, -68.5703125, -64.97265625, -61.375, -57.77734375, -54.1796875, -50.58203125, -46.984375, -43.38671875, -39.7890625, -36.19140625, -32.59375, -28.99609375, -25.3984375, -21.80078125, -18.203125, -14.60546875, -11.0078125, -7.41015625, -3.8125, -0.21484375, 3.3828125, 6.98046875, 10.578125, 14.17578125, 17.7734375, 21.37109375, 24.96875, 28.56640625, 32.1640625, 35.76171875, 39.359375, 42.95703125, 46.5546875, 50.15234375, 53.75, 57.34765625, 60.9453125, 64.54296875, 68.140625, 71.73828125, 75.3359375, 78.93359375, 82.53125, 86.12890625, 89.7265625, 93.32421875, 96.921875, 100.51953125, 104.1171875, 107.71484375, 111.3125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 1.0, 5.0, 6.0, 9.0, 13.0, 12.0, 22.0, 34.0, 30.0, 46.0, 50.0, 68.0, 79.0, 107.0, 120.0, 152.0, 162.0, 196.0, 231.0, 287.0, 397.0, 414.0, 331.0, 273.0, 205.0, 162.0, 148.0, 107.0, 84.0, 65.0, 52.0, 34.0, 41.0, 25.0, 20.0, 19.0, 10.0, 13.0, 8.0, 15.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.265625, -29.109130859375, -27.95263671875, -26.796142578125, -25.6396484375, -24.483154296875, -23.32666015625, -22.170166015625, -21.013671875, -19.857177734375, -18.70068359375, -17.544189453125, -16.3876953125, -15.231201171875, -14.07470703125, -12.918212890625, -11.76171875, -10.605224609375, -9.44873046875, -8.292236328125, -7.1357421875, -5.979248046875, -4.82275390625, -3.666259765625, -2.509765625, -1.353271484375, -0.19677734375, 0.959716796875, 2.1162109375, 3.272705078125, 4.42919921875, 5.585693359375, 6.7421875, 7.898681640625, 9.05517578125, 10.211669921875, 11.3681640625, 12.524658203125, 13.68115234375, 14.837646484375, 15.994140625, 17.150634765625, 18.30712890625, 19.463623046875, 20.6201171875, 21.776611328125, 22.93310546875, 24.089599609375, 25.24609375, 26.402587890625, 27.55908203125, 28.715576171875, 29.8720703125, 31.028564453125, 32.18505859375, 33.341552734375, 34.498046875, 35.654541015625, 36.81103515625, 37.967529296875, 39.1240234375, 40.280517578125, 41.43701171875, 42.593505859375, 43.75]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 11.0, 8.0, 6.0, 5.0, 8.0, 19.0, 19.0, 34.0, 39.0, 48.0, 63.0, 91.0, 106.0, 94.0, 94.0, 76.0, 71.0, 43.0, 48.0, 20.0, 22.0, 18.0, 13.0, 10.0, 11.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.8041000366211, -122.79422760009766, -118.78435516357422, -114.77447509765625, -110.76460266113281, -106.75473022460938, -102.74485778808594, -98.7349853515625, -94.72511291503906, -90.71524047851562, -86.70536804199219, -82.69549560546875, -78.68561553955078, -74.67574310302734, -70.6658706665039, -66.65599822998047, -62.6461181640625, -58.63624572753906, -54.62636947631836, -50.61649703979492, -46.60662078857422, -42.59674835205078, -38.586875915527344, -34.577003479003906, -30.567127227783203, -26.557252883911133, -22.547378540039062, -18.537506103515625, -14.527631759643555, -10.517757415771484, -6.507884979248047, -2.4980106353759766, 1.5118560791015625, 5.521729946136475, 9.531603813171387, 13.54147720336914, 17.55135154724121, 21.56122589111328, 25.57109832763672, 29.58097267150879, 33.59084701538086, 37.6007194519043, 41.610595703125, 45.62046813964844, 49.630340576171875, 53.64021682739258, 57.650089263916016, 61.65996551513672, 65.66983795166016, 69.6797103881836, 73.68958282470703, 77.699462890625, 81.70933532714844, 85.71920776367188, 89.72908020019531, 93.73895263671875, 97.74882507324219, 101.75869750976562, 105.76856994628906, 109.7784423828125, 113.78832244873047, 117.7981948852539, 121.80806732177734, 125.81793975830078, 129.82781982421875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 6.0, 9.0, 6.0, 10.0, 7.0, 14.0, 18.0, 9.0, 13.0, 12.0, 24.0, 18.0, 26.0, 27.0, 30.0, 31.0, 38.0, 33.0, 29.0, 52.0, 38.0, 32.0, 39.0, 33.0, 35.0, 38.0, 32.0, 38.0, 28.0, 27.0, 26.0, 32.0, 25.0, 25.0, 16.0, 11.0, 20.0, 15.0, 21.0, 11.0, 6.0, 11.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.47868347167969, -62.263492584228516, -60.048301696777344, -57.83311080932617, -55.617919921875, -53.40272903442383, -51.187538146972656, -48.972347259521484, -46.75715637207031, -44.54196548461914, -42.32677459716797, -40.1115837097168, -37.896392822265625, -35.68120193481445, -33.46601104736328, -31.25082015991211, -29.035629272460938, -26.820438385009766, -24.605247497558594, -22.390056610107422, -20.17486572265625, -17.959674835205078, -15.744483947753906, -13.529293060302734, -11.314102172851562, -9.09891128540039, -6.883720397949219, -4.668529510498047, -2.453338623046875, -0.23814773559570312, 1.9770431518554688, 4.192234039306641, 6.407417297363281, 8.622608184814453, 10.837799072265625, 13.052989959716797, 15.268180847167969, 17.48337173461914, 19.698562622070312, 21.913753509521484, 24.128944396972656, 26.344135284423828, 28.559326171875, 30.774517059326172, 32.989707946777344, 35.204898834228516, 37.42008972167969, 39.63528060913086, 41.85047149658203, 44.0656623840332, 46.280853271484375, 48.49604415893555, 50.71123504638672, 52.92642593383789, 55.14161682128906, 57.356807708740234, 59.571998596191406, 61.78718948364258, 64.00238037109375, 66.21757507324219, 68.4327621459961, 70.64794921875, 72.86314392089844, 75.07833862304688, 77.29352569580078]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 13.0, 8.0, 19.0, 27.0, 48.0, 46.0, 65.0, 105.0, 169.0, 237.0, 312.0, 489.0, 766.0, 1211.0, 1975.0, 3302.0, 5761.0, 10481.0, 19776.0, 38904.0, 78300.0, 174271.0, 358461.0, 185096.0, 82127.0, 40038.0, 20472.0, 10982.0, 5888.0, 3460.0, 2029.0, 1285.0, 799.0, 543.0, 334.0, 230.0, 166.0, 100.0, 81.0, 45.0, 43.0, 32.0, 18.0, 11.0, 7.0, 4.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-91.875, -89.05078125, -86.2265625, -83.40234375, -80.578125, -77.75390625, -74.9296875, -72.10546875, -69.28125, -66.45703125, -63.6328125, -60.80859375, -57.984375, -55.16015625, -52.3359375, -49.51171875, -46.6875, -43.86328125, -41.0390625, -38.21484375, -35.390625, -32.56640625, -29.7421875, -26.91796875, -24.09375, -21.26953125, -18.4453125, -15.62109375, -12.796875, -9.97265625, -7.1484375, -4.32421875, -1.5, 1.32421875, 4.1484375, 6.97265625, 9.796875, 12.62109375, 15.4453125, 18.26953125, 21.09375, 23.91796875, 26.7421875, 29.56640625, 32.390625, 35.21484375, 38.0390625, 40.86328125, 43.6875, 46.51171875, 49.3359375, 52.16015625, 54.984375, 57.80859375, 60.6328125, 63.45703125, 66.28125, 69.10546875, 71.9296875, 74.75390625, 77.578125, 80.40234375, 83.2265625, 86.05078125, 88.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 3.0, 10.0, 8.0, 11.0, 15.0, 11.0, 11.0, 10.0, 21.0, 25.0, 24.0, 22.0, 31.0, 25.0, 29.0, 42.0, 32.0, 45.0, 41.0, 30.0, 40.0, 43.0, 40.0, 34.0, 40.0, 34.0, 37.0, 30.0, 27.0, 30.0, 26.0, 20.0, 24.0, 15.0, 23.0, 14.0, 11.0, 18.0, 10.0, 14.0, 3.0, 1.0, 2.0, 7.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.8125, -67.4892578125, -65.166015625, -62.8427734375, -60.51953125, -58.1962890625, -55.873046875, -53.5498046875, -51.2265625, -48.9033203125, -46.580078125, -44.2568359375, -41.93359375, -39.6103515625, -37.287109375, -34.9638671875, -32.640625, -30.3173828125, -27.994140625, -25.6708984375, -23.34765625, -21.0244140625, -18.701171875, -16.3779296875, -14.0546875, -11.7314453125, -9.408203125, -7.0849609375, -4.76171875, -2.4384765625, -0.115234375, 2.2080078125, 4.53125, 6.8544921875, 9.177734375, 11.5009765625, 13.82421875, 16.1474609375, 18.470703125, 20.7939453125, 23.1171875, 25.4404296875, 27.763671875, 30.0869140625, 32.41015625, 34.7333984375, 37.056640625, 39.3798828125, 41.703125, 44.0263671875, 46.349609375, 48.6728515625, 50.99609375, 53.3193359375, 55.642578125, 57.9658203125, 60.2890625, 62.6123046875, 64.935546875, 67.2587890625, 69.58203125, 71.9052734375, 74.228515625, 76.5517578125, 78.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 16.0, 22.0, 33.0, 48.0, 72.0, 102.0, 131.0, 212.0, 302.0, 440.0, 698.0, 1153.0, 1783.0, 3119.0, 5369.0, 9141.0, 16962.0, 33294.0, 80744.0, 293931.0, 413697.0, 102399.0, 39929.0, 19483.0, 10490.0, 5886.0, 3456.0, 2054.0, 1232.0, 760.0, 502.0, 352.0, 214.0, 148.0, 106.0, 73.0, 52.0, 38.0, 33.0, 21.0, 19.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.875, -79.474609375, -77.07421875, -74.673828125, -72.2734375, -69.873046875, -67.47265625, -65.072265625, -62.671875, -60.271484375, -57.87109375, -55.470703125, -53.0703125, -50.669921875, -48.26953125, -45.869140625, -43.46875, -41.068359375, -38.66796875, -36.267578125, -33.8671875, -31.466796875, -29.06640625, -26.666015625, -24.265625, -21.865234375, -19.46484375, -17.064453125, -14.6640625, -12.263671875, -9.86328125, -7.462890625, -5.0625, -2.662109375, -0.26171875, 2.138671875, 4.5390625, 6.939453125, 9.33984375, 11.740234375, 14.140625, 16.541015625, 18.94140625, 21.341796875, 23.7421875, 26.142578125, 28.54296875, 30.943359375, 33.34375, 35.744140625, 38.14453125, 40.544921875, 42.9453125, 45.345703125, 47.74609375, 50.146484375, 52.546875, 54.947265625, 57.34765625, 59.748046875, 62.1484375, 64.548828125, 66.94921875, 69.349609375, 71.75]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 15.0, 11.0, 8.0, 6.0, 13.0, 24.0, 16.0, 15.0, 26.0, 29.0, 17.0, 35.0, 30.0, 27.0, 36.0, 31.0, 34.0, 37.0, 26.0, 21.0, 35.0, 48.0, 36.0, 37.0, 28.0, 16.0, 38.0, 37.0, 28.0, 34.0, 26.0, 25.0, 23.0, 17.0, 18.0, 12.0, 18.0, 8.0, 12.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0], "bins": [-79.5625, -77.2939453125, -75.025390625, -72.7568359375, -70.48828125, -68.2197265625, -65.951171875, -63.6826171875, -61.4140625, -59.1455078125, -56.876953125, -54.6083984375, -52.33984375, -50.0712890625, -47.802734375, -45.5341796875, -43.265625, -40.9970703125, -38.728515625, -36.4599609375, -34.19140625, -31.9228515625, -29.654296875, -27.3857421875, -25.1171875, -22.8486328125, -20.580078125, -18.3115234375, -16.04296875, -13.7744140625, -11.505859375, -9.2373046875, -6.96875, -4.7001953125, -2.431640625, -0.1630859375, 2.10546875, 4.3740234375, 6.642578125, 8.9111328125, 11.1796875, 13.4482421875, 15.716796875, 17.9853515625, 20.25390625, 22.5224609375, 24.791015625, 27.0595703125, 29.328125, 31.5966796875, 33.865234375, 36.1337890625, 38.40234375, 40.6708984375, 42.939453125, 45.2080078125, 47.4765625, 49.7451171875, 52.013671875, 54.2822265625, 56.55078125, 58.8193359375, 61.087890625, 63.3564453125, 65.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 7.0, 3.0, 13.0, 8.0, 16.0, 11.0, 27.0, 28.0, 36.0, 40.0, 45.0, 75.0, 96.0, 124.0, 158.0, 184.0, 258.0, 348.0, 402.0, 622.0, 876.0, 1246.0, 2033.0, 3495.0, 6394.0, 14896.0, 52594.0, 610118.0, 288587.0, 38759.0, 12327.0, 5516.0, 3057.0, 1842.0, 1174.0, 783.0, 563.0, 412.0, 318.0, 210.0, 199.0, 147.0, 108.0, 91.0, 84.0, 58.0, 40.0, 41.0, 23.0, 17.0, 16.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-148.75, -143.935546875, -139.12109375, -134.306640625, -129.4921875, -124.677734375, -119.86328125, -115.048828125, -110.234375, -105.419921875, -100.60546875, -95.791015625, -90.9765625, -86.162109375, -81.34765625, -76.533203125, -71.71875, -66.904296875, -62.08984375, -57.275390625, -52.4609375, -47.646484375, -42.83203125, -38.017578125, -33.203125, -28.388671875, -23.57421875, -18.759765625, -13.9453125, -9.130859375, -4.31640625, 0.498046875, 5.3125, 10.126953125, 14.94140625, 19.755859375, 24.5703125, 29.384765625, 34.19921875, 39.013671875, 43.828125, 48.642578125, 53.45703125, 58.271484375, 63.0859375, 67.900390625, 72.71484375, 77.529296875, 82.34375, 87.158203125, 91.97265625, 96.787109375, 101.6015625, 106.416015625, 111.23046875, 116.044921875, 120.859375, 125.673828125, 130.48828125, 135.302734375, 140.1171875, 144.931640625, 149.74609375, 154.560546875, 159.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 17.0, 16.0, 15.0, 32.0, 47.0, 43.0, 79.0, 79.0, 81.0, 113.0, 90.0, 79.0, 60.0, 51.0, 33.0, 35.0, 29.0, 11.0, 21.0, 16.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00653076171875, -0.00633549690246582, -0.006140232086181641, -0.005944967269897461, -0.005749702453613281, -0.0055544376373291016, -0.005359172821044922, -0.005163908004760742, -0.0049686431884765625, -0.004773378372192383, -0.004578113555908203, -0.0043828487396240234, -0.004187583923339844, -0.003992319107055664, -0.0037970542907714844, -0.0036017894744873047, -0.003406524658203125, -0.0032112598419189453, -0.0030159950256347656, -0.002820730209350586, -0.0026254653930664062, -0.0024302005767822266, -0.002234935760498047, -0.002039670944213867, -0.0018444061279296875, -0.0016491413116455078, -0.0014538764953613281, -0.0012586116790771484, -0.0010633468627929688, -0.0008680820465087891, -0.0006728172302246094, -0.0004775524139404297, -0.00028228759765625, -8.702278137207031e-05, 0.00010824203491210938, 0.00030350685119628906, 0.0004987716674804688, 0.0006940364837646484, 0.0008893013000488281, 0.0010845661163330078, 0.0012798309326171875, 0.0014750957489013672, 0.0016703605651855469, 0.0018656253814697266, 0.0020608901977539062, 0.002256155014038086, 0.0024514198303222656, 0.0026466846466064453, 0.002841949462890625, 0.0030372142791748047, 0.0032324790954589844, 0.003427743911743164, 0.0036230087280273438, 0.0038182735443115234, 0.004013538360595703, 0.004208803176879883, 0.0044040679931640625, 0.004599332809448242, 0.004794597625732422, 0.0049898624420166016, 0.005185127258300781, 0.005380392074584961, 0.005575656890869141, 0.00577092170715332, 0.0059661865234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 11.0, 7.0, 14.0, 11.0, 14.0, 25.0, 17.0, 37.0, 47.0, 66.0, 78.0, 126.0, 149.0, 196.0, 282.0, 337.0, 509.0, 682.0, 994.0, 1467.0, 2320.0, 4028.0, 8329.0, 22911.0, 84223.0, 496956.0, 325281.0, 63536.0, 18316.0, 7263.0, 3426.0, 2089.0, 1362.0, 918.0, 701.0, 472.0, 369.0, 256.0, 191.0, 146.0, 101.0, 79.0, 48.0, 44.0, 24.0, 25.0, 21.0, 21.0, 9.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-147.625, -142.84765625, -138.0703125, -133.29296875, -128.515625, -123.73828125, -118.9609375, -114.18359375, -109.40625, -104.62890625, -99.8515625, -95.07421875, -90.296875, -85.51953125, -80.7421875, -75.96484375, -71.1875, -66.41015625, -61.6328125, -56.85546875, -52.078125, -47.30078125, -42.5234375, -37.74609375, -32.96875, -28.19140625, -23.4140625, -18.63671875, -13.859375, -9.08203125, -4.3046875, 0.47265625, 5.25, 10.02734375, 14.8046875, 19.58203125, 24.359375, 29.13671875, 33.9140625, 38.69140625, 43.46875, 48.24609375, 53.0234375, 57.80078125, 62.578125, 67.35546875, 72.1328125, 76.91015625, 81.6875, 86.46484375, 91.2421875, 96.01953125, 100.796875, 105.57421875, 110.3515625, 115.12890625, 119.90625, 124.68359375, 129.4609375, 134.23828125, 139.015625, 143.79296875, 148.5703125, 153.34765625, 158.125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 8.0, 9.0, 31.0, 48.0, 80.0, 121.0, 142.0, 155.0, 134.0, 87.0, 80.0, 39.0, 19.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.9375, -40.556640625, -39.17578125, -37.794921875, -36.4140625, -35.033203125, -33.65234375, -32.271484375, -30.890625, -29.509765625, -28.12890625, -26.748046875, -25.3671875, -23.986328125, -22.60546875, -21.224609375, -19.84375, -18.462890625, -17.08203125, -15.701171875, -14.3203125, -12.939453125, -11.55859375, -10.177734375, -8.796875, -7.416015625, -6.03515625, -4.654296875, -3.2734375, -1.892578125, -0.51171875, 0.869140625, 2.25, 3.630859375, 5.01171875, 6.392578125, 7.7734375, 9.154296875, 10.53515625, 11.916015625, 13.296875, 14.677734375, 16.05859375, 17.439453125, 18.8203125, 20.201171875, 21.58203125, 22.962890625, 24.34375, 25.724609375, 27.10546875, 28.486328125, 29.8671875, 31.248046875, 32.62890625, 34.009765625, 35.390625, 36.771484375, 38.15234375, 39.533203125, 40.9140625, 42.294921875, 43.67578125, 45.056640625, 46.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 12.0, 11.0, 10.0, 21.0, 20.0, 26.0, 49.0, 56.0, 57.0, 93.0, 117.0, 116.0, 75.0, 78.0, 52.0, 42.0, 36.0, 31.0, 12.0, 14.0, 19.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.67796325683594, -123.4287338256836, -119.17950439453125, -114.93026733398438, -110.68103790283203, -106.43180847167969, -102.18257141113281, -97.93334197998047, -93.68411254882812, -89.43488311767578, -85.18565368652344, -80.93641662597656, -76.68718719482422, -72.43795776367188, -68.188720703125, -63.939491271972656, -59.69026184082031, -55.44103240966797, -51.19179916381836, -46.94256591796875, -42.693336486816406, -38.44410705566406, -34.19487380981445, -29.945642471313477, -25.6964111328125, -21.447179794311523, -17.197948455810547, -12.94871711730957, -8.699485778808594, -4.450254440307617, -0.20102310180664062, 4.048208236694336, 8.29742431640625, 12.546655654907227, 16.795886993408203, 21.04511833190918, 25.294349670410156, 29.543581008911133, 33.79281234741211, 38.04204559326172, 42.29127502441406, 46.540504455566406, 50.789737701416016, 55.038970947265625, 59.28820037841797, 63.53742980957031, 67.78666687011719, 72.03589630126953, 76.28512573242188, 80.53435516357422, 84.78358459472656, 89.03282165527344, 93.28205108642578, 97.53128051757812, 101.780517578125, 106.02974700927734, 110.27897644042969, 114.52820587158203, 118.77743530273438, 123.02667236328125, 127.2759017944336, 131.52513122558594, 135.7743682861328, 140.02359008789062, 144.2728271484375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 11.0, 5.0, 18.0, 9.0, 18.0, 17.0, 11.0, 21.0, 21.0, 36.0, 22.0, 25.0, 36.0, 19.0, 48.0, 30.0, 44.0, 45.0, 49.0, 33.0, 46.0, 25.0, 33.0, 38.0, 36.0, 29.0, 25.0, 30.0, 26.0, 19.0, 14.0, 22.0, 16.0, 17.0, 16.0, 14.0, 14.0, 6.0, 10.0, 3.0, 6.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.49182891845703, -69.17189025878906, -66.8519515991211, -64.53201293945312, -62.212074279785156, -59.89213562011719, -57.57219696044922, -55.25225830078125, -52.93231964111328, -50.61238098144531, -48.292442321777344, -45.972503662109375, -43.652565002441406, -41.33262634277344, -39.01268768310547, -36.6927490234375, -34.3728141784668, -32.05287551879883, -29.73293685913086, -27.41299819946289, -25.093059539794922, -22.773120880126953, -20.453184127807617, -18.13324546813965, -15.81330680847168, -13.493368148803711, -11.173429489135742, -8.85349178314209, -6.533553123474121, -4.213614463806152, -1.8936767578125, 0.42626190185546875, 2.7462005615234375, 5.066139221191406, 7.386077404022217, 9.706015586853027, 12.025954246520996, 14.345892906188965, 16.665830612182617, 18.985769271850586, 21.305707931518555, 23.625646591186523, 25.945585250854492, 28.265522003173828, 30.585460662841797, 32.905399322509766, 35.225337982177734, 37.5452766418457, 39.86521530151367, 42.18515396118164, 44.50509262084961, 46.82503128051758, 49.14496994018555, 51.464908599853516, 53.78484344482422, 56.10478210449219, 58.424720764160156, 60.744659423828125, 63.064598083496094, 65.38453674316406, 67.70447540283203, 70.0244140625, 72.34435272216797, 74.66429138183594, 76.9842300415039]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 21.0, 28.0, 34.0, 60.0, 60.0, 102.0, 164.0, 229.0, 369.0, 543.0, 787.0, 1122.0, 1882.0, 2696.0, 4008.0, 6020.0, 9239.0, 13867.0, 21551.0, 33797.0, 54421.0, 90532.0, 148929.0, 212498.0, 169801.0, 104281.0, 62601.0, 38366.0, 24355.0, 15604.0, 10158.0, 6766.0, 4431.0, 3034.0, 2014.0, 1379.0, 962.0, 605.0, 427.0, 254.0, 190.0, 123.0, 65.0, 50.0, 58.0, 18.0, 18.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-127.875, -123.95703125, -120.0390625, -116.12109375, -112.203125, -108.28515625, -104.3671875, -100.44921875, -96.53125, -92.61328125, -88.6953125, -84.77734375, -80.859375, -76.94140625, -73.0234375, -69.10546875, -65.1875, -61.26953125, -57.3515625, -53.43359375, -49.515625, -45.59765625, -41.6796875, -37.76171875, -33.84375, -29.92578125, -26.0078125, -22.08984375, -18.171875, -14.25390625, -10.3359375, -6.41796875, -2.5, 1.41796875, 5.3359375, 9.25390625, 13.171875, 17.08984375, 21.0078125, 24.92578125, 28.84375, 32.76171875, 36.6796875, 40.59765625, 44.515625, 48.43359375, 52.3515625, 56.26953125, 60.1875, 64.10546875, 68.0234375, 71.94140625, 75.859375, 79.77734375, 83.6953125, 87.61328125, 91.53125, 95.44921875, 99.3671875, 103.28515625, 107.203125, 111.12109375, 115.0390625, 118.95703125, 122.875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 3.0, 2.0, 7.0, 10.0, 10.0, 14.0, 12.0, 18.0, 15.0, 12.0, 23.0, 24.0, 31.0, 41.0, 39.0, 29.0, 32.0, 31.0, 50.0, 40.0, 49.0, 45.0, 50.0, 45.0, 50.0, 37.0, 29.0, 30.0, 21.0, 37.0, 28.0, 20.0, 25.0, 22.0, 24.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.96875, -62.02099609375, -60.0732421875, -58.12548828125, -56.177734375, -54.22998046875, -52.2822265625, -50.33447265625, -48.38671875, -46.43896484375, -44.4912109375, -42.54345703125, -40.595703125, -38.64794921875, -36.7001953125, -34.75244140625, -32.8046875, -30.85693359375, -28.9091796875, -26.96142578125, -25.013671875, -23.06591796875, -21.1181640625, -19.17041015625, -17.22265625, -15.27490234375, -13.3271484375, -11.37939453125, -9.431640625, -7.48388671875, -5.5361328125, -3.58837890625, -1.640625, 0.30712890625, 2.2548828125, 4.20263671875, 6.150390625, 8.09814453125, 10.0458984375, 11.99365234375, 13.94140625, 15.88916015625, 17.8369140625, 19.78466796875, 21.732421875, 23.68017578125, 25.6279296875, 27.57568359375, 29.5234375, 31.47119140625, 33.4189453125, 35.36669921875, 37.314453125, 39.26220703125, 41.2099609375, 43.15771484375, 45.10546875, 47.05322265625, 49.0009765625, 50.94873046875, 52.896484375, 54.84423828125, 56.7919921875, 58.73974609375, 60.6875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 16.0, 22.0, 30.0, 42.0, 54.0, 101.0, 185.0, 214.0, 334.0, 491.0, 694.0, 984.0, 1577.0, 2264.0, 3378.0, 5036.0, 7661.0, 11998.0, 18933.0, 30546.0, 49225.0, 83496.0, 144415.0, 218814.0, 186025.0, 110391.0, 64485.0, 39062.0, 24167.0, 15257.0, 9686.0, 6403.0, 4126.0, 2727.0, 1854.0, 1245.0, 832.0, 538.0, 385.0, 282.0, 185.0, 119.0, 85.0, 63.0, 39.0, 28.0, 27.0, 12.0, 8.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-99.0, -95.78125, -92.5625, -89.34375, -86.125, -82.90625, -79.6875, -76.46875, -73.25, -70.03125, -66.8125, -63.59375, -60.375, -57.15625, -53.9375, -50.71875, -47.5, -44.28125, -41.0625, -37.84375, -34.625, -31.40625, -28.1875, -24.96875, -21.75, -18.53125, -15.3125, -12.09375, -8.875, -5.65625, -2.4375, 0.78125, 4.0, 7.21875, 10.4375, 13.65625, 16.875, 20.09375, 23.3125, 26.53125, 29.75, 32.96875, 36.1875, 39.40625, 42.625, 45.84375, 49.0625, 52.28125, 55.5, 58.71875, 61.9375, 65.15625, 68.375, 71.59375, 74.8125, 78.03125, 81.25, 84.46875, 87.6875, 90.90625, 94.125, 97.34375, 100.5625, 103.78125, 107.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 4.0, 5.0, 4.0, 13.0, 13.0, 12.0, 9.0, 15.0, 13.0, 23.0, 24.0, 20.0, 21.0, 28.0, 36.0, 32.0, 31.0, 31.0, 45.0, 55.0, 51.0, 32.0, 47.0, 42.0, 34.0, 29.0, 36.0, 38.0, 27.0, 25.0, 21.0, 25.0, 30.0, 22.0, 20.0, 14.0, 11.0, 11.0, 8.0, 11.0, 7.0, 8.0, 8.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -34.1318359375, -32.888671875, -31.6455078125, -30.40234375, -29.1591796875, -27.916015625, -26.6728515625, -25.4296875, -24.1865234375, -22.943359375, -21.7001953125, -20.45703125, -19.2138671875, -17.970703125, -16.7275390625, -15.484375, -14.2412109375, -12.998046875, -11.7548828125, -10.51171875, -9.2685546875, -8.025390625, -6.7822265625, -5.5390625, -4.2958984375, -3.052734375, -1.8095703125, -0.56640625, 0.6767578125, 1.919921875, 3.1630859375, 4.40625, 5.6494140625, 6.892578125, 8.1357421875, 9.37890625, 10.6220703125, 11.865234375, 13.1083984375, 14.3515625, 15.5947265625, 16.837890625, 18.0810546875, 19.32421875, 20.5673828125, 21.810546875, 23.0537109375, 24.296875, 25.5400390625, 26.783203125, 28.0263671875, 29.26953125, 30.5126953125, 31.755859375, 32.9990234375, 34.2421875, 35.4853515625, 36.728515625, 37.9716796875, 39.21484375, 40.4580078125, 41.701171875, 42.9443359375, 44.1875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 8.0, 8.0, 12.0, 10.0, 8.0, 19.0, 21.0, 16.0, 40.0, 49.0, 65.0, 88.0, 132.0, 180.0, 253.0, 302.0, 395.0, 590.0, 931.0, 1418.0, 2213.0, 4159.0, 8740.0, 22507.0, 73684.0, 570883.0, 279461.0, 49679.0, 16524.0, 6905.0, 3355.0, 1845.0, 1236.0, 762.0, 566.0, 439.0, 279.0, 181.0, 151.0, 136.0, 72.0, 58.0, 40.0, 27.0, 30.0, 14.0, 19.0, 12.0, 11.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-291.0, -281.86328125, -272.7265625, -263.58984375, -254.453125, -245.31640625, -236.1796875, -227.04296875, -217.90625, -208.76953125, -199.6328125, -190.49609375, -181.359375, -172.22265625, -163.0859375, -153.94921875, -144.8125, -135.67578125, -126.5390625, -117.40234375, -108.265625, -99.12890625, -89.9921875, -80.85546875, -71.71875, -62.58203125, -53.4453125, -44.30859375, -35.171875, -26.03515625, -16.8984375, -7.76171875, 1.375, 10.51171875, 19.6484375, 28.78515625, 37.921875, 47.05859375, 56.1953125, 65.33203125, 74.46875, 83.60546875, 92.7421875, 101.87890625, 111.015625, 120.15234375, 129.2890625, 138.42578125, 147.5625, 156.69921875, 165.8359375, 174.97265625, 184.109375, 193.24609375, 202.3828125, 211.51953125, 220.65625, 229.79296875, 238.9296875, 248.06640625, 257.203125, 266.33984375, 275.4765625, 284.61328125, 293.75]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 21.0, 30.0, 58.0, 94.0, 138.0, 137.0, 176.0, 123.0, 68.0, 44.0, 22.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01025390625, -0.009781837463378906, -0.009309768676757812, -0.008837699890136719, -0.008365631103515625, -0.007893562316894531, -0.0074214935302734375, -0.006949424743652344, -0.00647735595703125, -0.006005287170410156, -0.0055332183837890625, -0.005061149597167969, -0.004589080810546875, -0.004117012023925781, -0.0036449432373046875, -0.0031728744506835938, -0.0027008056640625, -0.0022287368774414062, -0.0017566680908203125, -0.0012845993041992188, -0.000812530517578125, -0.00034046173095703125, 0.0001316070556640625, 0.0006036758422851562, 0.00107574462890625, 0.0015478134155273438, 0.0020198822021484375, 0.0024919509887695312, 0.002964019775390625, 0.0034360885620117188, 0.0039081573486328125, 0.004380226135253906, 0.004852294921875, 0.005324363708496094, 0.0057964324951171875, 0.006268501281738281, 0.006740570068359375, 0.007212638854980469, 0.0076847076416015625, 0.008156776428222656, 0.00862884521484375, 0.009100914001464844, 0.009572982788085938, 0.010045051574707031, 0.010517120361328125, 0.010989189147949219, 0.011461257934570312, 0.011933326721191406, 0.0124053955078125, 0.012877464294433594, 0.013349533081054688, 0.013821601867675781, 0.014293670654296875, 0.014765739440917969, 0.015237808227539062, 0.015709877014160156, 0.01618194580078125, 0.016654014587402344, 0.017126083374023438, 0.01759815216064453, 0.018070220947265625, 0.01854228973388672, 0.019014358520507812, 0.019486427307128906, 0.01995849609375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 14.0, 10.0, 20.0, 30.0, 41.0, 55.0, 79.0, 102.0, 131.0, 214.0, 257.0, 375.0, 557.0, 813.0, 1350.0, 2146.0, 4281.0, 11013.0, 58551.0, 787293.0, 149880.0, 18026.0, 5827.0, 2737.0, 1645.0, 957.0, 656.0, 435.0, 300.0, 218.0, 145.0, 97.0, 77.0, 48.0, 43.0, 28.0, 23.0, 16.0, 11.0, 7.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-326.0, -313.78125, -301.5625, -289.34375, -277.125, -264.90625, -252.6875, -240.46875, -228.25, -216.03125, -203.8125, -191.59375, -179.375, -167.15625, -154.9375, -142.71875, -130.5, -118.28125, -106.0625, -93.84375, -81.625, -69.40625, -57.1875, -44.96875, -32.75, -20.53125, -8.3125, 3.90625, 16.125, 28.34375, 40.5625, 52.78125, 65.0, 77.21875, 89.4375, 101.65625, 113.875, 126.09375, 138.3125, 150.53125, 162.75, 174.96875, 187.1875, 199.40625, 211.625, 223.84375, 236.0625, 248.28125, 260.5, 272.71875, 284.9375, 297.15625, 309.375, 321.59375, 333.8125, 346.03125, 358.25, 370.46875, 382.6875, 394.90625, 407.125, 419.34375, 431.5625, 443.78125, 456.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 16.0, 25.0, 36.0, 74.0, 114.0, 159.0, 180.0, 154.0, 107.0, 47.0, 33.0, 19.0, 6.0, 2.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.375, -91.8564453125, -89.337890625, -86.8193359375, -84.30078125, -81.7822265625, -79.263671875, -76.7451171875, -74.2265625, -71.7080078125, -69.189453125, -66.6708984375, -64.15234375, -61.6337890625, -59.115234375, -56.5966796875, -54.078125, -51.5595703125, -49.041015625, -46.5224609375, -44.00390625, -41.4853515625, -38.966796875, -36.4482421875, -33.9296875, -31.4111328125, -28.892578125, -26.3740234375, -23.85546875, -21.3369140625, -18.818359375, -16.2998046875, -13.78125, -11.2626953125, -8.744140625, -6.2255859375, -3.70703125, -1.1884765625, 1.330078125, 3.8486328125, 6.3671875, 8.8857421875, 11.404296875, 13.9228515625, 16.44140625, 18.9599609375, 21.478515625, 23.9970703125, 26.515625, 29.0341796875, 31.552734375, 34.0712890625, 36.58984375, 39.1083984375, 41.626953125, 44.1455078125, 46.6640625, 49.1826171875, 51.701171875, 54.2197265625, 56.73828125, 59.2568359375, 61.775390625, 64.2939453125, 66.8125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 8.0, 15.0, 17.0, 30.0, 35.0, 47.0, 76.0, 107.0, 119.0, 107.0, 74.0, 86.0, 49.0, 41.0, 25.0, 31.0, 23.0, 12.0, 18.0, 5.0, 7.0, 7.0, 10.0, 3.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.25507354736328, -78.41082763671875, -74.56658172607422, -70.72233581542969, -66.87809753417969, -63.033851623535156, -59.189605712890625, -55.345359802246094, -51.50111770629883, -47.6568717956543, -43.81262969970703, -39.9683837890625, -36.12413787841797, -32.2798957824707, -28.435649871826172, -24.591405868530273, -20.747161865234375, -16.902917861938477, -13.058672904968262, -9.214427947998047, -5.370183944702148, -1.52593994140625, 2.3183059692382812, 6.16254997253418, 10.006793975830078, 13.851037979125977, 17.695281982421875, 21.539527893066406, 25.383771896362305, 29.228015899658203, 33.072261810302734, 36.91650390625, 40.76075744628906, 44.605003356933594, 48.44924545288086, 52.29349136352539, 56.137733459472656, 59.98197937011719, 63.82622528076172, 67.67047119140625, 71.51470947265625, 75.35895538330078, 79.20320129394531, 83.04743957519531, 86.89168548583984, 90.73593139648438, 94.5801773071289, 98.42442321777344, 102.26866912841797, 106.1129150390625, 109.95716094970703, 113.80140686035156, 117.64564514160156, 121.4898910522461, 125.33413696289062, 129.17837524414062, 133.0226287841797, 136.8668670654297, 140.71112060546875, 144.55535888671875, 148.3996124267578, 152.2438507080078, 156.08810424804688, 159.93234252929688, 163.77658081054688]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 4.0, 5.0, 7.0, 18.0, 9.0, 22.0, 15.0, 16.0, 18.0, 17.0, 22.0, 29.0, 43.0, 25.0, 44.0, 39.0, 50.0, 49.0, 43.0, 42.0, 48.0, 40.0, 33.0, 40.0, 45.0, 51.0, 35.0, 27.0, 32.0, 22.0, 20.0, 24.0, 15.0, 10.0, 10.0, 8.0, 11.0, 1.0, 3.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-75.36639404296875, -73.18787384033203, -71.00934600830078, -68.83082580566406, -66.65230560302734, -64.47378540039062, -62.295257568359375, -60.116737365722656, -57.93821716308594, -55.75969314575195, -53.581172943115234, -51.40264892578125, -49.22412872314453, -47.04560470581055, -44.86708068847656, -42.688560485839844, -40.51003646850586, -38.331512451171875, -36.152992248535156, -33.97446823120117, -31.795948028564453, -29.61742401123047, -27.438901901245117, -25.260379791259766, -23.081857681274414, -20.903335571289062, -18.72481346130371, -16.54629135131836, -14.367768287658691, -12.18924617767334, -10.010723114013672, -7.83220100402832, -5.653678894042969, -3.475156545639038, -1.2966341972351074, 0.8818883895874023, 3.060410499572754, 5.2389326095581055, 7.417455673217773, 9.595977783203125, 11.774499893188477, 13.953022003173828, 16.13154411315918, 18.31006622314453, 20.488590240478516, 22.667110443115234, 24.84563446044922, 27.02415657043457, 29.202678680419922, 31.381200790405273, 33.559722900390625, 35.73824691772461, 37.91676712036133, 40.09529113769531, 42.27381134033203, 44.452335357666016, 46.630859375, 48.809383392333984, 50.9879035949707, 53.16642761230469, 55.344947814941406, 57.52347183227539, 59.701995849609375, 61.880516052246094, 64.05903625488281]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 8.0, 5.0, 15.0, 12.0, 21.0, 37.0, 58.0, 82.0, 136.0, 181.0, 249.0, 414.0, 629.0, 965.0, 1488.0, 2064.0, 3432.0, 5163.0, 7923.0, 12877.0, 20627.0, 33902.0, 58625.0, 106007.0, 218129.0, 622104.0, 1670665.0, 875180.0, 266282.0, 121655.0, 65053.0, 37801.0, 22615.0, 13756.0, 8840.0, 5878.0, 3720.0, 2447.0, 1613.0, 1103.0, 758.0, 509.0, 407.0, 262.0, 206.0, 122.0, 79.0, 51.0, 45.0, 26.0, 17.0, 18.0, 14.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.0625, -73.4951171875, -70.927734375, -68.3603515625, -65.79296875, -63.2255859375, -60.658203125, -58.0908203125, -55.5234375, -52.9560546875, -50.388671875, -47.8212890625, -45.25390625, -42.6865234375, -40.119140625, -37.5517578125, -34.984375, -32.4169921875, -29.849609375, -27.2822265625, -24.71484375, -22.1474609375, -19.580078125, -17.0126953125, -14.4453125, -11.8779296875, -9.310546875, -6.7431640625, -4.17578125, -1.6083984375, 0.958984375, 3.5263671875, 6.09375, 8.6611328125, 11.228515625, 13.7958984375, 16.36328125, 18.9306640625, 21.498046875, 24.0654296875, 26.6328125, 29.2001953125, 31.767578125, 34.3349609375, 36.90234375, 39.4697265625, 42.037109375, 44.6044921875, 47.171875, 49.7392578125, 52.306640625, 54.8740234375, 57.44140625, 60.0087890625, 62.576171875, 65.1435546875, 67.7109375, 70.2783203125, 72.845703125, 75.4130859375, 77.98046875, 80.5478515625, 83.115234375, 85.6826171875, 88.25]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 15.0, 8.0, 13.0, 19.0, 19.0, 25.0, 35.0, 25.0, 28.0, 24.0, 37.0, 45.0, 33.0, 37.0, 40.0, 46.0, 48.0, 47.0, 43.0, 46.0, 37.0, 37.0, 43.0, 36.0, 34.0, 28.0, 21.0, 16.0, 19.0, 6.0, 14.0, 8.0, 5.0, 13.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.91552734375, -34.8310546875, -33.74658203125, -32.662109375, -31.57763671875, -30.4931640625, -29.40869140625, -28.32421875, -27.23974609375, -26.1552734375, -25.07080078125, -23.986328125, -22.90185546875, -21.8173828125, -20.73291015625, -19.6484375, -18.56396484375, -17.4794921875, -16.39501953125, -15.310546875, -14.22607421875, -13.1416015625, -12.05712890625, -10.97265625, -9.88818359375, -8.8037109375, -7.71923828125, -6.634765625, -5.55029296875, -4.4658203125, -3.38134765625, -2.296875, -1.21240234375, -0.1279296875, 0.95654296875, 2.041015625, 3.12548828125, 4.2099609375, 5.29443359375, 6.37890625, 7.46337890625, 8.5478515625, 9.63232421875, 10.716796875, 11.80126953125, 12.8857421875, 13.97021484375, 15.0546875, 16.13916015625, 17.2236328125, 18.30810546875, 19.392578125, 20.47705078125, 21.5615234375, 22.64599609375, 23.73046875, 24.81494140625, 25.8994140625, 26.98388671875, 28.068359375, 29.15283203125, 30.2373046875, 31.32177734375, 32.40625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 6.0, 5.0, 6.0, 13.0, 15.0, 18.0, 29.0, 49.0, 45.0, 72.0, 100.0, 131.0, 154.0, 243.0, 298.0, 444.0, 657.0, 935.0, 1381.0, 2100.0, 3368.0, 5708.0, 9923.0, 18781.0, 38687.0, 87469.0, 228177.0, 758607.0, 2036654.0, 643830.0, 200068.0, 78611.0, 35774.0, 17809.0, 9369.0, 5317.0, 3262.0, 2001.0, 1286.0, 889.0, 612.0, 396.0, 283.0, 187.0, 146.0, 104.0, 56.0, 65.0, 42.0, 24.0, 29.0, 22.0, 8.0, 11.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-92.875, -89.9208984375, -86.966796875, -84.0126953125, -81.05859375, -78.1044921875, -75.150390625, -72.1962890625, -69.2421875, -66.2880859375, -63.333984375, -60.3798828125, -57.42578125, -54.4716796875, -51.517578125, -48.5634765625, -45.609375, -42.6552734375, -39.701171875, -36.7470703125, -33.79296875, -30.8388671875, -27.884765625, -24.9306640625, -21.9765625, -19.0224609375, -16.068359375, -13.1142578125, -10.16015625, -7.2060546875, -4.251953125, -1.2978515625, 1.65625, 4.6103515625, 7.564453125, 10.5185546875, 13.47265625, 16.4267578125, 19.380859375, 22.3349609375, 25.2890625, 28.2431640625, 31.197265625, 34.1513671875, 37.10546875, 40.0595703125, 43.013671875, 45.9677734375, 48.921875, 51.8759765625, 54.830078125, 57.7841796875, 60.73828125, 63.6923828125, 66.646484375, 69.6005859375, 72.5546875, 75.5087890625, 78.462890625, 81.4169921875, 84.37109375, 87.3251953125, 90.279296875, 93.2333984375, 96.1875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 0.0, 3.0, 5.0, 9.0, 14.0, 16.0, 28.0, 25.0, 37.0, 41.0, 53.0, 77.0, 95.0, 132.0, 162.0, 171.0, 235.0, 288.0, 325.0, 431.0, 361.0, 344.0, 265.0, 202.0, 169.0, 132.0, 95.0, 68.0, 68.0, 59.0, 38.0, 25.0, 14.0, 17.0, 16.0, 9.0, 11.0, 8.0, 4.0, 5.0, 3.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.544921875, -17.85546875, -17.166015625, -16.4765625, -15.787109375, -15.09765625, -14.408203125, -13.71875, -13.029296875, -12.33984375, -11.650390625, -10.9609375, -10.271484375, -9.58203125, -8.892578125, -8.203125, -7.513671875, -6.82421875, -6.134765625, -5.4453125, -4.755859375, -4.06640625, -3.376953125, -2.6875, -1.998046875, -1.30859375, -0.619140625, 0.0703125, 0.759765625, 1.44921875, 2.138671875, 2.828125, 3.517578125, 4.20703125, 4.896484375, 5.5859375, 6.275390625, 6.96484375, 7.654296875, 8.34375, 9.033203125, 9.72265625, 10.412109375, 11.1015625, 11.791015625, 12.48046875, 13.169921875, 13.859375, 14.548828125, 15.23828125, 15.927734375, 16.6171875, 17.306640625, 17.99609375, 18.685546875, 19.375, 20.064453125, 20.75390625, 21.443359375, 22.1328125, 22.822265625, 23.51171875, 24.201171875, 24.890625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 13.0, 19.0, 14.0, 29.0, 34.0, 42.0, 53.0, 77.0, 98.0, 131.0, 111.0, 95.0, 71.0, 43.0, 38.0, 25.0, 14.0, 18.0, 8.0, 9.0, 7.0, 3.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.93960952758789, -58.42152404785156, -55.90343475341797, -53.38534927368164, -50.86726379394531, -48.34917449951172, -45.83108901977539, -43.31300354003906, -40.79491424560547, -38.27682876586914, -35.75873947143555, -33.24065399169922, -30.72256851196289, -28.20448112487793, -25.68639373779297, -23.16830825805664, -20.650222778320312, -18.13213539123535, -15.614049911499023, -13.095962524414062, -10.577876091003418, -8.059789657592773, -5.5417022705078125, -3.0236167907714844, -0.5055294036865234, 2.0125572681427, 4.530643939971924, 7.048730850219727, 9.566817283630371, 12.084903717041016, 14.602991104125977, 17.121076583862305, 19.63916778564453, 22.157255172729492, 24.67534065246582, 27.19342803955078, 29.71151351928711, 32.22959899902344, 34.74768829345703, 37.26577377319336, 39.78385925292969, 42.301944732666016, 44.82003402709961, 47.33811950683594, 49.856204986572266, 52.374290466308594, 54.89237976074219, 57.410465240478516, 59.92855453491211, 62.44664001464844, 64.96472930908203, 67.48281860351562, 70.00090026855469, 72.51898956298828, 75.03707885742188, 77.55516052246094, 80.07324981689453, 82.59133911132812, 85.10942077636719, 87.62751007080078, 90.14559936523438, 92.66368103027344, 95.18177032470703, 97.69985961914062, 100.21794128417969]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 11.0, 7.0, 6.0, 8.0, 12.0, 25.0, 11.0, 17.0, 17.0, 27.0, 14.0, 20.0, 17.0, 26.0, 23.0, 35.0, 31.0, 32.0, 55.0, 41.0, 40.0, 48.0, 36.0, 35.0, 33.0, 27.0, 40.0, 27.0, 34.0, 31.0, 22.0, 29.0, 20.0, 21.0, 12.0, 20.0, 8.0, 13.0, 11.0, 8.0, 10.0, 11.0, 4.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.36384201049805, -34.25358963012695, -33.14333724975586, -32.03308868408203, -30.922836303710938, -29.812583923339844, -28.70233154296875, -27.592079162597656, -26.481828689575195, -25.3715763092041, -24.26132583618164, -23.151073455810547, -22.040821075439453, -20.930570602416992, -19.8203182220459, -18.710067749023438, -17.599815368652344, -16.48956298828125, -15.379312515258789, -14.269060134887695, -13.158808708190918, -12.04855728149414, -10.938304901123047, -9.82805347442627, -8.717802047729492, -7.607550621032715, -6.497298717498779, -5.387046813964844, -4.276795387268066, -3.166543960571289, -2.0562920570373535, -0.946040153503418, 0.164215087890625, 1.2744667530059814, 2.384718418121338, 3.4949700832366943, 4.605221748352051, 5.715473175048828, 6.825725078582764, 7.935976982116699, 9.046228408813477, 10.156479835510254, 11.266731262207031, 12.376983642578125, 13.487235069274902, 14.59748649597168, 15.707738876342773, 16.817989349365234, 17.928241729736328, 19.038494110107422, 20.148744583129883, 21.258996963500977, 22.369247436523438, 23.47949981689453, 24.589752197265625, 25.70000457763672, 26.81025505065918, 27.920507431030273, 29.030757904052734, 30.141010284423828, 31.251262664794922, 32.36151123046875, 33.471763610839844, 34.58201599121094, 35.69226837158203]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 16.0, 12.0, 25.0, 37.0, 55.0, 62.0, 79.0, 119.0, 153.0, 234.0, 338.0, 460.0, 670.0, 991.0, 1528.0, 2011.0, 3145.0, 4656.0, 7229.0, 11948.0, 20254.0, 36284.0, 70830.0, 160901.0, 359452.0, 188320.0, 79831.0, 40591.0, 22010.0, 12958.0, 7914.0, 4993.0, 3273.0, 2164.0, 1475.0, 990.0, 759.0, 496.0, 374.0, 254.0, 183.0, 130.0, 91.0, 59.0, 60.0, 37.0, 35.0, 20.0, 13.0, 12.0, 6.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0], "bins": [-47.1875, -45.693359375, -44.19921875, -42.705078125, -41.2109375, -39.716796875, -38.22265625, -36.728515625, -35.234375, -33.740234375, -32.24609375, -30.751953125, -29.2578125, -27.763671875, -26.26953125, -24.775390625, -23.28125, -21.787109375, -20.29296875, -18.798828125, -17.3046875, -15.810546875, -14.31640625, -12.822265625, -11.328125, -9.833984375, -8.33984375, -6.845703125, -5.3515625, -3.857421875, -2.36328125, -0.869140625, 0.625, 2.119140625, 3.61328125, 5.107421875, 6.6015625, 8.095703125, 9.58984375, 11.083984375, 12.578125, 14.072265625, 15.56640625, 17.060546875, 18.5546875, 20.048828125, 21.54296875, 23.037109375, 24.53125, 26.025390625, 27.51953125, 29.013671875, 30.5078125, 32.001953125, 33.49609375, 34.990234375, 36.484375, 37.978515625, 39.47265625, 40.966796875, 42.4609375, 43.955078125, 45.44921875, 46.943359375, 48.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 4.0, 6.0, 8.0, 5.0, 5.0, 12.0, 10.0, 17.0, 18.0, 14.0, 23.0, 17.0, 20.0, 22.0, 23.0, 25.0, 33.0, 50.0, 38.0, 51.0, 45.0, 40.0, 38.0, 53.0, 38.0, 46.0, 46.0, 36.0, 32.0, 26.0, 32.0, 16.0, 18.0, 24.0, 11.0, 11.0, 13.0, 15.0, 17.0, 8.0, 10.0, 6.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-47.1875, -45.87744140625, -44.5673828125, -43.25732421875, -41.947265625, -40.63720703125, -39.3271484375, -38.01708984375, -36.70703125, -35.39697265625, -34.0869140625, -32.77685546875, -31.466796875, -30.15673828125, -28.8466796875, -27.53662109375, -26.2265625, -24.91650390625, -23.6064453125, -22.29638671875, -20.986328125, -19.67626953125, -18.3662109375, -17.05615234375, -15.74609375, -14.43603515625, -13.1259765625, -11.81591796875, -10.505859375, -9.19580078125, -7.8857421875, -6.57568359375, -5.265625, -3.95556640625, -2.6455078125, -1.33544921875, -0.025390625, 1.28466796875, 2.5947265625, 3.90478515625, 5.21484375, 6.52490234375, 7.8349609375, 9.14501953125, 10.455078125, 11.76513671875, 13.0751953125, 14.38525390625, 15.6953125, 17.00537109375, 18.3154296875, 19.62548828125, 20.935546875, 22.24560546875, 23.5556640625, 24.86572265625, 26.17578125, 27.48583984375, 28.7958984375, 30.10595703125, 31.416015625, 32.72607421875, 34.0361328125, 35.34619140625, 36.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 11.0, 14.0, 21.0, 16.0, 24.0, 44.0, 71.0, 78.0, 108.0, 161.0, 231.0, 289.0, 441.0, 640.0, 893.0, 1400.0, 2153.0, 3529.0, 6350.0, 12672.0, 29647.0, 94396.0, 578183.0, 225895.0, 50614.0, 18915.0, 8662.0, 4712.0, 2799.0, 1812.0, 1190.0, 807.0, 528.0, 373.0, 254.0, 174.0, 128.0, 99.0, 54.0, 35.0, 32.0, 22.0, 29.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-70.1875, -67.9052734375, -65.623046875, -63.3408203125, -61.05859375, -58.7763671875, -56.494140625, -54.2119140625, -51.9296875, -49.6474609375, -47.365234375, -45.0830078125, -42.80078125, -40.5185546875, -38.236328125, -35.9541015625, -33.671875, -31.3896484375, -29.107421875, -26.8251953125, -24.54296875, -22.2607421875, -19.978515625, -17.6962890625, -15.4140625, -13.1318359375, -10.849609375, -8.5673828125, -6.28515625, -4.0029296875, -1.720703125, 0.5615234375, 2.84375, 5.1259765625, 7.408203125, 9.6904296875, 11.97265625, 14.2548828125, 16.537109375, 18.8193359375, 21.1015625, 23.3837890625, 25.666015625, 27.9482421875, 30.23046875, 32.5126953125, 34.794921875, 37.0771484375, 39.359375, 41.6416015625, 43.923828125, 46.2060546875, 48.48828125, 50.7705078125, 53.052734375, 55.3349609375, 57.6171875, 59.8994140625, 62.181640625, 64.4638671875, 66.74609375, 69.0283203125, 71.310546875, 73.5927734375, 75.875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 3.0, 9.0, 14.0, 8.0, 12.0, 13.0, 16.0, 17.0, 24.0, 17.0, 23.0, 23.0, 31.0, 28.0, 44.0, 30.0, 29.0, 37.0, 27.0, 35.0, 55.0, 41.0, 40.0, 33.0, 32.0, 31.0, 31.0, 30.0, 39.0, 26.0, 23.0, 23.0, 25.0, 23.0, 13.0, 12.0, 14.0, 8.0, 15.0, 9.0, 4.0, 8.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-35.8125, -34.70556640625, -33.5986328125, -32.49169921875, -31.384765625, -30.27783203125, -29.1708984375, -28.06396484375, -26.95703125, -25.85009765625, -24.7431640625, -23.63623046875, -22.529296875, -21.42236328125, -20.3154296875, -19.20849609375, -18.1015625, -16.99462890625, -15.8876953125, -14.78076171875, -13.673828125, -12.56689453125, -11.4599609375, -10.35302734375, -9.24609375, -8.13916015625, -7.0322265625, -5.92529296875, -4.818359375, -3.71142578125, -2.6044921875, -1.49755859375, -0.390625, 0.71630859375, 1.8232421875, 2.93017578125, 4.037109375, 5.14404296875, 6.2509765625, 7.35791015625, 8.46484375, 9.57177734375, 10.6787109375, 11.78564453125, 12.892578125, 13.99951171875, 15.1064453125, 16.21337890625, 17.3203125, 18.42724609375, 19.5341796875, 20.64111328125, 21.748046875, 22.85498046875, 23.9619140625, 25.06884765625, 26.17578125, 27.28271484375, 28.3896484375, 29.49658203125, 30.603515625, 31.71044921875, 32.8173828125, 33.92431640625, 35.03125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 7.0, 5.0, 5.0, 4.0, 11.0, 14.0, 17.0, 26.0, 26.0, 50.0, 77.0, 95.0, 120.0, 168.0, 234.0, 307.0, 440.0, 652.0, 927.0, 1194.0, 1801.0, 2686.0, 4055.0, 6633.0, 12172.0, 25481.0, 73999.0, 550597.0, 266633.0, 52329.0, 20532.0, 9906.0, 5747.0, 3618.0, 2334.0, 1551.0, 1197.0, 756.0, 625.0, 442.0, 275.0, 215.0, 173.0, 121.0, 81.0, 68.0, 48.0, 35.0, 14.0, 14.0, 15.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0], "bins": [-64.4375, -62.4765625, -60.515625, -58.5546875, -56.59375, -54.6328125, -52.671875, -50.7109375, -48.75, -46.7890625, -44.828125, -42.8671875, -40.90625, -38.9453125, -36.984375, -35.0234375, -33.0625, -31.1015625, -29.140625, -27.1796875, -25.21875, -23.2578125, -21.296875, -19.3359375, -17.375, -15.4140625, -13.453125, -11.4921875, -9.53125, -7.5703125, -5.609375, -3.6484375, -1.6875, 0.2734375, 2.234375, 4.1953125, 6.15625, 8.1171875, 10.078125, 12.0390625, 14.0, 15.9609375, 17.921875, 19.8828125, 21.84375, 23.8046875, 25.765625, 27.7265625, 29.6875, 31.6484375, 33.609375, 35.5703125, 37.53125, 39.4921875, 41.453125, 43.4140625, 45.375, 47.3359375, 49.296875, 51.2578125, 53.21875, 55.1796875, 57.140625, 59.1015625, 61.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 5.0, 6.0, 9.0, 8.0, 10.0, 10.0, 13.0, 17.0, 25.0, 19.0, 28.0, 32.0, 37.0, 43.0, 53.0, 62.0, 70.0, 65.0, 67.0, 58.0, 50.0, 44.0, 34.0, 29.0, 27.0, 23.0, 32.0, 16.0, 13.0, 18.0, 14.0, 9.0, 6.0, 5.0, 9.0, 6.0, 8.0, 3.0, 3.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019702911376953125, -0.0019056499004364014, -0.0018410086631774902, -0.001776367425918579, -0.001711726188659668, -0.0016470849514007568, -0.0015824437141418457, -0.0015178024768829346, -0.0014531612396240234, -0.0013885200023651123, -0.0013238787651062012, -0.00125923752784729, -0.001194596290588379, -0.0011299550533294678, -0.0010653138160705566, -0.0010006725788116455, -0.0009360313415527344, -0.0008713901042938232, -0.0008067488670349121, -0.000742107629776001, -0.0006774663925170898, -0.0006128251552581787, -0.0005481839179992676, -0.00048354268074035645, -0.0004189014434814453, -0.0003542602062225342, -0.00028961896896362305, -0.00022497773170471191, -0.00016033649444580078, -9.569525718688965e-05, -3.1054019927978516e-05, 3.358721733093262e-05, 9.822845458984375e-05, 0.00016286969184875488, 0.00022751092910766602, 0.00029215216636657715, 0.0003567934036254883, 0.0004214346408843994, 0.00048607587814331055, 0.0005507171154022217, 0.0006153583526611328, 0.0006799995899200439, 0.0007446408271789551, 0.0008092820644378662, 0.0008739233016967773, 0.0009385645389556885, 0.0010032057762145996, 0.0010678470134735107, 0.0011324882507324219, 0.001197129487991333, 0.0012617707252502441, 0.0013264119625091553, 0.0013910531997680664, 0.0014556944370269775, 0.0015203356742858887, 0.0015849769115447998, 0.001649618148803711, 0.001714259386062622, 0.0017789006233215332, 0.0018435418605804443, 0.0019081830978393555, 0.0019728243350982666, 0.0020374655723571777, 0.002102106809616089, 0.002166748046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 21.0, 25.0, 36.0, 63.0, 95.0, 135.0, 231.0, 371.0, 624.0, 1047.0, 1950.0, 3646.0, 6980.0, 14358.0, 31961.0, 88294.0, 389440.0, 363297.0, 85603.0, 31502.0, 13874.0, 6814.0, 3603.0, 1884.0, 1093.0, 615.0, 353.0, 214.0, 134.0, 83.0, 63.0, 37.0, 34.0, 21.0, 9.0, 9.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.25, -67.0849609375, -64.919921875, -62.7548828125, -60.58984375, -58.4248046875, -56.259765625, -54.0947265625, -51.9296875, -49.7646484375, -47.599609375, -45.4345703125, -43.26953125, -41.1044921875, -38.939453125, -36.7744140625, -34.609375, -32.4443359375, -30.279296875, -28.1142578125, -25.94921875, -23.7841796875, -21.619140625, -19.4541015625, -17.2890625, -15.1240234375, -12.958984375, -10.7939453125, -8.62890625, -6.4638671875, -4.298828125, -2.1337890625, 0.03125, 2.1962890625, 4.361328125, 6.5263671875, 8.69140625, 10.8564453125, 13.021484375, 15.1865234375, 17.3515625, 19.5166015625, 21.681640625, 23.8466796875, 26.01171875, 28.1767578125, 30.341796875, 32.5068359375, 34.671875, 36.8369140625, 39.001953125, 41.1669921875, 43.33203125, 45.4970703125, 47.662109375, 49.8271484375, 51.9921875, 54.1572265625, 56.322265625, 58.4873046875, 60.65234375, 62.8173828125, 64.982421875, 67.1474609375, 69.3125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 13.0, 14.0, 18.0, 22.0, 25.0, 19.0, 31.0, 39.0, 48.0, 51.0, 77.0, 88.0, 95.0, 69.0, 59.0, 52.0, 42.0, 39.0, 28.0, 25.0, 19.0, 25.0, 17.0, 16.0, 13.0, 13.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.140625, -8.7945556640625, -8.448486328125, -8.1024169921875, -7.75634765625, -7.4102783203125, -7.064208984375, -6.7181396484375, -6.3720703125, -6.0260009765625, -5.679931640625, -5.3338623046875, -4.98779296875, -4.6417236328125, -4.295654296875, -3.9495849609375, -3.603515625, -3.2574462890625, -2.911376953125, -2.5653076171875, -2.21923828125, -1.8731689453125, -1.527099609375, -1.1810302734375, -0.8349609375, -0.4888916015625, -0.142822265625, 0.2032470703125, 0.54931640625, 0.8953857421875, 1.241455078125, 1.5875244140625, 1.93359375, 2.2796630859375, 2.625732421875, 2.9718017578125, 3.31787109375, 3.6639404296875, 4.010009765625, 4.3560791015625, 4.7021484375, 5.0482177734375, 5.394287109375, 5.7403564453125, 6.08642578125, 6.4324951171875, 6.778564453125, 7.1246337890625, 7.470703125, 7.8167724609375, 8.162841796875, 8.5089111328125, 8.85498046875, 9.2010498046875, 9.547119140625, 9.8931884765625, 10.2392578125, 10.5853271484375, 10.931396484375, 11.2774658203125, 11.62353515625, 11.9696044921875, 12.315673828125, 12.6617431640625, 13.0078125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 12.0, 7.0, 9.0, 17.0, 25.0, 26.0, 44.0, 69.0, 83.0, 107.0, 145.0, 125.0, 86.0, 62.0, 46.0, 28.0, 19.0, 15.0, 12.0, 7.0, 10.0, 4.0, 9.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.72271728515625, -67.87286376953125, -65.02301025390625, -62.173160552978516, -59.32331085205078, -56.47345733642578, -53.62360382080078, -50.77375030517578, -47.92390060424805, -45.07404708862305, -42.22419738769531, -39.37434387207031, -36.52449035644531, -33.67464065551758, -30.824787139892578, -27.97493553161621, -25.125083923339844, -22.275232315063477, -19.42538070678711, -16.57552719116211, -13.725675582885742, -10.875823974609375, -8.025970458984375, -5.176118850708008, -2.3262672424316406, 0.5235848426818848, 3.37343692779541, 6.223289489746094, 9.073141098022461, 11.922992706298828, 14.772846221923828, 17.622697830200195, 20.472549438476562, 23.32240104675293, 26.172252655029297, 29.022106170654297, 31.871957778930664, 34.72180938720703, 37.57166290283203, 40.42151641845703, 43.271366119384766, 46.121219635009766, 48.9710693359375, 51.8209228515625, 54.6707763671875, 57.520626068115234, 60.370479583740234, 63.22032928466797, 66.07018280029297, 68.92003631591797, 71.76988983154297, 74.61973571777344, 77.46958923339844, 80.31944274902344, 83.16929626464844, 86.01914978027344, 88.86900329589844, 91.71885681152344, 94.56871032714844, 97.41856384277344, 100.2684097290039, 103.1182632446289, 105.9681167602539, 108.8179702758789, 111.66781616210938]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 8.0, 11.0, 13.0, 10.0, 8.0, 23.0, 15.0, 23.0, 16.0, 23.0, 18.0, 22.0, 25.0, 43.0, 33.0, 38.0, 28.0, 50.0, 36.0, 41.0, 33.0, 46.0, 37.0, 36.0, 32.0, 27.0, 30.0, 22.0, 21.0, 25.0, 24.0, 21.0, 19.0, 18.0, 19.0, 11.0, 16.0, 11.0, 5.0, 4.0, 7.0, 10.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-37.795108795166016, -36.66645050048828, -35.53779602050781, -34.40913772583008, -33.280479431152344, -32.151824951171875, -31.02316665649414, -29.89451026916504, -28.765853881835938, -27.637197494506836, -26.5085391998291, -25.3798828125, -24.2512264251709, -23.122570037841797, -21.993911743164062, -20.86525535583496, -19.736597061157227, -18.607940673828125, -17.47928237915039, -16.35062599182129, -15.221969604492188, -14.09331226348877, -12.964654922485352, -11.83599853515625, -10.707341194152832, -9.578683853149414, -8.450027465820312, -7.3213701248168945, -6.192713260650635, -5.064056396484375, -3.935399055480957, -2.8067421913146973, -1.6780853271484375, -0.5494283437728882, 0.5792286396026611, 1.7078857421875, 2.8365426063537598, 3.9651994705200195, 5.0938568115234375, 6.222513675689697, 7.351170539855957, 8.479827880859375, 9.608484268188477, 10.737141609191895, 11.865798950195312, 12.994455337524414, 14.123112678527832, 15.25177001953125, 16.38042640686035, 17.509082794189453, 18.637741088867188, 19.76639747619629, 20.89505386352539, 22.023712158203125, 23.152368545532227, 24.281024932861328, 25.409683227539062, 26.538339614868164, 27.6669979095459, 28.795654296875, 29.9243106842041, 31.052967071533203, 32.18162536621094, 33.31028366088867, 34.43893814086914]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 8.0, 14.0, 19.0, 35.0, 46.0, 72.0, 101.0, 146.0, 180.0, 287.0, 413.0, 615.0, 877.0, 1277.0, 1999.0, 3143.0, 4860.0, 7771.0, 12220.0, 20161.0, 32195.0, 52488.0, 86078.0, 140565.0, 207628.0, 180526.0, 112451.0, 69557.0, 42395.0, 26218.0, 16077.0, 10085.0, 6295.0, 4062.0, 2595.0, 1656.0, 1069.0, 691.0, 527.0, 361.0, 240.0, 176.0, 114.0, 75.0, 44.0, 48.0, 27.0, 30.0, 7.0, 7.0, 9.0, 5.0, 5.0, 0.0, 1.0], "bins": [-78.375, -76.0546875, -73.734375, -71.4140625, -69.09375, -66.7734375, -64.453125, -62.1328125, -59.8125, -57.4921875, -55.171875, -52.8515625, -50.53125, -48.2109375, -45.890625, -43.5703125, -41.25, -38.9296875, -36.609375, -34.2890625, -31.96875, -29.6484375, -27.328125, -25.0078125, -22.6875, -20.3671875, -18.046875, -15.7265625, -13.40625, -11.0859375, -8.765625, -6.4453125, -4.125, -1.8046875, 0.515625, 2.8359375, 5.15625, 7.4765625, 9.796875, 12.1171875, 14.4375, 16.7578125, 19.078125, 21.3984375, 23.71875, 26.0390625, 28.359375, 30.6796875, 33.0, 35.3203125, 37.640625, 39.9609375, 42.28125, 44.6015625, 46.921875, 49.2421875, 51.5625, 53.8828125, 56.203125, 58.5234375, 60.84375, 63.1640625, 65.484375, 67.8046875, 70.125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 9.0, 6.0, 6.0, 10.0, 10.0, 20.0, 12.0, 14.0, 21.0, 19.0, 29.0, 27.0, 22.0, 41.0, 28.0, 30.0, 29.0, 33.0, 37.0, 39.0, 36.0, 42.0, 41.0, 38.0, 49.0, 40.0, 29.0, 26.0, 22.0, 40.0, 30.0, 22.0, 17.0, 11.0, 17.0, 18.0, 14.0, 17.0, 5.0, 8.0, 11.0, 6.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-35.1875, -34.1552734375, -33.123046875, -32.0908203125, -31.05859375, -30.0263671875, -28.994140625, -27.9619140625, -26.9296875, -25.8974609375, -24.865234375, -23.8330078125, -22.80078125, -21.7685546875, -20.736328125, -19.7041015625, -18.671875, -17.6396484375, -16.607421875, -15.5751953125, -14.54296875, -13.5107421875, -12.478515625, -11.4462890625, -10.4140625, -9.3818359375, -8.349609375, -7.3173828125, -6.28515625, -5.2529296875, -4.220703125, -3.1884765625, -2.15625, -1.1240234375, -0.091796875, 0.9404296875, 1.97265625, 3.0048828125, 4.037109375, 5.0693359375, 6.1015625, 7.1337890625, 8.166015625, 9.1982421875, 10.23046875, 11.2626953125, 12.294921875, 13.3271484375, 14.359375, 15.3916015625, 16.423828125, 17.4560546875, 18.48828125, 19.5205078125, 20.552734375, 21.5849609375, 22.6171875, 23.6494140625, 24.681640625, 25.7138671875, 26.74609375, 27.7783203125, 28.810546875, 29.8427734375, 30.875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 15.0, 9.0, 20.0, 31.0, 44.0, 64.0, 109.0, 177.0, 247.0, 376.0, 561.0, 870.0, 1312.0, 2042.0, 3195.0, 5083.0, 8476.0, 14059.0, 24764.0, 43771.0, 82524.0, 163631.0, 275619.0, 197833.0, 99987.0, 52098.0, 29056.0, 16633.0, 9733.0, 5981.0, 3625.0, 2237.0, 1477.0, 994.0, 596.0, 409.0, 282.0, 202.0, 129.0, 87.0, 58.0, 38.0, 37.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0], "bins": [-90.1875, -87.6572265625, -85.126953125, -82.5966796875, -80.06640625, -77.5361328125, -75.005859375, -72.4755859375, -69.9453125, -67.4150390625, -64.884765625, -62.3544921875, -59.82421875, -57.2939453125, -54.763671875, -52.2333984375, -49.703125, -47.1728515625, -44.642578125, -42.1123046875, -39.58203125, -37.0517578125, -34.521484375, -31.9912109375, -29.4609375, -26.9306640625, -24.400390625, -21.8701171875, -19.33984375, -16.8095703125, -14.279296875, -11.7490234375, -9.21875, -6.6884765625, -4.158203125, -1.6279296875, 0.90234375, 3.4326171875, 5.962890625, 8.4931640625, 11.0234375, 13.5537109375, 16.083984375, 18.6142578125, 21.14453125, 23.6748046875, 26.205078125, 28.7353515625, 31.265625, 33.7958984375, 36.326171875, 38.8564453125, 41.38671875, 43.9169921875, 46.447265625, 48.9775390625, 51.5078125, 54.0380859375, 56.568359375, 59.0986328125, 61.62890625, 64.1591796875, 66.689453125, 69.2197265625, 71.75]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 10.0, 10.0, 13.0, 4.0, 16.0, 19.0, 26.0, 24.0, 22.0, 27.0, 28.0, 32.0, 33.0, 33.0, 30.0, 26.0, 44.0, 41.0, 35.0, 39.0, 38.0, 46.0, 47.0, 31.0, 33.0, 31.0, 26.0, 25.0, 31.0, 20.0, 17.0, 15.0, 16.0, 16.0, 10.0, 17.0, 9.0, 10.0, 3.0, 7.0, 3.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0], "bins": [-29.0625, -28.242919921875, -27.42333984375, -26.603759765625, -25.7841796875, -24.964599609375, -24.14501953125, -23.325439453125, -22.505859375, -21.686279296875, -20.86669921875, -20.047119140625, -19.2275390625, -18.407958984375, -17.58837890625, -16.768798828125, -15.94921875, -15.129638671875, -14.31005859375, -13.490478515625, -12.6708984375, -11.851318359375, -11.03173828125, -10.212158203125, -9.392578125, -8.572998046875, -7.75341796875, -6.933837890625, -6.1142578125, -5.294677734375, -4.47509765625, -3.655517578125, -2.8359375, -2.016357421875, -1.19677734375, -0.377197265625, 0.4423828125, 1.261962890625, 2.08154296875, 2.901123046875, 3.720703125, 4.540283203125, 5.35986328125, 6.179443359375, 6.9990234375, 7.818603515625, 8.63818359375, 9.457763671875, 10.27734375, 11.096923828125, 11.91650390625, 12.736083984375, 13.5556640625, 14.375244140625, 15.19482421875, 16.014404296875, 16.833984375, 17.653564453125, 18.47314453125, 19.292724609375, 20.1123046875, 20.931884765625, 21.75146484375, 22.571044921875, 23.390625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 23.0, 13.0, 23.0, 22.0, 31.0, 36.0, 61.0, 74.0, 141.0, 180.0, 263.0, 373.0, 609.0, 1115.0, 2178.0, 5503.0, 20731.0, 209966.0, 758386.0, 34694.0, 7785.0, 2865.0, 1335.0, 699.0, 435.0, 325.0, 169.0, 136.0, 108.0, 71.0, 69.0, 41.0, 26.0, 19.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-486.25, -472.01171875, -457.7734375, -443.53515625, -429.296875, -415.05859375, -400.8203125, -386.58203125, -372.34375, -358.10546875, -343.8671875, -329.62890625, -315.390625, -301.15234375, -286.9140625, -272.67578125, -258.4375, -244.19921875, -229.9609375, -215.72265625, -201.484375, -187.24609375, -173.0078125, -158.76953125, -144.53125, -130.29296875, -116.0546875, -101.81640625, -87.578125, -73.33984375, -59.1015625, -44.86328125, -30.625, -16.38671875, -2.1484375, 12.08984375, 26.328125, 40.56640625, 54.8046875, 69.04296875, 83.28125, 97.51953125, 111.7578125, 125.99609375, 140.234375, 154.47265625, 168.7109375, 182.94921875, 197.1875, 211.42578125, 225.6640625, 239.90234375, 254.140625, 268.37890625, 282.6171875, 296.85546875, 311.09375, 325.33203125, 339.5703125, 353.80859375, 368.046875, 382.28515625, 396.5234375, 410.76171875, 425.0]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 8.0, 21.0, 20.0, 33.0, 77.0, 115.0, 180.0, 206.0, 119.0, 72.0, 46.0, 29.0, 20.0, 11.0, 8.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.012204885482788086, -0.011867046356201172, -0.011529207229614258, -0.011191368103027344, -0.01085352897644043, -0.010515689849853516, -0.010177850723266602, -0.009840011596679688, -0.009502172470092773, -0.00916433334350586, -0.008826494216918945, -0.008488655090332031, -0.008150815963745117, -0.007812976837158203, -0.007475137710571289, -0.007137298583984375, -0.006799459457397461, -0.006461620330810547, -0.006123781204223633, -0.005785942077636719, -0.005448102951049805, -0.005110263824462891, -0.0047724246978759766, -0.0044345855712890625, -0.0040967464447021484, -0.0037589073181152344, -0.0034210681915283203, -0.0030832290649414062, -0.002745389938354492, -0.002407550811767578, -0.002069711685180664, -0.00173187255859375, -0.001394033432006836, -0.0010561943054199219, -0.0007183551788330078, -0.00038051605224609375, -4.267692565917969e-05, 0.0002951622009277344, 0.0006330013275146484, 0.0009708404541015625, 0.0013086795806884766, 0.0016465187072753906, 0.0019843578338623047, 0.0023221969604492188, 0.002660036087036133, 0.002997875213623047, 0.003335714340209961, 0.003673553466796875, 0.004011392593383789, 0.004349231719970703, 0.004687070846557617, 0.005024909973144531, 0.005362749099731445, 0.005700588226318359, 0.0060384273529052734, 0.0063762664794921875, 0.0067141056060791016, 0.007051944732666016, 0.00738978385925293, 0.007727622985839844, 0.008065462112426758, 0.008403301239013672, 0.008741140365600586, 0.0090789794921875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 9.0, 9.0, 18.0, 28.0, 39.0, 32.0, 53.0, 58.0, 87.0, 136.0, 158.0, 232.0, 349.0, 455.0, 746.0, 1051.0, 1802.0, 3515.0, 8798.0, 35209.0, 719803.0, 239665.0, 22092.0, 6589.0, 2920.0, 1541.0, 980.0, 603.0, 464.0, 299.0, 204.0, 142.0, 110.0, 82.0, 57.0, 53.0, 42.0, 18.0, 17.0, 23.0, 17.0, 9.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-392.75, -380.0234375, -367.296875, -354.5703125, -341.84375, -329.1171875, -316.390625, -303.6640625, -290.9375, -278.2109375, -265.484375, -252.7578125, -240.03125, -227.3046875, -214.578125, -201.8515625, -189.125, -176.3984375, -163.671875, -150.9453125, -138.21875, -125.4921875, -112.765625, -100.0390625, -87.3125, -74.5859375, -61.859375, -49.1328125, -36.40625, -23.6796875, -10.953125, 1.7734375, 14.5, 27.2265625, 39.953125, 52.6796875, 65.40625, 78.1328125, 90.859375, 103.5859375, 116.3125, 129.0390625, 141.765625, 154.4921875, 167.21875, 179.9453125, 192.671875, 205.3984375, 218.125, 230.8515625, 243.578125, 256.3046875, 269.03125, 281.7578125, 294.484375, 307.2109375, 319.9375, 332.6640625, 345.390625, 358.1171875, 370.84375, 383.5703125, 396.296875, 409.0234375, 421.75]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 9.0, 12.0, 18.0, 56.0, 80.0, 181.0, 230.0, 167.0, 133.0, 48.0, 26.0, 8.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.875, -108.6533203125, -105.431640625, -102.2099609375, -98.98828125, -95.7666015625, -92.544921875, -89.3232421875, -86.1015625, -82.8798828125, -79.658203125, -76.4365234375, -73.21484375, -69.9931640625, -66.771484375, -63.5498046875, -60.328125, -57.1064453125, -53.884765625, -50.6630859375, -47.44140625, -44.2197265625, -40.998046875, -37.7763671875, -34.5546875, -31.3330078125, -28.111328125, -24.8896484375, -21.66796875, -18.4462890625, -15.224609375, -12.0029296875, -8.78125, -5.5595703125, -2.337890625, 0.8837890625, 4.10546875, 7.3271484375, 10.548828125, 13.7705078125, 16.9921875, 20.2138671875, 23.435546875, 26.6572265625, 29.87890625, 33.1005859375, 36.322265625, 39.5439453125, 42.765625, 45.9873046875, 49.208984375, 52.4306640625, 55.65234375, 58.8740234375, 62.095703125, 65.3173828125, 68.5390625, 71.7607421875, 74.982421875, 78.2041015625, 81.42578125, 84.6474609375, 87.869140625, 91.0908203125, 94.3125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 13.0, 20.0, 39.0, 63.0, 135.0, 198.0, 188.0, 118.0, 61.0, 37.0, 25.0, 25.0, 23.0, 11.0, 9.0, 4.0, 5.0, 7.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.72150421142578, -49.136714935302734, -44.55192565917969, -39.967140197753906, -35.38235092163086, -30.797561645507812, -26.2127742767334, -21.627986907958984, -17.043197631835938, -12.458409309387207, -7.873620986938477, -3.288832664489746, 1.2959556579589844, 5.880744934082031, 10.465532302856445, 15.05031967163086, 19.635108947753906, 24.219898223876953, 28.804685592651367, 33.38947296142578, 37.97426223754883, 42.559051513671875, 47.143836975097656, 51.7286262512207, 56.31341552734375, 60.8982048034668, 65.48299407958984, 70.06777954101562, 74.65257263183594, 79.23735809326172, 83.8221435546875, 88.40693664550781, 92.99172973632812, 97.5765151977539, 102.16130828857422, 106.74609375, 111.33088684082031, 115.9156723022461, 120.50045776367188, 125.08525085449219, 129.6700439453125, 134.2548370361328, 138.83961486816406, 143.42440795898438, 148.0092010498047, 152.593994140625, 157.17877197265625, 161.76356506347656, 166.3483428955078, 170.93313598632812, 175.51791381835938, 180.1027069091797, 184.6875, 189.27227783203125, 193.85707092285156, 198.44186401367188, 203.02664184570312, 207.61143493652344, 212.1962127685547, 216.781005859375, 221.3657989501953, 225.95059204101562, 230.53536987304688, 235.1201629638672, 239.7049560546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 13.0, 9.0, 13.0, 17.0, 16.0, 10.0, 14.0, 15.0, 18.0, 28.0, 27.0, 25.0, 30.0, 48.0, 35.0, 42.0, 28.0, 39.0, 42.0, 47.0, 34.0, 48.0, 32.0, 33.0, 35.0, 30.0, 39.0, 24.0, 22.0, 29.0, 30.0, 17.0, 17.0, 12.0, 13.0, 8.0, 12.0, 12.0, 3.0, 6.0, 7.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-45.45261001586914, -44.18706130981445, -42.92151641845703, -41.655967712402344, -40.39042282104492, -39.124874114990234, -37.85932922363281, -36.593780517578125, -35.32823181152344, -34.06268310546875, -32.79713821411133, -31.531591415405273, -30.26604461669922, -29.00049591064453, -27.734949111938477, -26.469402313232422, -25.203857421875, -23.938310623168945, -22.67276382446289, -21.407217025756836, -20.14167022705078, -18.876121520996094, -17.61057472229004, -16.345027923583984, -15.07948112487793, -13.813934326171875, -12.54838752746582, -11.28283977508545, -10.017292976379395, -8.75174617767334, -7.486198902130127, -6.220651626586914, -4.955104827880859, -3.6895577907562256, -2.424010753631592, -1.158463716506958, 0.10708332061767578, 1.3726301193237305, 2.6381773948669434, 3.9037246704101562, 5.169271469116211, 6.434818267822266, 7.7003655433654785, 8.965912818908691, 10.231459617614746, 11.4970064163208, 12.762554168701172, 14.028100967407227, 15.293647766113281, 16.559194564819336, 17.82474136352539, 19.090288162231445, 20.3558349609375, 21.621383666992188, 22.886930465698242, 24.152477264404297, 25.41802406311035, 26.683570861816406, 27.94911766052246, 29.214664459228516, 30.480213165283203, 31.745758056640625, 33.01130676269531, 34.27685546875, 35.54240036010742]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 9.0, 10.0, 12.0, 24.0, 34.0, 32.0, 68.0, 90.0, 149.0, 205.0, 311.0, 440.0, 668.0, 966.0, 1504.0, 2222.0, 3311.0, 4994.0, 7774.0, 12559.0, 20460.0, 35309.0, 63384.0, 123844.0, 286025.0, 1015646.0, 1702913.0, 517908.0, 187772.0, 89034.0, 47664.0, 26783.0, 15954.0, 9516.0, 5943.0, 3675.0, 2453.0, 1570.0, 988.0, 652.0, 441.0, 325.0, 201.0, 134.0, 111.0, 56.0, 48.0, 29.0, 21.0, 19.0, 6.0, 11.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-64.875, -62.86376953125, -60.8525390625, -58.84130859375, -56.830078125, -54.81884765625, -52.8076171875, -50.79638671875, -48.78515625, -46.77392578125, -44.7626953125, -42.75146484375, -40.740234375, -38.72900390625, -36.7177734375, -34.70654296875, -32.6953125, -30.68408203125, -28.6728515625, -26.66162109375, -24.650390625, -22.63916015625, -20.6279296875, -18.61669921875, -16.60546875, -14.59423828125, -12.5830078125, -10.57177734375, -8.560546875, -6.54931640625, -4.5380859375, -2.52685546875, -0.515625, 1.49560546875, 3.5068359375, 5.51806640625, 7.529296875, 9.54052734375, 11.5517578125, 13.56298828125, 15.57421875, 17.58544921875, 19.5966796875, 21.60791015625, 23.619140625, 25.63037109375, 27.6416015625, 29.65283203125, 31.6640625, 33.67529296875, 35.6865234375, 37.69775390625, 39.708984375, 41.72021484375, 43.7314453125, 45.74267578125, 47.75390625, 49.76513671875, 51.7763671875, 53.78759765625, 55.798828125, 57.81005859375, 59.8212890625, 61.83251953125, 63.84375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 10.0, 11.0, 11.0, 17.0, 19.0, 14.0, 20.0, 22.0, 31.0, 24.0, 18.0, 40.0, 43.0, 35.0, 38.0, 44.0, 42.0, 35.0, 53.0, 36.0, 46.0, 31.0, 27.0, 39.0, 39.0, 26.0, 22.0, 26.0, 25.0, 12.0, 20.0, 20.0, 18.0, 11.0, 8.0, 6.0, 6.0, 7.0, 3.0, 4.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.62109375, -19.9453125, -19.26953125, -18.59375, -17.91796875, -17.2421875, -16.56640625, -15.890625, -15.21484375, -14.5390625, -13.86328125, -13.1875, -12.51171875, -11.8359375, -11.16015625, -10.484375, -9.80859375, -9.1328125, -8.45703125, -7.78125, -7.10546875, -6.4296875, -5.75390625, -5.078125, -4.40234375, -3.7265625, -3.05078125, -2.375, -1.69921875, -1.0234375, -0.34765625, 0.328125, 1.00390625, 1.6796875, 2.35546875, 3.03125, 3.70703125, 4.3828125, 5.05859375, 5.734375, 6.41015625, 7.0859375, 7.76171875, 8.4375, 9.11328125, 9.7890625, 10.46484375, 11.140625, 11.81640625, 12.4921875, 13.16796875, 13.84375, 14.51953125, 15.1953125, 15.87109375, 16.546875, 17.22265625, 17.8984375, 18.57421875, 19.25, 19.92578125, 20.6015625, 21.27734375, 21.953125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 9.0, 12.0, 15.0, 15.0, 27.0, 31.0, 48.0, 64.0, 96.0, 115.0, 174.0, 217.0, 298.0, 467.0, 659.0, 946.0, 1423.0, 2180.0, 3424.0, 5583.0, 9778.0, 18028.0, 35565.0, 80023.0, 212406.0, 767342.0, 2148176.0, 591014.0, 176447.0, 68209.0, 31489.0, 16313.0, 9131.0, 5258.0, 3290.0, 2054.0, 1314.0, 899.0, 571.0, 366.0, 262.0, 181.0, 125.0, 83.0, 60.0, 26.0, 27.0, 17.0, 9.0, 11.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-79.0, -76.76904296875, -74.5380859375, -72.30712890625, -70.076171875, -67.84521484375, -65.6142578125, -63.38330078125, -61.15234375, -58.92138671875, -56.6904296875, -54.45947265625, -52.228515625, -49.99755859375, -47.7666015625, -45.53564453125, -43.3046875, -41.07373046875, -38.8427734375, -36.61181640625, -34.380859375, -32.14990234375, -29.9189453125, -27.68798828125, -25.45703125, -23.22607421875, -20.9951171875, -18.76416015625, -16.533203125, -14.30224609375, -12.0712890625, -9.84033203125, -7.609375, -5.37841796875, -3.1474609375, -0.91650390625, 1.314453125, 3.54541015625, 5.7763671875, 8.00732421875, 10.23828125, 12.46923828125, 14.7001953125, 16.93115234375, 19.162109375, 21.39306640625, 23.6240234375, 25.85498046875, 28.0859375, 30.31689453125, 32.5478515625, 34.77880859375, 37.009765625, 39.24072265625, 41.4716796875, 43.70263671875, 45.93359375, 48.16455078125, 50.3955078125, 52.62646484375, 54.857421875, 57.08837890625, 59.3193359375, 61.55029296875, 63.78125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 9.0, 4.0, 17.0, 25.0, 18.0, 35.0, 43.0, 46.0, 74.0, 85.0, 124.0, 124.0, 169.0, 192.0, 246.0, 320.0, 367.0, 346.0, 372.0, 288.0, 207.0, 191.0, 169.0, 106.0, 80.0, 83.0, 57.0, 45.0, 51.0, 22.0, 31.0, 19.0, 9.0, 16.0, 11.0, 8.0, 10.0, 12.0, 7.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-14.4140625, -13.954833984375, -13.49560546875, -13.036376953125, -12.5771484375, -12.117919921875, -11.65869140625, -11.199462890625, -10.740234375, -10.281005859375, -9.82177734375, -9.362548828125, -8.9033203125, -8.444091796875, -7.98486328125, -7.525634765625, -7.06640625, -6.607177734375, -6.14794921875, -5.688720703125, -5.2294921875, -4.770263671875, -4.31103515625, -3.851806640625, -3.392578125, -2.933349609375, -2.47412109375, -2.014892578125, -1.5556640625, -1.096435546875, -0.63720703125, -0.177978515625, 0.28125, 0.740478515625, 1.19970703125, 1.658935546875, 2.1181640625, 2.577392578125, 3.03662109375, 3.495849609375, 3.955078125, 4.414306640625, 4.87353515625, 5.332763671875, 5.7919921875, 6.251220703125, 6.71044921875, 7.169677734375, 7.62890625, 8.088134765625, 8.54736328125, 9.006591796875, 9.4658203125, 9.925048828125, 10.38427734375, 10.843505859375, 11.302734375, 11.761962890625, 12.22119140625, 12.680419921875, 13.1396484375, 13.598876953125, 14.05810546875, 14.517333984375, 14.9765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 12.0, 8.0, 20.0, 23.0, 55.0, 79.0, 119.0, 209.0, 183.0, 107.0, 56.0, 27.0, 38.0, 17.0, 7.0, 4.0, 4.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.68571472167969, -54.830745697021484, -51.97578048706055, -49.120811462402344, -46.265846252441406, -43.4108772277832, -40.555908203125, -37.70094299316406, -34.845977783203125, -31.991010665893555, -29.136043548583984, -26.28107452392578, -23.426109313964844, -20.57114028930664, -17.71617317199707, -14.8612060546875, -12.006237030029297, -9.151269912719727, -6.296302318572998, -3.4413347244262695, -0.5863676071166992, 2.268599510192871, 5.123567581176758, 7.978534698486328, 10.833501815795898, 13.688468933105469, 16.54343605041504, 19.39840316772461, 22.253372192382812, 25.10833740234375, 27.963306427001953, 30.818273544311523, 33.673240661621094, 36.5282096862793, 39.383174896240234, 42.23814392089844, 45.093109130859375, 47.94807815551758, 50.80304718017578, 53.65801239013672, 56.512977600097656, 59.36794662475586, 62.2229118347168, 65.077880859375, 67.93284606933594, 70.78781127929688, 73.64278411865234, 76.49774932861328, 79.35272216796875, 82.20768737792969, 85.06266021728516, 87.9176254272461, 90.77259063720703, 93.62755584716797, 96.48252868652344, 99.33749389648438, 102.19245910644531, 105.04742431640625, 107.90239715576172, 110.75736236572266, 113.6123275756836, 116.46729278564453, 119.322265625, 122.17723083496094, 125.03219604492188]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 15.0, 6.0, 16.0, 11.0, 11.0, 17.0, 24.0, 27.0, 25.0, 21.0, 39.0, 26.0, 41.0, 33.0, 26.0, 37.0, 48.0, 46.0, 34.0, 49.0, 42.0, 41.0, 53.0, 35.0, 39.0, 30.0, 23.0, 25.0, 21.0, 22.0, 14.0, 18.0, 14.0, 16.0, 7.0, 7.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-31.70625114440918, -30.815082550048828, -29.923912048339844, -29.032743453979492, -28.14157485961914, -27.250404357910156, -26.359235763549805, -25.468067169189453, -24.5768985748291, -23.68572998046875, -22.794559478759766, -21.903390884399414, -21.012222290039062, -20.121051788330078, -19.229883193969727, -18.338714599609375, -17.44754409790039, -16.55637550354004, -15.665205955505371, -14.774036407470703, -13.882867813110352, -12.991698265075684, -12.100528717041016, -11.209360122680664, -10.318191528320312, -9.427021980285645, -8.535853385925293, -7.644683837890625, -6.753515243530273, -5.8623456954956055, -4.971176624298096, -4.080007553100586, -3.1888389587402344, -2.2976698875427246, -1.4065006971359253, -0.515331506729126, 0.3758375644683838, 1.2670068740844727, 2.1581759452819824, 3.049345016479492, 3.940514087677002, 4.831683158874512, 5.7228522300720215, 6.614021301269531, 7.505190849304199, 8.396360397338867, 9.287528991699219, 10.17869758605957, 11.069867134094238, 11.961036682128906, 12.852205276489258, 13.743374824523926, 14.634543418884277, 15.525712966918945, 16.416881561279297, 17.30805206298828, 18.199220657348633, 19.090389251708984, 19.98155975341797, 20.87272834777832, 21.763896942138672, 22.655067443847656, 23.546236038208008, 24.43740463256836, 25.32857322692871]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 17.0, 23.0, 36.0, 44.0, 63.0, 108.0, 139.0, 252.0, 385.0, 551.0, 933.0, 1559.0, 2570.0, 4375.0, 7614.0, 13835.0, 26590.0, 57482.0, 157478.0, 457497.0, 187022.0, 65176.0, 29522.0, 15093.0, 8402.0, 4656.0, 2775.0, 1602.0, 987.0, 604.0, 412.0, 261.0, 151.0, 122.0, 72.0, 47.0, 26.0, 19.0, 17.0, 8.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.71875, -57.8271484375, -55.935546875, -54.0439453125, -52.15234375, -50.2607421875, -48.369140625, -46.4775390625, -44.5859375, -42.6943359375, -40.802734375, -38.9111328125, -37.01953125, -35.1279296875, -33.236328125, -31.3447265625, -29.453125, -27.5615234375, -25.669921875, -23.7783203125, -21.88671875, -19.9951171875, -18.103515625, -16.2119140625, -14.3203125, -12.4287109375, -10.537109375, -8.6455078125, -6.75390625, -4.8623046875, -2.970703125, -1.0791015625, 0.8125, 2.7041015625, 4.595703125, 6.4873046875, 8.37890625, 10.2705078125, 12.162109375, 14.0537109375, 15.9453125, 17.8369140625, 19.728515625, 21.6201171875, 23.51171875, 25.4033203125, 27.294921875, 29.1865234375, 31.078125, 32.9697265625, 34.861328125, 36.7529296875, 38.64453125, 40.5361328125, 42.427734375, 44.3193359375, 46.2109375, 48.1025390625, 49.994140625, 51.8857421875, 53.77734375, 55.6689453125, 57.560546875, 59.4521484375, 61.34375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 4.0, 5.0, 7.0, 13.0, 16.0, 20.0, 23.0, 19.0, 26.0, 31.0, 28.0, 25.0, 37.0, 38.0, 42.0, 42.0, 35.0, 42.0, 32.0, 57.0, 51.0, 49.0, 44.0, 37.0, 49.0, 34.0, 31.0, 23.0, 26.0, 27.0, 21.0, 11.0, 12.0, 5.0, 9.0, 8.0, 8.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.359375, -29.418701171875, -28.47802734375, -27.537353515625, -26.5966796875, -25.656005859375, -24.71533203125, -23.774658203125, -22.833984375, -21.893310546875, -20.95263671875, -20.011962890625, -19.0712890625, -18.130615234375, -17.18994140625, -16.249267578125, -15.30859375, -14.367919921875, -13.42724609375, -12.486572265625, -11.5458984375, -10.605224609375, -9.66455078125, -8.723876953125, -7.783203125, -6.842529296875, -5.90185546875, -4.961181640625, -4.0205078125, -3.079833984375, -2.13916015625, -1.198486328125, -0.2578125, 0.682861328125, 1.62353515625, 2.564208984375, 3.5048828125, 4.445556640625, 5.38623046875, 6.326904296875, 7.267578125, 8.208251953125, 9.14892578125, 10.089599609375, 11.0302734375, 11.970947265625, 12.91162109375, 13.852294921875, 14.79296875, 15.733642578125, 16.67431640625, 17.614990234375, 18.5556640625, 19.496337890625, 20.43701171875, 21.377685546875, 22.318359375, 23.259033203125, 24.19970703125, 25.140380859375, 26.0810546875, 27.021728515625, 27.96240234375, 28.903076171875, 29.84375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 7.0, 14.0, 17.0, 21.0, 41.0, 50.0, 68.0, 100.0, 99.0, 167.0, 229.0, 279.0, 421.0, 618.0, 888.0, 1233.0, 1939.0, 3119.0, 5433.0, 10035.0, 22183.0, 70555.0, 644038.0, 212114.0, 39740.0, 15377.0, 7690.0, 4272.0, 2564.0, 1578.0, 1121.0, 694.0, 522.0, 383.0, 241.0, 208.0, 131.0, 104.0, 78.0, 46.0, 26.0, 22.0, 27.0, 17.0, 12.0, 4.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-85.4375, -82.662109375, -79.88671875, -77.111328125, -74.3359375, -71.560546875, -68.78515625, -66.009765625, -63.234375, -60.458984375, -57.68359375, -54.908203125, -52.1328125, -49.357421875, -46.58203125, -43.806640625, -41.03125, -38.255859375, -35.48046875, -32.705078125, -29.9296875, -27.154296875, -24.37890625, -21.603515625, -18.828125, -16.052734375, -13.27734375, -10.501953125, -7.7265625, -4.951171875, -2.17578125, 0.599609375, 3.375, 6.150390625, 8.92578125, 11.701171875, 14.4765625, 17.251953125, 20.02734375, 22.802734375, 25.578125, 28.353515625, 31.12890625, 33.904296875, 36.6796875, 39.455078125, 42.23046875, 45.005859375, 47.78125, 50.556640625, 53.33203125, 56.107421875, 58.8828125, 61.658203125, 64.43359375, 67.208984375, 69.984375, 72.759765625, 75.53515625, 78.310546875, 81.0859375, 83.861328125, 86.63671875, 89.412109375, 92.1875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 5.0, 11.0, 15.0, 7.0, 10.0, 23.0, 15.0, 22.0, 19.0, 17.0, 30.0, 25.0, 29.0, 31.0, 31.0, 30.0, 37.0, 33.0, 26.0, 45.0, 27.0, 27.0, 36.0, 40.0, 35.0, 28.0, 28.0, 34.0, 28.0, 24.0, 29.0, 26.0, 23.0, 23.0, 10.0, 18.0, 14.0, 13.0, 10.0, 14.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-20.9375, -20.33251953125, -19.7275390625, -19.12255859375, -18.517578125, -17.91259765625, -17.3076171875, -16.70263671875, -16.09765625, -15.49267578125, -14.8876953125, -14.28271484375, -13.677734375, -13.07275390625, -12.4677734375, -11.86279296875, -11.2578125, -10.65283203125, -10.0478515625, -9.44287109375, -8.837890625, -8.23291015625, -7.6279296875, -7.02294921875, -6.41796875, -5.81298828125, -5.2080078125, -4.60302734375, -3.998046875, -3.39306640625, -2.7880859375, -2.18310546875, -1.578125, -0.97314453125, -0.3681640625, 0.23681640625, 0.841796875, 1.44677734375, 2.0517578125, 2.65673828125, 3.26171875, 3.86669921875, 4.4716796875, 5.07666015625, 5.681640625, 6.28662109375, 6.8916015625, 7.49658203125, 8.1015625, 8.70654296875, 9.3115234375, 9.91650390625, 10.521484375, 11.12646484375, 11.7314453125, 12.33642578125, 12.94140625, 13.54638671875, 14.1513671875, 14.75634765625, 15.361328125, 15.96630859375, 16.5712890625, 17.17626953125, 17.78125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 9.0, 17.0, 18.0, 39.0, 48.0, 49.0, 54.0, 103.0, 122.0, 178.0, 247.0, 320.0, 436.0, 635.0, 838.0, 1117.0, 1665.0, 2446.0, 3448.0, 5433.0, 8652.0, 14912.0, 28925.0, 72888.0, 536440.0, 256604.0, 53778.0, 23644.0, 12552.0, 7432.0, 4686.0, 3139.0, 2155.0, 1553.0, 1051.0, 780.0, 545.0, 428.0, 330.0, 252.0, 158.0, 121.0, 91.0, 62.0, 52.0, 28.0, 18.0, 22.0, 10.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-39.25, -38.01806640625, -36.7861328125, -35.55419921875, -34.322265625, -33.09033203125, -31.8583984375, -30.62646484375, -29.39453125, -28.16259765625, -26.9306640625, -25.69873046875, -24.466796875, -23.23486328125, -22.0029296875, -20.77099609375, -19.5390625, -18.30712890625, -17.0751953125, -15.84326171875, -14.611328125, -13.37939453125, -12.1474609375, -10.91552734375, -9.68359375, -8.45166015625, -7.2197265625, -5.98779296875, -4.755859375, -3.52392578125, -2.2919921875, -1.06005859375, 0.171875, 1.40380859375, 2.6357421875, 3.86767578125, 5.099609375, 6.33154296875, 7.5634765625, 8.79541015625, 10.02734375, 11.25927734375, 12.4912109375, 13.72314453125, 14.955078125, 16.18701171875, 17.4189453125, 18.65087890625, 19.8828125, 21.11474609375, 22.3466796875, 23.57861328125, 24.810546875, 26.04248046875, 27.2744140625, 28.50634765625, 29.73828125, 30.97021484375, 32.2021484375, 33.43408203125, 34.666015625, 35.89794921875, 37.1298828125, 38.36181640625, 39.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 8.0, 7.0, 17.0, 20.0, 36.0, 38.0, 61.0, 79.0, 90.0, 112.0, 128.0, 130.0, 75.0, 72.0, 41.0, 30.0, 19.0, 14.0, 12.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019292831420898438, -0.001861080527305603, -0.0017928779125213623, -0.0017246752977371216, -0.0016564726829528809, -0.0015882700681686401, -0.0015200674533843994, -0.0014518648386001587, -0.001383662223815918, -0.0013154596090316772, -0.0012472569942474365, -0.0011790543794631958, -0.001110851764678955, -0.0010426491498947144, -0.0009744465351104736, -0.0009062439203262329, -0.0008380413055419922, -0.0007698386907577515, -0.0007016360759735107, -0.00063343346118927, -0.0005652308464050293, -0.0004970282316207886, -0.00042882561683654785, -0.00036062300205230713, -0.0002924203872680664, -0.00022421777248382568, -0.00015601515769958496, -8.781254291534424e-05, -1.9609928131103516e-05, 4.859268665313721e-05, 0.00011679530143737793, 0.00018499791622161865, 0.0002532005310058594, 0.0003214031457901001, 0.0003896057605743408, 0.00045780837535858154, 0.0005260109901428223, 0.000594213604927063, 0.0006624162197113037, 0.0007306188344955444, 0.0007988214492797852, 0.0008670240640640259, 0.0009352266788482666, 0.0010034292936325073, 0.001071631908416748, 0.0011398345232009888, 0.0012080371379852295, 0.0012762397527694702, 0.001344442367553711, 0.0014126449823379517, 0.0014808475971221924, 0.001549050211906433, 0.0016172528266906738, 0.0016854554414749146, 0.0017536580562591553, 0.001821860671043396, 0.0018900632858276367, 0.0019582659006118774, 0.002026468515396118, 0.002094671130180359, 0.0021628737449645996, 0.0022310763597488403, 0.002299278974533081, 0.0023674815893173218, 0.0024356842041015625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 4.0, 8.0, 13.0, 25.0, 26.0, 45.0, 52.0, 89.0, 175.0, 227.0, 319.0, 493.0, 851.0, 1307.0, 2371.0, 4281.0, 8390.0, 17958.0, 43559.0, 130162.0, 511814.0, 214690.0, 63328.0, 24724.0, 11055.0, 5461.0, 2843.0, 1611.0, 922.0, 597.0, 381.0, 244.0, 160.0, 136.0, 55.0, 68.0, 29.0, 25.0, 15.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.443359375, -33.19921875, -31.955078125, -30.7109375, -29.466796875, -28.22265625, -26.978515625, -25.734375, -24.490234375, -23.24609375, -22.001953125, -20.7578125, -19.513671875, -18.26953125, -17.025390625, -15.78125, -14.537109375, -13.29296875, -12.048828125, -10.8046875, -9.560546875, -8.31640625, -7.072265625, -5.828125, -4.583984375, -3.33984375, -2.095703125, -0.8515625, 0.392578125, 1.63671875, 2.880859375, 4.125, 5.369140625, 6.61328125, 7.857421875, 9.1015625, 10.345703125, 11.58984375, 12.833984375, 14.078125, 15.322265625, 16.56640625, 17.810546875, 19.0546875, 20.298828125, 21.54296875, 22.787109375, 24.03125, 25.275390625, 26.51953125, 27.763671875, 29.0078125, 30.251953125, 31.49609375, 32.740234375, 33.984375, 35.228515625, 36.47265625, 37.716796875, 38.9609375, 40.205078125, 41.44921875, 42.693359375, 43.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 10.0, 12.0, 20.0, 16.0, 27.0, 34.0, 51.0, 63.0, 70.0, 76.0, 78.0, 104.0, 88.0, 71.0, 58.0, 49.0, 43.0, 29.0, 25.0, 13.0, 17.0, 7.0, 3.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.73553466796875, -8.4866943359375, -8.23785400390625, -7.989013671875, -7.74017333984375, -7.4913330078125, -7.24249267578125, -6.99365234375, -6.74481201171875, -6.4959716796875, -6.24713134765625, -5.998291015625, -5.74945068359375, -5.5006103515625, -5.25177001953125, -5.0029296875, -4.75408935546875, -4.5052490234375, -4.25640869140625, -4.007568359375, -3.75872802734375, -3.5098876953125, -3.26104736328125, -3.01220703125, -2.76336669921875, -2.5145263671875, -2.26568603515625, -2.016845703125, -1.76800537109375, -1.5191650390625, -1.27032470703125, -1.021484375, -0.77264404296875, -0.5238037109375, -0.27496337890625, -0.026123046875, 0.22271728515625, 0.4715576171875, 0.72039794921875, 0.96923828125, 1.21807861328125, 1.4669189453125, 1.71575927734375, 1.964599609375, 2.21343994140625, 2.4622802734375, 2.71112060546875, 2.9599609375, 3.20880126953125, 3.4576416015625, 3.70648193359375, 3.955322265625, 4.20416259765625, 4.4530029296875, 4.70184326171875, 4.95068359375, 5.19952392578125, 5.4483642578125, 5.69720458984375, 5.946044921875, 6.19488525390625, 6.4437255859375, 6.69256591796875, 6.94140625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 2.0, 8.0, 6.0, 15.0, 12.0, 17.0, 49.0, 51.0, 92.0, 161.0, 199.0, 144.0, 78.0, 48.0, 36.0, 23.0, 17.0, 6.0, 6.0, 4.0, 6.0, 9.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84046936035156, -50.256866455078125, -47.67326354980469, -45.08966064453125, -42.50605773925781, -39.922454833984375, -37.33885192871094, -34.7552490234375, -32.17164611816406, -29.588043212890625, -27.004440307617188, -24.42083740234375, -21.837234497070312, -19.253631591796875, -16.670028686523438, -14.08642578125, -11.502822875976562, -8.919219970703125, -6.3356170654296875, -3.75201416015625, -1.1684112548828125, 1.415191650390625, 3.9987945556640625, 6.5823974609375, 9.166000366210938, 11.749603271484375, 14.333206176757812, 16.91680908203125, 19.500411987304688, 22.084014892578125, 24.667617797851562, 27.251220703125, 29.834823608398438, 32.418426513671875, 35.00202941894531, 37.58563232421875, 40.16923522949219, 42.752838134765625, 45.33644104003906, 47.9200439453125, 50.50364685058594, 53.087249755859375, 55.67085266113281, 58.25445556640625, 60.83805847167969, 63.421661376953125, 66.00526428222656, 68.5888671875, 71.17247009277344, 73.75607299804688, 76.33967590332031, 78.92327880859375, 81.50688171386719, 84.09048461914062, 86.67408752441406, 89.2576904296875, 91.84129333496094, 94.42489624023438, 97.00849914550781, 99.59210205078125, 102.17570495605469, 104.75930786132812, 107.34291076660156, 109.926513671875, 112.51011657714844]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 7.0, 12.0, 14.0, 12.0, 17.0, 20.0, 23.0, 20.0, 27.0, 20.0, 33.0, 43.0, 36.0, 33.0, 40.0, 30.0, 41.0, 38.0, 45.0, 39.0, 43.0, 44.0, 36.0, 36.0, 33.0, 31.0, 39.0, 22.0, 18.0, 20.0, 23.0, 12.0, 12.0, 14.0, 9.0, 8.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.143213272094727, -27.320280075073242, -26.497346878051758, -25.674413681030273, -24.85148048400879, -24.028547286987305, -23.20561408996582, -22.382680892944336, -21.55974769592285, -20.736814498901367, -19.913881301879883, -19.0909481048584, -18.268014907836914, -17.44508171081543, -16.622148513793945, -15.799215316772461, -14.97628116607666, -14.153347969055176, -13.330414772033691, -12.507481575012207, -11.684548377990723, -10.861614227294922, -10.038681030273438, -9.215747833251953, -8.392814636230469, -7.569881439208984, -6.7469482421875, -5.924015045166016, -5.101081848144531, -4.278148174285889, -3.4552149772644043, -2.63228178024292, -1.8093490600585938, -0.9864158034324646, -0.16348254680633545, 0.6594507694244385, 1.4823839664459229, 2.3053174018859863, 3.1282505989074707, 3.951183795928955, 4.7741169929504395, 5.597050189971924, 6.419983386993408, 7.242917060852051, 8.065850257873535, 8.88878345489502, 9.711716651916504, 10.534649848937988, 11.357583045959473, 12.180516242980957, 13.003449440002441, 13.826382637023926, 14.64931583404541, 15.472249984741211, 16.295183181762695, 17.11811637878418, 17.941049575805664, 18.76398277282715, 19.586915969848633, 20.409849166870117, 21.2327823638916, 22.055715560913086, 22.87864875793457, 23.701581954956055, 24.52451515197754]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 14.0, 11.0, 27.0, 41.0, 46.0, 83.0, 135.0, 221.0, 331.0, 523.0, 802.0, 1351.0, 2189.0, 3673.0, 5872.0, 9776.0, 16654.0, 28712.0, 50494.0, 91479.0, 164644.0, 235453.0, 188206.0, 107567.0, 59347.0, 33417.0, 19026.0, 11341.0, 6527.0, 3967.0, 2455.0, 1572.0, 1003.0, 581.0, 366.0, 216.0, 141.0, 124.0, 59.0, 40.0, 24.0, 16.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -50.0732421875, -48.490234375, -46.9072265625, -45.32421875, -43.7412109375, -42.158203125, -40.5751953125, -38.9921875, -37.4091796875, -35.826171875, -34.2431640625, -32.66015625, -31.0771484375, -29.494140625, -27.9111328125, -26.328125, -24.7451171875, -23.162109375, -21.5791015625, -19.99609375, -18.4130859375, -16.830078125, -15.2470703125, -13.6640625, -12.0810546875, -10.498046875, -8.9150390625, -7.33203125, -5.7490234375, -4.166015625, -2.5830078125, -1.0, 0.5830078125, 2.166015625, 3.7490234375, 5.33203125, 6.9150390625, 8.498046875, 10.0810546875, 11.6640625, 13.2470703125, 14.830078125, 16.4130859375, 17.99609375, 19.5791015625, 21.162109375, 22.7451171875, 24.328125, 25.9111328125, 27.494140625, 29.0771484375, 30.66015625, 32.2431640625, 33.826171875, 35.4091796875, 36.9921875, 38.5751953125, 40.158203125, 41.7412109375, 43.32421875, 44.9072265625, 46.490234375, 48.0732421875, 49.65625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 9.0, 7.0, 9.0, 12.0, 15.0, 8.0, 14.0, 21.0, 24.0, 25.0, 33.0, 43.0, 44.0, 32.0, 31.0, 46.0, 42.0, 52.0, 49.0, 48.0, 53.0, 47.0, 41.0, 40.0, 40.0, 27.0, 34.0, 27.0, 19.0, 28.0, 19.0, 17.0, 7.0, 11.0, 3.0, 13.0, 2.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4375, -32.519287109375, -31.60107421875, -30.682861328125, -29.7646484375, -28.846435546875, -27.92822265625, -27.010009765625, -26.091796875, -25.173583984375, -24.25537109375, -23.337158203125, -22.4189453125, -21.500732421875, -20.58251953125, -19.664306640625, -18.74609375, -17.827880859375, -16.90966796875, -15.991455078125, -15.0732421875, -14.155029296875, -13.23681640625, -12.318603515625, -11.400390625, -10.482177734375, -9.56396484375, -8.645751953125, -7.7275390625, -6.809326171875, -5.89111328125, -4.972900390625, -4.0546875, -3.136474609375, -2.21826171875, -1.300048828125, -0.3818359375, 0.536376953125, 1.45458984375, 2.372802734375, 3.291015625, 4.209228515625, 5.12744140625, 6.045654296875, 6.9638671875, 7.882080078125, 8.80029296875, 9.718505859375, 10.63671875, 11.554931640625, 12.47314453125, 13.391357421875, 14.3095703125, 15.227783203125, 16.14599609375, 17.064208984375, 17.982421875, 18.900634765625, 19.81884765625, 20.737060546875, 21.6552734375, 22.573486328125, 23.49169921875, 24.409912109375, 25.328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 3.0, 7.0, 7.0, 8.0, 9.0, 22.0, 28.0, 29.0, 52.0, 71.0, 103.0, 153.0, 214.0, 310.0, 475.0, 651.0, 1073.0, 1600.0, 2713.0, 4328.0, 7326.0, 12918.0, 24339.0, 47402.0, 103244.0, 239646.0, 319636.0, 144164.0, 65534.0, 31991.0, 16775.0, 9330.0, 5404.0, 3154.0, 1994.0, 1308.0, 826.0, 551.0, 385.0, 237.0, 164.0, 120.0, 84.0, 57.0, 31.0, 27.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-66.0625, -64.13134765625, -62.2001953125, -60.26904296875, -58.337890625, -56.40673828125, -54.4755859375, -52.54443359375, -50.61328125, -48.68212890625, -46.7509765625, -44.81982421875, -42.888671875, -40.95751953125, -39.0263671875, -37.09521484375, -35.1640625, -33.23291015625, -31.3017578125, -29.37060546875, -27.439453125, -25.50830078125, -23.5771484375, -21.64599609375, -19.71484375, -17.78369140625, -15.8525390625, -13.92138671875, -11.990234375, -10.05908203125, -8.1279296875, -6.19677734375, -4.265625, -2.33447265625, -0.4033203125, 1.52783203125, 3.458984375, 5.39013671875, 7.3212890625, 9.25244140625, 11.18359375, 13.11474609375, 15.0458984375, 16.97705078125, 18.908203125, 20.83935546875, 22.7705078125, 24.70166015625, 26.6328125, 28.56396484375, 30.4951171875, 32.42626953125, 34.357421875, 36.28857421875, 38.2197265625, 40.15087890625, 42.08203125, 44.01318359375, 45.9443359375, 47.87548828125, 49.806640625, 51.73779296875, 53.6689453125, 55.60009765625, 57.53125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 4.0, 4.0, 6.0, 16.0, 14.0, 12.0, 22.0, 23.0, 26.0, 24.0, 25.0, 28.0, 37.0, 31.0, 35.0, 44.0, 30.0, 42.0, 41.0, 40.0, 29.0, 35.0, 36.0, 39.0, 35.0, 37.0, 37.0, 36.0, 29.0, 24.0, 18.0, 16.0, 22.0, 6.0, 20.0, 11.0, 7.0, 11.0, 9.0, 7.0, 10.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.125, -17.478759765625, -16.83251953125, -16.186279296875, -15.5400390625, -14.893798828125, -14.24755859375, -13.601318359375, -12.955078125, -12.308837890625, -11.66259765625, -11.016357421875, -10.3701171875, -9.723876953125, -9.07763671875, -8.431396484375, -7.78515625, -7.138916015625, -6.49267578125, -5.846435546875, -5.2001953125, -4.553955078125, -3.90771484375, -3.261474609375, -2.615234375, -1.968994140625, -1.32275390625, -0.676513671875, -0.0302734375, 0.615966796875, 1.26220703125, 1.908447265625, 2.5546875, 3.200927734375, 3.84716796875, 4.493408203125, 5.1396484375, 5.785888671875, 6.43212890625, 7.078369140625, 7.724609375, 8.370849609375, 9.01708984375, 9.663330078125, 10.3095703125, 10.955810546875, 11.60205078125, 12.248291015625, 12.89453125, 13.540771484375, 14.18701171875, 14.833251953125, 15.4794921875, 16.125732421875, 16.77197265625, 17.418212890625, 18.064453125, 18.710693359375, 19.35693359375, 20.003173828125, 20.6494140625, 21.295654296875, 21.94189453125, 22.588134765625, 23.234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 10.0, 16.0, 17.0, 28.0, 45.0, 51.0, 80.0, 143.0, 217.0, 385.0, 688.0, 1398.0, 3317.0, 9706.0, 38262.0, 613080.0, 335265.0, 31645.0, 8290.0, 3048.0, 1250.0, 664.0, 315.0, 200.0, 140.0, 88.0, 55.0, 37.0, 27.0, 21.0, 20.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.5, -282.60546875, -271.7109375, -260.81640625, -249.921875, -239.02734375, -228.1328125, -217.23828125, -206.34375, -195.44921875, -184.5546875, -173.66015625, -162.765625, -151.87109375, -140.9765625, -130.08203125, -119.1875, -108.29296875, -97.3984375, -86.50390625, -75.609375, -64.71484375, -53.8203125, -42.92578125, -32.03125, -21.13671875, -10.2421875, 0.65234375, 11.546875, 22.44140625, 33.3359375, 44.23046875, 55.125, 66.01953125, 76.9140625, 87.80859375, 98.703125, 109.59765625, 120.4921875, 131.38671875, 142.28125, 153.17578125, 164.0703125, 174.96484375, 185.859375, 196.75390625, 207.6484375, 218.54296875, 229.4375, 240.33203125, 251.2265625, 262.12109375, 273.015625, 283.91015625, 294.8046875, 305.69921875, 316.59375, 327.48828125, 338.3828125, 349.27734375, 360.171875, 371.06640625, 381.9609375, 392.85546875, 403.75]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 10.0, 26.0, 35.0, 47.0, 80.0, 83.0, 141.0, 179.0, 133.0, 83.0, 55.0, 31.0, 30.0, 16.0, 6.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.008209228515625, -0.007918477058410645, -0.007627725601196289, -0.007336974143981934, -0.007046222686767578, -0.006755471229553223, -0.006464719772338867, -0.006173968315124512, -0.005883216857910156, -0.005592465400695801, -0.005301713943481445, -0.00501096248626709, -0.004720211029052734, -0.004429459571838379, -0.0041387081146240234, -0.003847956657409668, -0.0035572052001953125, -0.003266453742980957, -0.0029757022857666016, -0.002684950828552246, -0.0023941993713378906, -0.002103447914123535, -0.0018126964569091797, -0.0015219449996948242, -0.0012311935424804688, -0.0009404420852661133, -0.0006496906280517578, -0.00035893917083740234, -6.818771362304688e-05, 0.0002225637435913086, 0.0005133152008056641, 0.0008040666580200195, 0.001094818115234375, 0.0013855695724487305, 0.001676321029663086, 0.0019670724868774414, 0.002257823944091797, 0.0025485754013061523, 0.002839326858520508, 0.0031300783157348633, 0.0034208297729492188, 0.0037115812301635742, 0.00400233268737793, 0.004293084144592285, 0.004583835601806641, 0.004874587059020996, 0.0051653385162353516, 0.005456089973449707, 0.0057468414306640625, 0.006037592887878418, 0.0063283443450927734, 0.006619095802307129, 0.006909847259521484, 0.00720059871673584, 0.007491350173950195, 0.007782101631164551, 0.008072853088378906, 0.008363604545593262, 0.008654356002807617, 0.008945107460021973, 0.009235858917236328, 0.009526610374450684, 0.009817361831665039, 0.010108113288879395, 0.01039886474609375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 8.0, 18.0, 13.0, 32.0, 36.0, 45.0, 60.0, 80.0, 102.0, 151.0, 246.0, 372.0, 586.0, 1006.0, 1940.0, 4630.0, 13910.0, 74563.0, 822857.0, 100777.0, 16826.0, 5124.0, 2208.0, 1093.0, 630.0, 377.0, 261.0, 159.0, 117.0, 78.0, 67.0, 50.0, 43.0, 12.0, 18.0, 16.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-335.25, -325.26171875, -315.2734375, -305.28515625, -295.296875, -285.30859375, -275.3203125, -265.33203125, -255.34375, -245.35546875, -235.3671875, -225.37890625, -215.390625, -205.40234375, -195.4140625, -185.42578125, -175.4375, -165.44921875, -155.4609375, -145.47265625, -135.484375, -125.49609375, -115.5078125, -105.51953125, -95.53125, -85.54296875, -75.5546875, -65.56640625, -55.578125, -45.58984375, -35.6015625, -25.61328125, -15.625, -5.63671875, 4.3515625, 14.33984375, 24.328125, 34.31640625, 44.3046875, 54.29296875, 64.28125, 74.26953125, 84.2578125, 94.24609375, 104.234375, 114.22265625, 124.2109375, 134.19921875, 144.1875, 154.17578125, 164.1640625, 174.15234375, 184.140625, 194.12890625, 204.1171875, 214.10546875, 224.09375, 234.08203125, 244.0703125, 254.05859375, 264.046875, 274.03515625, 284.0234375, 294.01171875, 304.0]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 5.0, 1.0, 7.0, 10.0, 19.0, 38.0, 55.0, 92.0, 119.0, 146.0, 144.0, 139.0, 79.0, 46.0, 45.0, 12.0, 17.0, 4.0, 8.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6875, -57.6943359375, -55.701171875, -53.7080078125, -51.71484375, -49.7216796875, -47.728515625, -45.7353515625, -43.7421875, -41.7490234375, -39.755859375, -37.7626953125, -35.76953125, -33.7763671875, -31.783203125, -29.7900390625, -27.796875, -25.8037109375, -23.810546875, -21.8173828125, -19.82421875, -17.8310546875, -15.837890625, -13.8447265625, -11.8515625, -9.8583984375, -7.865234375, -5.8720703125, -3.87890625, -1.8857421875, 0.107421875, 2.1005859375, 4.09375, 6.0869140625, 8.080078125, 10.0732421875, 12.06640625, 14.0595703125, 16.052734375, 18.0458984375, 20.0390625, 22.0322265625, 24.025390625, 26.0185546875, 28.01171875, 30.0048828125, 31.998046875, 33.9912109375, 35.984375, 37.9775390625, 39.970703125, 41.9638671875, 43.95703125, 45.9501953125, 47.943359375, 49.9365234375, 51.9296875, 53.9228515625, 55.916015625, 57.9091796875, 59.90234375, 61.8955078125, 63.888671875, 65.8818359375, 67.875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 19.0, 41.0, 55.0, 107.0, 155.0, 200.0, 103.0, 74.0, 46.0, 30.0, 27.0, 17.0, 18.0, 15.0, 9.0, 16.0, 5.0, 4.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.27420425415039, -33.833919525146484, -31.393634796142578, -28.953350067138672, -26.513065338134766, -24.07278060913086, -21.63249397277832, -19.192209243774414, -16.751924514770508, -14.311639785766602, -11.871355056762695, -9.431069374084473, -6.990784645080566, -4.55049991607666, -2.1102142333984375, 0.33007049560546875, 2.770355224609375, 5.210639953613281, 7.650925159454346, 10.09121036529541, 12.531495094299316, 14.971779823303223, 17.412065505981445, 19.85235023498535, 22.292634963989258, 24.732919692993164, 27.17320442199707, 29.61349105834961, 32.053775787353516, 34.49406051635742, 36.93434524536133, 39.374629974365234, 41.814918518066406, 44.25520324707031, 46.69548797607422, 49.135772705078125, 51.57605743408203, 54.01634216308594, 56.456626892089844, 58.89691162109375, 61.337196350097656, 63.77748107910156, 66.21776580810547, 68.65805053710938, 71.09833526611328, 73.53861999511719, 75.9789047241211, 78.419189453125, 80.85948181152344, 83.29976654052734, 85.74005126953125, 88.18033599853516, 90.62062072753906, 93.06090545654297, 95.50119018554688, 97.94147491455078, 100.38175964355469, 102.8220443725586, 105.2623291015625, 107.7026138305664, 110.14289855957031, 112.58318328857422, 115.02346801757812, 117.46375274658203, 119.90403747558594]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 1.0, 6.0, 5.0, 10.0, 6.0, 6.0, 14.0, 8.0, 16.0, 23.0, 17.0, 25.0, 17.0, 31.0, 25.0, 35.0, 26.0, 43.0, 38.0, 27.0, 40.0, 42.0, 39.0, 42.0, 43.0, 52.0, 37.0, 37.0, 31.0, 40.0, 28.0, 26.0, 24.0, 17.0, 22.0, 27.0, 25.0, 4.0, 10.0, 9.0, 5.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.479450225830078, -29.516387939453125, -28.553325653076172, -27.59026527404785, -26.6272029876709, -25.664140701293945, -24.701078414916992, -23.738018035888672, -22.77495574951172, -21.811893463134766, -20.848831176757812, -19.885770797729492, -18.92270851135254, -17.959646224975586, -16.996583938598633, -16.033523559570312, -15.070460319519043, -14.10739803314209, -13.144336700439453, -12.1812744140625, -11.218213081359863, -10.25515079498291, -9.292089462280273, -8.32902717590332, -7.365965366363525, -6.4029035568237305, -5.4398417472839355, -4.476779937744141, -3.5137178897857666, -2.5506558418273926, -1.5875940322875977, -0.6245322227478027, 0.3385295867919922, 1.301591396331787, 2.264653205871582, 3.227715253829956, 4.190776824951172, 5.153839111328125, 6.11690092086792, 7.079962730407715, 8.043024063110352, 9.006086349487305, 9.969147682189941, 10.932209968566895, 11.895271301269531, 12.858333587646484, 13.821395874023438, 14.784457206726074, 15.747519493103027, 16.710580825805664, 17.673643112182617, 18.63670539855957, 19.599767684936523, 20.562828063964844, 21.525890350341797, 22.48895263671875, 23.452014923095703, 24.415077209472656, 25.37813949584961, 26.34119987487793, 27.304262161254883, 28.267324447631836, 29.23038673400879, 30.19344711303711, 31.156509399414062]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 8.0, 3.0, 8.0, 13.0, 27.0, 35.0, 43.0, 62.0, 85.0, 98.0, 164.0, 266.0, 343.0, 518.0, 800.0, 1145.0, 1723.0, 2627.0, 4143.0, 6510.0, 10540.0, 17598.0, 31060.0, 57714.0, 120320.0, 325144.0, 1540298.0, 1486963.0, 332009.0, 121585.0, 57800.0, 30675.0, 17261.0, 10165.0, 6088.0, 3818.0, 2304.0, 1476.0, 1045.0, 641.0, 416.0, 254.0, 179.0, 103.0, 71.0, 47.0, 28.0, 23.0, 23.0, 10.0, 9.0, 1.0, 0.0, 1.0], "bins": [-57.0, -55.458984375, -53.91796875, -52.376953125, -50.8359375, -49.294921875, -47.75390625, -46.212890625, -44.671875, -43.130859375, -41.58984375, -40.048828125, -38.5078125, -36.966796875, -35.42578125, -33.884765625, -32.34375, -30.802734375, -29.26171875, -27.720703125, -26.1796875, -24.638671875, -23.09765625, -21.556640625, -20.015625, -18.474609375, -16.93359375, -15.392578125, -13.8515625, -12.310546875, -10.76953125, -9.228515625, -7.6875, -6.146484375, -4.60546875, -3.064453125, -1.5234375, 0.017578125, 1.55859375, 3.099609375, 4.640625, 6.181640625, 7.72265625, 9.263671875, 10.8046875, 12.345703125, 13.88671875, 15.427734375, 16.96875, 18.509765625, 20.05078125, 21.591796875, 23.1328125, 24.673828125, 26.21484375, 27.755859375, 29.296875, 30.837890625, 32.37890625, 33.919921875, 35.4609375, 37.001953125, 38.54296875, 40.083984375, 41.625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 8.0, 4.0, 7.0, 9.0, 19.0, 9.0, 10.0, 17.0, 12.0, 23.0, 28.0, 33.0, 32.0, 29.0, 39.0, 36.0, 40.0, 45.0, 39.0, 44.0, 50.0, 38.0, 36.0, 40.0, 37.0, 45.0, 34.0, 35.0, 28.0, 32.0, 26.0, 13.0, 18.0, 13.0, 15.0, 17.0, 7.0, 6.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.78125, -18.24462890625, -17.7080078125, -17.17138671875, -16.634765625, -16.09814453125, -15.5615234375, -15.02490234375, -14.48828125, -13.95166015625, -13.4150390625, -12.87841796875, -12.341796875, -11.80517578125, -11.2685546875, -10.73193359375, -10.1953125, -9.65869140625, -9.1220703125, -8.58544921875, -8.048828125, -7.51220703125, -6.9755859375, -6.43896484375, -5.90234375, -5.36572265625, -4.8291015625, -4.29248046875, -3.755859375, -3.21923828125, -2.6826171875, -2.14599609375, -1.609375, -1.07275390625, -0.5361328125, 0.00048828125, 0.537109375, 1.07373046875, 1.6103515625, 2.14697265625, 2.68359375, 3.22021484375, 3.7568359375, 4.29345703125, 4.830078125, 5.36669921875, 5.9033203125, 6.43994140625, 6.9765625, 7.51318359375, 8.0498046875, 8.58642578125, 9.123046875, 9.65966796875, 10.1962890625, 10.73291015625, 11.26953125, 11.80615234375, 12.3427734375, 12.87939453125, 13.416015625, 13.95263671875, 14.4892578125, 15.02587890625, 15.5625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 6.0, 20.0, 33.0, 33.0, 44.0, 61.0, 85.0, 149.0, 204.0, 314.0, 472.0, 790.0, 1255.0, 2123.0, 3717.0, 6825.0, 13618.0, 29629.0, 74860.0, 246439.0, 1425632.0, 1932050.0, 301615.0, 87498.0, 33599.0, 15351.0, 7676.0, 4119.0, 2340.0, 1381.0, 851.0, 534.0, 352.0, 202.0, 135.0, 85.0, 55.0, 33.0, 36.0, 11.0, 11.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-65.5, -63.57763671875, -61.6552734375, -59.73291015625, -57.810546875, -55.88818359375, -53.9658203125, -52.04345703125, -50.12109375, -48.19873046875, -46.2763671875, -44.35400390625, -42.431640625, -40.50927734375, -38.5869140625, -36.66455078125, -34.7421875, -32.81982421875, -30.8974609375, -28.97509765625, -27.052734375, -25.13037109375, -23.2080078125, -21.28564453125, -19.36328125, -17.44091796875, -15.5185546875, -13.59619140625, -11.673828125, -9.75146484375, -7.8291015625, -5.90673828125, -3.984375, -2.06201171875, -0.1396484375, 1.78271484375, 3.705078125, 5.62744140625, 7.5498046875, 9.47216796875, 11.39453125, 13.31689453125, 15.2392578125, 17.16162109375, 19.083984375, 21.00634765625, 22.9287109375, 24.85107421875, 26.7734375, 28.69580078125, 30.6181640625, 32.54052734375, 34.462890625, 36.38525390625, 38.3076171875, 40.22998046875, 42.15234375, 44.07470703125, 45.9970703125, 47.91943359375, 49.841796875, 51.76416015625, 53.6865234375, 55.60888671875, 57.53125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 8.0, 11.0, 11.0, 23.0, 29.0, 37.0, 63.0, 66.0, 96.0, 131.0, 164.0, 220.0, 250.0, 337.0, 412.0, 410.0, 405.0, 303.0, 210.0, 195.0, 134.0, 104.0, 80.0, 70.0, 51.0, 48.0, 32.0, 26.0, 25.0, 12.0, 21.0, 16.0, 14.0, 3.0, 6.0, 8.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.6640625, -10.301513671875, -9.93896484375, -9.576416015625, -9.2138671875, -8.851318359375, -8.48876953125, -8.126220703125, -7.763671875, -7.401123046875, -7.03857421875, -6.676025390625, -6.3134765625, -5.950927734375, -5.58837890625, -5.225830078125, -4.86328125, -4.500732421875, -4.13818359375, -3.775634765625, -3.4130859375, -3.050537109375, -2.68798828125, -2.325439453125, -1.962890625, -1.600341796875, -1.23779296875, -0.875244140625, -0.5126953125, -0.150146484375, 0.21240234375, 0.574951171875, 0.9375, 1.300048828125, 1.66259765625, 2.025146484375, 2.3876953125, 2.750244140625, 3.11279296875, 3.475341796875, 3.837890625, 4.200439453125, 4.56298828125, 4.925537109375, 5.2880859375, 5.650634765625, 6.01318359375, 6.375732421875, 6.73828125, 7.100830078125, 7.46337890625, 7.825927734375, 8.1884765625, 8.551025390625, 8.91357421875, 9.276123046875, 9.638671875, 10.001220703125, 10.36376953125, 10.726318359375, 11.0888671875, 11.451416015625, 11.81396484375, 12.176513671875, 12.5390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 2.0, 14.0, 11.0, 19.0, 36.0, 49.0, 62.0, 129.0, 202.0, 201.0, 85.0, 55.0, 38.0, 21.0, 23.0, 12.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.578548431396484, -49.67729568481445, -47.776039123535156, -45.874786376953125, -43.973533630371094, -42.07228088378906, -40.171024322509766, -38.269771575927734, -36.36851501464844, -34.467262268066406, -32.56600570678711, -30.664752960205078, -28.763500213623047, -26.862245559692383, -24.96099090576172, -23.059738159179688, -21.158485412597656, -19.257230758666992, -17.35597801208496, -15.454723358154297, -13.55346965789795, -11.652215957641602, -9.750961303710938, -7.84970760345459, -5.948453903198242, -4.0472002029418945, -2.1459460258483887, -0.2446918487548828, 1.6565618515014648, 3.5578155517578125, 5.459070205688477, 7.360323905944824, 9.261581420898438, 11.162835121154785, 13.064088821411133, 14.965343475341797, 16.866596221923828, 18.767850875854492, 20.669105529785156, 22.570358276367188, 24.47161293029785, 26.372867584228516, 28.274120330810547, 30.17537498474121, 32.076629638671875, 33.977882385253906, 35.87913513183594, 37.780391693115234, 39.681644439697266, 41.5828971862793, 43.484153747558594, 45.385406494140625, 47.286659240722656, 49.18791198730469, 51.089168548583984, 52.990421295166016, 54.89167785644531, 56.792930603027344, 58.69418716430664, 60.59543991088867, 62.4966926574707, 64.39794921875, 66.29920196533203, 68.20045471191406, 70.1017074584961]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 11.0, 5.0, 13.0, 21.0, 19.0, 8.0, 16.0, 20.0, 20.0, 17.0, 28.0, 30.0, 18.0, 31.0, 40.0, 28.0, 34.0, 25.0, 33.0, 38.0, 36.0, 41.0, 37.0, 37.0, 28.0, 27.0, 28.0, 30.0, 27.0, 26.0, 24.0, 18.0, 23.0, 25.0, 14.0, 11.0, 18.0, 11.0, 10.0, 12.0, 7.0, 5.0, 7.0, 8.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.62067413330078, -16.076560974121094, -15.532445907592773, -14.988332748413086, -14.444218635559082, -13.900104522705078, -13.355990409851074, -12.81187629699707, -12.267763137817383, -11.723649024963379, -11.179534912109375, -10.635421752929688, -10.091307640075684, -9.54719352722168, -9.003079414367676, -8.458965301513672, -7.914851188659668, -7.370737075805664, -6.826623439788818, -6.2825093269348145, -5.738395690917969, -5.194281578063965, -4.650167465209961, -4.106053352355957, -3.5619397163391113, -3.0178258419036865, -2.4737119674682617, -1.9295978546142578, -1.385483980178833, -0.8413701057434082, -0.2972559928894043, 0.2468578815460205, 0.7909717559814453, 1.3350856304168701, 1.8791996240615845, 2.423313617706299, 2.9674274921417236, 3.5115413665771484, 4.055655479431152, 4.599769592285156, 5.143883228302002, 5.687997341156006, 6.232110977172852, 6.7762250900268555, 7.320339202880859, 7.864452838897705, 8.408567428588867, 8.952680587768555, 9.496794700622559, 10.040908813476562, 10.585022926330566, 11.12913703918457, 11.673250198364258, 12.217364311218262, 12.761478424072266, 13.30559253692627, 13.849706649780273, 14.393820762634277, 14.937934875488281, 15.482048034667969, 16.02616310119629, 16.570276260375977, 17.114391326904297, 17.658504486083984, 18.202617645263672]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 8.0, 19.0, 18.0, 28.0, 38.0, 57.0, 78.0, 97.0, 155.0, 203.0, 301.0, 426.0, 614.0, 879.0, 1276.0, 1938.0, 2889.0, 4412.0, 7184.0, 11933.0, 21065.0, 42438.0, 100798.0, 382711.0, 295949.0, 86178.0, 37490.0, 19281.0, 10902.0, 6545.0, 4170.0, 2678.0, 1789.0, 1242.0, 820.0, 577.0, 387.0, 267.0, 199.0, 147.0, 106.0, 74.0, 56.0, 39.0, 26.0, 20.0, 11.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.71875, -34.52490234375, -33.3310546875, -32.13720703125, -30.943359375, -29.74951171875, -28.5556640625, -27.36181640625, -26.16796875, -24.97412109375, -23.7802734375, -22.58642578125, -21.392578125, -20.19873046875, -19.0048828125, -17.81103515625, -16.6171875, -15.42333984375, -14.2294921875, -13.03564453125, -11.841796875, -10.64794921875, -9.4541015625, -8.26025390625, -7.06640625, -5.87255859375, -4.6787109375, -3.48486328125, -2.291015625, -1.09716796875, 0.0966796875, 1.29052734375, 2.484375, 3.67822265625, 4.8720703125, 6.06591796875, 7.259765625, 8.45361328125, 9.6474609375, 10.84130859375, 12.03515625, 13.22900390625, 14.4228515625, 15.61669921875, 16.810546875, 18.00439453125, 19.1982421875, 20.39208984375, 21.5859375, 22.77978515625, 23.9736328125, 25.16748046875, 26.361328125, 27.55517578125, 28.7490234375, 29.94287109375, 31.13671875, 32.33056640625, 33.5244140625, 34.71826171875, 35.912109375, 37.10595703125, 38.2998046875, 39.49365234375, 40.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 10.0, 12.0, 15.0, 18.0, 19.0, 16.0, 11.0, 31.0, 27.0, 30.0, 34.0, 37.0, 50.0, 31.0, 38.0, 35.0, 38.0, 41.0, 45.0, 37.0, 34.0, 42.0, 33.0, 33.0, 35.0, 37.0, 18.0, 21.0, 22.0, 15.0, 17.0, 18.0, 13.0, 11.0, 9.0, 8.0, 11.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.953125, -19.35498046875, -18.7568359375, -18.15869140625, -17.560546875, -16.96240234375, -16.3642578125, -15.76611328125, -15.16796875, -14.56982421875, -13.9716796875, -13.37353515625, -12.775390625, -12.17724609375, -11.5791015625, -10.98095703125, -10.3828125, -9.78466796875, -9.1865234375, -8.58837890625, -7.990234375, -7.39208984375, -6.7939453125, -6.19580078125, -5.59765625, -4.99951171875, -4.4013671875, -3.80322265625, -3.205078125, -2.60693359375, -2.0087890625, -1.41064453125, -0.8125, -0.21435546875, 0.3837890625, 0.98193359375, 1.580078125, 2.17822265625, 2.7763671875, 3.37451171875, 3.97265625, 4.57080078125, 5.1689453125, 5.76708984375, 6.365234375, 6.96337890625, 7.5615234375, 8.15966796875, 8.7578125, 9.35595703125, 9.9541015625, 10.55224609375, 11.150390625, 11.74853515625, 12.3466796875, 12.94482421875, 13.54296875, 14.14111328125, 14.7392578125, 15.33740234375, 15.935546875, 16.53369140625, 17.1318359375, 17.72998046875, 18.328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 13.0, 15.0, 30.0, 34.0, 46.0, 58.0, 89.0, 109.0, 152.0, 185.0, 271.0, 364.0, 480.0, 682.0, 958.0, 1249.0, 1935.0, 2969.0, 4760.0, 8425.0, 16355.0, 41489.0, 339272.0, 538964.0, 47705.0, 17895.0, 8898.0, 5086.0, 3133.0, 1978.0, 1373.0, 973.0, 674.0, 514.0, 342.0, 254.0, 220.0, 161.0, 109.0, 82.0, 58.0, 51.0, 35.0, 21.0, 19.0, 13.0, 11.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-57.0, -55.16455078125, -53.3291015625, -51.49365234375, -49.658203125, -47.82275390625, -45.9873046875, -44.15185546875, -42.31640625, -40.48095703125, -38.6455078125, -36.81005859375, -34.974609375, -33.13916015625, -31.3037109375, -29.46826171875, -27.6328125, -25.79736328125, -23.9619140625, -22.12646484375, -20.291015625, -18.45556640625, -16.6201171875, -14.78466796875, -12.94921875, -11.11376953125, -9.2783203125, -7.44287109375, -5.607421875, -3.77197265625, -1.9365234375, -0.10107421875, 1.734375, 3.56982421875, 5.4052734375, 7.24072265625, 9.076171875, 10.91162109375, 12.7470703125, 14.58251953125, 16.41796875, 18.25341796875, 20.0888671875, 21.92431640625, 23.759765625, 25.59521484375, 27.4306640625, 29.26611328125, 31.1015625, 32.93701171875, 34.7724609375, 36.60791015625, 38.443359375, 40.27880859375, 42.1142578125, 43.94970703125, 45.78515625, 47.62060546875, 49.4560546875, 51.29150390625, 53.126953125, 54.96240234375, 56.7978515625, 58.63330078125, 60.46875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 12.0, 13.0, 24.0, 18.0, 20.0, 14.0, 27.0, 45.0, 19.0, 26.0, 26.0, 45.0, 46.0, 32.0, 48.0, 44.0, 44.0, 40.0, 36.0, 44.0, 35.0, 40.0, 38.0, 31.0, 33.0, 34.0, 24.0, 18.0, 23.0, 15.0, 10.0, 10.0, 16.0, 4.0, 6.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.442626953125, -13.90087890625, -13.359130859375, -12.8173828125, -12.275634765625, -11.73388671875, -11.192138671875, -10.650390625, -10.108642578125, -9.56689453125, -9.025146484375, -8.4833984375, -7.941650390625, -7.39990234375, -6.858154296875, -6.31640625, -5.774658203125, -5.23291015625, -4.691162109375, -4.1494140625, -3.607666015625, -3.06591796875, -2.524169921875, -1.982421875, -1.440673828125, -0.89892578125, -0.357177734375, 0.1845703125, 0.726318359375, 1.26806640625, 1.809814453125, 2.3515625, 2.893310546875, 3.43505859375, 3.976806640625, 4.5185546875, 5.060302734375, 5.60205078125, 6.143798828125, 6.685546875, 7.227294921875, 7.76904296875, 8.310791015625, 8.8525390625, 9.394287109375, 9.93603515625, 10.477783203125, 11.01953125, 11.561279296875, 12.10302734375, 12.644775390625, 13.1865234375, 13.728271484375, 14.27001953125, 14.811767578125, 15.353515625, 15.895263671875, 16.43701171875, 16.978759765625, 17.5205078125, 18.062255859375, 18.60400390625, 19.145751953125, 19.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 13.0, 16.0, 22.0, 29.0, 44.0, 46.0, 81.0, 125.0, 157.0, 260.0, 328.0, 553.0, 866.0, 1443.0, 2769.0, 5806.0, 13560.0, 42424.0, 507421.0, 406914.0, 40060.0, 13161.0, 5751.0, 2748.0, 1483.0, 854.0, 524.0, 316.0, 220.0, 154.0, 117.0, 79.0, 55.0, 42.0, 24.0, 23.0, 14.0, 9.0, 6.0, 9.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-44.0625, -42.7265625, -41.390625, -40.0546875, -38.71875, -37.3828125, -36.046875, -34.7109375, -33.375, -32.0390625, -30.703125, -29.3671875, -28.03125, -26.6953125, -25.359375, -24.0234375, -22.6875, -21.3515625, -20.015625, -18.6796875, -17.34375, -16.0078125, -14.671875, -13.3359375, -12.0, -10.6640625, -9.328125, -7.9921875, -6.65625, -5.3203125, -3.984375, -2.6484375, -1.3125, 0.0234375, 1.359375, 2.6953125, 4.03125, 5.3671875, 6.703125, 8.0390625, 9.375, 10.7109375, 12.046875, 13.3828125, 14.71875, 16.0546875, 17.390625, 18.7265625, 20.0625, 21.3984375, 22.734375, 24.0703125, 25.40625, 26.7421875, 28.078125, 29.4140625, 30.75, 32.0859375, 33.421875, 34.7578125, 36.09375, 37.4296875, 38.765625, 40.1015625, 41.4375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 13.0, 9.0, 26.0, 33.0, 68.0, 91.0, 153.0, 205.0, 143.0, 104.0, 60.0, 32.0, 17.0, 9.0, 10.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020580291748046875, -0.0019996613264083862, -0.001941293478012085, -0.0018829256296157837, -0.0018245577812194824, -0.0017661899328231812, -0.0017078220844268799, -0.0016494542360305786, -0.0015910863876342773, -0.001532718539237976, -0.0014743506908416748, -0.0014159828424453735, -0.0013576149940490723, -0.001299247145652771, -0.0012408792972564697, -0.0011825114488601685, -0.0011241436004638672, -0.001065775752067566, -0.0010074079036712646, -0.0009490400552749634, -0.0008906722068786621, -0.0008323043584823608, -0.0007739365100860596, -0.0007155686616897583, -0.000657200813293457, -0.0005988329648971558, -0.0005404651165008545, -0.0004820972681045532, -0.00042372941970825195, -0.0003653615713119507, -0.0003069937229156494, -0.00024862587451934814, -0.00019025802612304688, -0.0001318901777267456, -7.352232933044434e-05, -1.5154480934143066e-05, 4.32133674621582e-05, 0.00010158121585845947, 0.00015994906425476074, 0.000218316912651062, 0.0002766847610473633, 0.00033505260944366455, 0.0003934204578399658, 0.0004517883062362671, 0.0005101561546325684, 0.0005685240030288696, 0.0006268918514251709, 0.0006852596998214722, 0.0007436275482177734, 0.0008019953966140747, 0.000860363245010376, 0.0009187310934066772, 0.0009770989418029785, 0.0010354667901992798, 0.001093834638595581, 0.0011522024869918823, 0.0012105703353881836, 0.0012689381837844849, 0.0013273060321807861, 0.0013856738805770874, 0.0014440417289733887, 0.00150240957736969, 0.0015607774257659912, 0.0016191452741622925, 0.0016775131225585938]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 15.0, 17.0, 38.0, 43.0, 49.0, 68.0, 113.0, 157.0, 249.0, 337.0, 517.0, 818.0, 1299.0, 2007.0, 3380.0, 5699.0, 9990.0, 19192.0, 40321.0, 103468.0, 431950.0, 280599.0, 77821.0, 32645.0, 16090.0, 8570.0, 4988.0, 2832.0, 1897.0, 1130.0, 722.0, 446.0, 318.0, 215.0, 171.0, 103.0, 77.0, 63.0, 33.0, 27.0, 15.0, 12.0, 12.0, 4.0, 4.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.8203125, -15.2906494140625, -14.760986328125, -14.2313232421875, -13.70166015625, -13.1719970703125, -12.642333984375, -12.1126708984375, -11.5830078125, -11.0533447265625, -10.523681640625, -9.9940185546875, -9.46435546875, -8.9346923828125, -8.405029296875, -7.8753662109375, -7.345703125, -6.8160400390625, -6.286376953125, -5.7567138671875, -5.22705078125, -4.6973876953125, -4.167724609375, -3.6380615234375, -3.1083984375, -2.5787353515625, -2.049072265625, -1.5194091796875, -0.98974609375, -0.4600830078125, 0.069580078125, 0.5992431640625, 1.12890625, 1.6585693359375, 2.188232421875, 2.7178955078125, 3.24755859375, 3.7772216796875, 4.306884765625, 4.8365478515625, 5.3662109375, 5.8958740234375, 6.425537109375, 6.9552001953125, 7.48486328125, 8.0145263671875, 8.544189453125, 9.0738525390625, 9.603515625, 10.1331787109375, 10.662841796875, 11.1925048828125, 11.72216796875, 12.2518310546875, 12.781494140625, 13.3111572265625, 13.8408203125, 14.3704833984375, 14.900146484375, 15.4298095703125, 15.95947265625, 16.4891357421875, 17.018798828125, 17.5484619140625, 18.078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 5.0, 6.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 10.0, 12.0, 20.0, 16.0, 19.0, 33.0, 34.0, 58.0, 68.0, 97.0, 90.0, 114.0, 95.0, 57.0, 45.0, 38.0, 37.0, 22.0, 24.0, 17.0, 16.0, 10.0, 12.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75, -2.64129638671875, -2.5325927734375, -2.42388916015625, -2.315185546875, -2.20648193359375, -2.0977783203125, -1.98907470703125, -1.88037109375, -1.77166748046875, -1.6629638671875, -1.55426025390625, -1.445556640625, -1.33685302734375, -1.2281494140625, -1.11944580078125, -1.0107421875, -0.90203857421875, -0.7933349609375, -0.68463134765625, -0.575927734375, -0.46722412109375, -0.3585205078125, -0.24981689453125, -0.14111328125, -0.03240966796875, 0.0762939453125, 0.18499755859375, 0.293701171875, 0.40240478515625, 0.5111083984375, 0.61981201171875, 0.728515625, 0.83721923828125, 0.9459228515625, 1.05462646484375, 1.163330078125, 1.27203369140625, 1.3807373046875, 1.48944091796875, 1.59814453125, 1.70684814453125, 1.8155517578125, 1.92425537109375, 2.032958984375, 2.14166259765625, 2.2503662109375, 2.35906982421875, 2.4677734375, 2.57647705078125, 2.6851806640625, 2.79388427734375, 2.902587890625, 3.01129150390625, 3.1199951171875, 3.22869873046875, 3.33740234375, 3.44610595703125, 3.5548095703125, 3.66351318359375, 3.772216796875, 3.88092041015625, 3.9896240234375, 4.09832763671875, 4.20703125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 22.0, 27.0, 47.0, 99.0, 163.0, 262.0, 138.0, 74.0, 47.0, 26.0, 25.0, 17.0, 10.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34966278076172, -43.42988586425781, -41.510108947753906, -39.59033203125, -37.670555114746094, -35.75077819824219, -33.83100128173828, -31.911226272583008, -29.9914493560791, -28.071672439575195, -26.15189552307129, -24.232120513916016, -22.31234359741211, -20.392566680908203, -18.472789764404297, -16.55301284790039, -14.633235931396484, -12.713459014892578, -10.793682098388672, -8.873906135559082, -6.954129219055176, -5.0343523025512695, -3.1145763397216797, -1.1947994232177734, 0.7249774932861328, 2.64475417137146, 4.564530849456787, 6.484307289123535, 8.404084205627441, 10.323861122131348, 12.243637084960938, 14.163414001464844, 16.08319091796875, 18.002967834472656, 19.922744750976562, 21.84252166748047, 23.762298583984375, 25.68207550048828, 27.601850509643555, 29.52162742614746, 31.441404342651367, 33.36117935180664, 35.28095626831055, 37.20073318481445, 39.12051010131836, 41.040287017822266, 42.96006393432617, 44.87984085083008, 46.799617767333984, 48.71939468383789, 50.6391716003418, 52.5589485168457, 54.47872543334961, 56.398502349853516, 58.318275451660156, 60.23805236816406, 62.15782928466797, 64.07760620117188, 65.99738311767578, 67.91716003417969, 69.8369369506836, 71.7567138671875, 73.6764907836914, 75.59626770019531, 77.51604461669922]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 3.0, 13.0, 8.0, 16.0, 16.0, 15.0, 21.0, 16.0, 31.0, 18.0, 18.0, 36.0, 32.0, 22.0, 28.0, 31.0, 38.0, 33.0, 35.0, 30.0, 32.0, 32.0, 31.0, 38.0, 42.0, 29.0, 29.0, 28.0, 22.0, 28.0, 23.0, 27.0, 23.0, 14.0, 16.0, 17.0, 13.0, 9.0, 10.0, 10.0, 6.0, 11.0, 3.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.123363494873047, -14.638275146484375, -14.153185844421387, -13.668097496032715, -13.183009147644043, -12.697919845581055, -12.212831497192383, -11.727743148803711, -11.242654800415039, -10.757566452026367, -10.272477149963379, -9.787388801574707, -9.302300453186035, -8.817211151123047, -8.332122802734375, -7.847034454345703, -7.361945152282715, -6.876856327056885, -6.391767978668213, -5.906679153442383, -5.421590805053711, -4.936501979827881, -4.451413154602051, -3.9663245677948, -3.481235980987549, -2.996147394180298, -2.511058807373047, -2.025969982147217, -1.5408813953399658, -1.0557928085327148, -0.5707039833068848, -0.08561539649963379, 0.3994722366333008, 0.8845608830451965, 1.3696495294570923, 1.8547382354736328, 2.339826822280884, 2.8249154090881348, 3.310004234313965, 3.795092821121216, 4.280181407928467, 4.765270233154297, 5.250358581542969, 5.735447406768799, 6.220536231994629, 6.705624580383301, 7.190713405609131, 7.675802230834961, 8.160890579223633, 8.645978927612305, 9.131068229675293, 9.616156578063965, 10.101244926452637, 10.586334228515625, 11.071422576904297, 11.556510925292969, 12.04159927368164, 12.526687622070312, 13.0117769241333, 13.496865272521973, 13.981953620910645, 14.467042922973633, 14.952131271362305, 15.437219619750977, 15.922308921813965]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 12.0, 13.0, 14.0, 26.0, 36.0, 60.0, 80.0, 104.0, 167.0, 209.0, 322.0, 495.0, 774.0, 1134.0, 1789.0, 2936.0, 4651.0, 7478.0, 12424.0, 20902.0, 35336.0, 60699.0, 104903.0, 182049.0, 234797.0, 156912.0, 90402.0, 52378.0, 30617.0, 18185.0, 10841.0, 6591.0, 4049.0, 2501.0, 1584.0, 961.0, 680.0, 462.0, 305.0, 213.0, 153.0, 88.0, 61.0, 55.0, 37.0, 24.0, 13.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-29.171875, -28.2705078125, -27.369140625, -26.4677734375, -25.56640625, -24.6650390625, -23.763671875, -22.8623046875, -21.9609375, -21.0595703125, -20.158203125, -19.2568359375, -18.35546875, -17.4541015625, -16.552734375, -15.6513671875, -14.75, -13.8486328125, -12.947265625, -12.0458984375, -11.14453125, -10.2431640625, -9.341796875, -8.4404296875, -7.5390625, -6.6376953125, -5.736328125, -4.8349609375, -3.93359375, -3.0322265625, -2.130859375, -1.2294921875, -0.328125, 0.5732421875, 1.474609375, 2.3759765625, 3.27734375, 4.1787109375, 5.080078125, 5.9814453125, 6.8828125, 7.7841796875, 8.685546875, 9.5869140625, 10.48828125, 11.3896484375, 12.291015625, 13.1923828125, 14.09375, 14.9951171875, 15.896484375, 16.7978515625, 17.69921875, 18.6005859375, 19.501953125, 20.4033203125, 21.3046875, 22.2060546875, 23.107421875, 24.0087890625, 24.91015625, 25.8115234375, 26.712890625, 27.6142578125, 28.515625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 15.0, 8.0, 9.0, 7.0, 16.0, 22.0, 20.0, 23.0, 20.0, 34.0, 38.0, 33.0, 41.0, 40.0, 30.0, 41.0, 37.0, 38.0, 47.0, 40.0, 44.0, 37.0, 42.0, 36.0, 30.0, 23.0, 35.0, 28.0, 25.0, 14.0, 13.0, 18.0, 18.0, 15.0, 7.0, 10.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.953125, -14.433349609375, -13.91357421875, -13.393798828125, -12.8740234375, -12.354248046875, -11.83447265625, -11.314697265625, -10.794921875, -10.275146484375, -9.75537109375, -9.235595703125, -8.7158203125, -8.196044921875, -7.67626953125, -7.156494140625, -6.63671875, -6.116943359375, -5.59716796875, -5.077392578125, -4.5576171875, -4.037841796875, -3.51806640625, -2.998291015625, -2.478515625, -1.958740234375, -1.43896484375, -0.919189453125, -0.3994140625, 0.120361328125, 0.64013671875, 1.159912109375, 1.6796875, 2.199462890625, 2.71923828125, 3.239013671875, 3.7587890625, 4.278564453125, 4.79833984375, 5.318115234375, 5.837890625, 6.357666015625, 6.87744140625, 7.397216796875, 7.9169921875, 8.436767578125, 8.95654296875, 9.476318359375, 9.99609375, 10.515869140625, 11.03564453125, 11.555419921875, 12.0751953125, 12.594970703125, 13.11474609375, 13.634521484375, 14.154296875, 14.674072265625, 15.19384765625, 15.713623046875, 16.2333984375, 16.753173828125, 17.27294921875, 17.792724609375, 18.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 2.0, 8.0, 15.0, 20.0, 34.0, 42.0, 68.0, 100.0, 145.0, 247.0, 407.0, 667.0, 1044.0, 1800.0, 3004.0, 5355.0, 10120.0, 20035.0, 42124.0, 97654.0, 249860.0, 348615.0, 148126.0, 60865.0, 27640.0, 13644.0, 7284.0, 3969.0, 2241.0, 1270.0, 828.0, 457.0, 302.0, 194.0, 135.0, 69.0, 54.0, 38.0, 26.0, 15.0, 13.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-45.40625, -44.15283203125, -42.8994140625, -41.64599609375, -40.392578125, -39.13916015625, -37.8857421875, -36.63232421875, -35.37890625, -34.12548828125, -32.8720703125, -31.61865234375, -30.365234375, -29.11181640625, -27.8583984375, -26.60498046875, -25.3515625, -24.09814453125, -22.8447265625, -21.59130859375, -20.337890625, -19.08447265625, -17.8310546875, -16.57763671875, -15.32421875, -14.07080078125, -12.8173828125, -11.56396484375, -10.310546875, -9.05712890625, -7.8037109375, -6.55029296875, -5.296875, -4.04345703125, -2.7900390625, -1.53662109375, -0.283203125, 0.97021484375, 2.2236328125, 3.47705078125, 4.73046875, 5.98388671875, 7.2373046875, 8.49072265625, 9.744140625, 10.99755859375, 12.2509765625, 13.50439453125, 14.7578125, 16.01123046875, 17.2646484375, 18.51806640625, 19.771484375, 21.02490234375, 22.2783203125, 23.53173828125, 24.78515625, 26.03857421875, 27.2919921875, 28.54541015625, 29.798828125, 31.05224609375, 32.3056640625, 33.55908203125, 34.8125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 0.0, 8.0, 7.0, 7.0, 17.0, 12.0, 19.0, 15.0, 28.0, 22.0, 29.0, 39.0, 25.0, 42.0, 45.0, 49.0, 39.0, 54.0, 40.0, 57.0, 38.0, 41.0, 51.0, 34.0, 31.0, 41.0, 27.0, 30.0, 27.0, 22.0, 23.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5859375, -12.1697998046875, -11.753662109375, -11.3375244140625, -10.92138671875, -10.5052490234375, -10.089111328125, -9.6729736328125, -9.2568359375, -8.8406982421875, -8.424560546875, -8.0084228515625, -7.59228515625, -7.1761474609375, -6.760009765625, -6.3438720703125, -5.927734375, -5.5115966796875, -5.095458984375, -4.6793212890625, -4.26318359375, -3.8470458984375, -3.430908203125, -3.0147705078125, -2.5986328125, -2.1824951171875, -1.766357421875, -1.3502197265625, -0.93408203125, -0.5179443359375, -0.101806640625, 0.3143310546875, 0.73046875, 1.1466064453125, 1.562744140625, 1.9788818359375, 2.39501953125, 2.8111572265625, 3.227294921875, 3.6434326171875, 4.0595703125, 4.4757080078125, 4.891845703125, 5.3079833984375, 5.72412109375, 6.1402587890625, 6.556396484375, 6.9725341796875, 7.388671875, 7.8048095703125, 8.220947265625, 8.6370849609375, 9.05322265625, 9.4693603515625, 9.885498046875, 10.3016357421875, 10.7177734375, 11.1339111328125, 11.550048828125, 11.9661865234375, 12.38232421875, 12.7984619140625, 13.214599609375, 13.6307373046875, 14.046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 11.0, 8.0, 18.0, 28.0, 50.0, 73.0, 129.0, 175.0, 253.0, 465.0, 692.0, 1132.0, 2057.0, 4185.0, 8959.0, 23739.0, 85553.0, 715135.0, 149632.0, 33178.0, 11801.0, 5194.0, 2465.0, 1364.0, 860.0, 499.0, 279.0, 191.0, 125.0, 98.0, 68.0, 39.0, 34.0, 14.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-99.5625, -96.4169921875, -93.271484375, -90.1259765625, -86.98046875, -83.8349609375, -80.689453125, -77.5439453125, -74.3984375, -71.2529296875, -68.107421875, -64.9619140625, -61.81640625, -58.6708984375, -55.525390625, -52.3798828125, -49.234375, -46.0888671875, -42.943359375, -39.7978515625, -36.65234375, -33.5068359375, -30.361328125, -27.2158203125, -24.0703125, -20.9248046875, -17.779296875, -14.6337890625, -11.48828125, -8.3427734375, -5.197265625, -2.0517578125, 1.09375, 4.2392578125, 7.384765625, 10.5302734375, 13.67578125, 16.8212890625, 19.966796875, 23.1123046875, 26.2578125, 29.4033203125, 32.548828125, 35.6943359375, 38.83984375, 41.9853515625, 45.130859375, 48.2763671875, 51.421875, 54.5673828125, 57.712890625, 60.8583984375, 64.00390625, 67.1494140625, 70.294921875, 73.4404296875, 76.5859375, 79.7314453125, 82.876953125, 86.0224609375, 89.16796875, 92.3134765625, 95.458984375, 98.6044921875, 101.75]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 7.0, 13.0, 15.0, 15.0, 33.0, 47.0, 49.0, 61.0, 107.0, 170.0, 132.0, 75.0, 71.0, 52.0, 34.0, 41.0, 12.0, 14.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0039520263671875, -0.0038504600524902344, -0.0037488937377929688, -0.003647327423095703, -0.0035457611083984375, -0.003444194793701172, -0.0033426284790039062, -0.0032410621643066406, -0.003139495849609375, -0.0030379295349121094, -0.0029363632202148438, -0.002834796905517578, -0.0027332305908203125, -0.002631664276123047, -0.0025300979614257812, -0.0024285316467285156, -0.00232696533203125, -0.0022253990173339844, -0.0021238327026367188, -0.002022266387939453, -0.0019207000732421875, -0.0018191337585449219, -0.0017175674438476562, -0.0016160011291503906, -0.001514434814453125, -0.0014128684997558594, -0.0013113021850585938, -0.0012097358703613281, -0.0011081695556640625, -0.0010066032409667969, -0.0009050369262695312, -0.0008034706115722656, -0.000701904296875, -0.0006003379821777344, -0.0004987716674804688, -0.0003972053527832031, -0.0002956390380859375, -0.00019407272338867188, -9.250640869140625e-05, 9.059906005859375e-06, 0.000110626220703125, 0.00021219253540039062, 0.00031375885009765625, 0.0004153251647949219, 0.0005168914794921875, 0.0006184577941894531, 0.0007200241088867188, 0.0008215904235839844, 0.00092315673828125, 0.0010247230529785156, 0.0011262893676757812, 0.0012278556823730469, 0.0013294219970703125, 0.0014309883117675781, 0.0015325546264648438, 0.0016341209411621094, 0.001735687255859375, 0.0018372535705566406, 0.0019388198852539062, 0.002040386199951172, 0.0021419525146484375, 0.002243518829345703, 0.0023450851440429688, 0.0024466514587402344, 0.0025482177734375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 3.0, 11.0, 6.0, 9.0, 20.0, 26.0, 42.0, 54.0, 76.0, 128.0, 172.0, 281.0, 426.0, 683.0, 1259.0, 2329.0, 5047.0, 13683.0, 55939.0, 756397.0, 170190.0, 25920.0, 8222.0, 3447.0, 1653.0, 950.0, 578.0, 337.0, 199.0, 127.0, 105.0, 74.0, 50.0, 36.0, 18.0, 20.0, 10.0, 8.0, 3.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.5625, -89.2275390625, -85.892578125, -82.5576171875, -79.22265625, -75.8876953125, -72.552734375, -69.2177734375, -65.8828125, -62.5478515625, -59.212890625, -55.8779296875, -52.54296875, -49.2080078125, -45.873046875, -42.5380859375, -39.203125, -35.8681640625, -32.533203125, -29.1982421875, -25.86328125, -22.5283203125, -19.193359375, -15.8583984375, -12.5234375, -9.1884765625, -5.853515625, -2.5185546875, 0.81640625, 4.1513671875, 7.486328125, 10.8212890625, 14.15625, 17.4912109375, 20.826171875, 24.1611328125, 27.49609375, 30.8310546875, 34.166015625, 37.5009765625, 40.8359375, 44.1708984375, 47.505859375, 50.8408203125, 54.17578125, 57.5107421875, 60.845703125, 64.1806640625, 67.515625, 70.8505859375, 74.185546875, 77.5205078125, 80.85546875, 84.1904296875, 87.525390625, 90.8603515625, 94.1953125, 97.5302734375, 100.865234375, 104.2001953125, 107.53515625, 110.8701171875, 114.205078125, 117.5400390625, 120.875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 8.0, 10.0, 9.0, 17.0, 38.0, 49.0, 66.0, 74.0, 111.0, 208.0, 116.0, 82.0, 52.0, 43.0, 32.0, 19.0, 12.0, 10.0, 8.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.984375, -23.3780517578125, -22.771728515625, -22.1654052734375, -21.55908203125, -20.9527587890625, -20.346435546875, -19.7401123046875, -19.1337890625, -18.5274658203125, -17.921142578125, -17.3148193359375, -16.70849609375, -16.1021728515625, -15.495849609375, -14.8895263671875, -14.283203125, -13.6768798828125, -13.070556640625, -12.4642333984375, -11.85791015625, -11.2515869140625, -10.645263671875, -10.0389404296875, -9.4326171875, -8.8262939453125, -8.219970703125, -7.6136474609375, -7.00732421875, -6.4010009765625, -5.794677734375, -5.1883544921875, -4.58203125, -3.9757080078125, -3.369384765625, -2.7630615234375, -2.15673828125, -1.5504150390625, -0.944091796875, -0.3377685546875, 0.2685546875, 0.8748779296875, 1.481201171875, 2.0875244140625, 2.69384765625, 3.3001708984375, 3.906494140625, 4.5128173828125, 5.119140625, 5.7254638671875, 6.331787109375, 6.9381103515625, 7.54443359375, 8.1507568359375, 8.757080078125, 9.3634033203125, 9.9697265625, 10.5760498046875, 11.182373046875, 11.7886962890625, 12.39501953125, 13.0013427734375, 13.607666015625, 14.2139892578125, 14.8203125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 13.0, 30.0, 59.0, 92.0, 194.0, 217.0, 121.0, 72.0, 52.0, 28.0, 25.0, 20.0, 12.0, 13.0, 9.0, 1.0, 11.0, 4.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.573490142822266, -41.906944274902344, -40.24039840698242, -38.5738525390625, -36.90730667114258, -35.240760803222656, -33.57421112060547, -31.907665252685547, -30.241119384765625, -28.574573516845703, -26.90802764892578, -25.24148178100586, -23.574934005737305, -21.908388137817383, -20.24184226989746, -18.575294494628906, -16.908750534057617, -15.242204666137695, -13.575657844543457, -11.909111976623535, -10.242565155029297, -8.576019287109375, -6.909473419189453, -5.242926597595215, -3.576380729675293, -1.9098345041275024, -0.24328827857971191, 1.423257827758789, 3.089804172515869, 4.756350517272949, 6.422896385192871, 8.08944320678711, 9.755989074707031, 11.422534942626953, 13.089081764221191, 14.755627632141113, 16.42217445373535, 18.088720321655273, 19.755266189575195, 21.42181396484375, 23.088359832763672, 24.754905700683594, 26.421451568603516, 28.087997436523438, 29.754545211791992, 31.421091079711914, 33.08763885498047, 34.75418472290039, 36.42073059082031, 38.087276458740234, 39.753822326660156, 41.42036819458008, 43.0869140625, 44.75346374511719, 46.420005798339844, 48.08655548095703, 49.75309753417969, 51.41964340209961, 53.08618927001953, 54.75273513793945, 56.419281005859375, 58.08583068847656, 59.75237274169922, 61.418922424316406, 63.08546829223633]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 20.0, 13.0, 21.0, 23.0, 29.0, 13.0, 29.0, 28.0, 33.0, 35.0, 24.0, 36.0, 46.0, 34.0, 42.0, 57.0, 38.0, 36.0, 45.0, 42.0, 33.0, 42.0, 32.0, 35.0, 19.0, 20.0, 17.0, 24.0, 17.0, 17.0, 16.0, 12.0, 11.0, 5.0, 5.0, 7.0, 9.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.829206466674805, -16.264965057373047, -15.700721740722656, -15.136479377746582, -14.572237014770508, -14.00799560546875, -13.443753242492676, -12.879510879516602, -12.315268516540527, -11.751026153564453, -11.186783790588379, -10.622541427612305, -10.058300018310547, -9.494056701660156, -8.929815292358398, -8.365572929382324, -7.80133056640625, -7.237088203430176, -6.672845840454102, -6.1086039543151855, -5.544361591339111, -4.980119228363037, -4.415877342224121, -3.851634979248047, -3.2873926162719727, -2.7231502532958984, -2.1589081287384033, -1.5946658849716187, -1.030423641204834, -0.46618127822875977, 0.09806084632873535, 0.6623029708862305, 1.2265472412109375, 1.7907894849777222, 2.355031728744507, 2.919273853302002, 3.483516216278076, 4.04775857925415, 4.612000465393066, 5.176242828369141, 5.740485191345215, 6.304727554321289, 6.868969917297363, 7.433211803436279, 7.9974541664123535, 8.561697006225586, 9.125938415527344, 9.690180778503418, 10.254423141479492, 10.818665504455566, 11.38290786743164, 11.947150230407715, 12.511392593383789, 13.075634002685547, 13.639876365661621, 14.204118728637695, 14.76836109161377, 15.332603454589844, 15.896845817565918, 16.461088180541992, 17.02532958984375, 17.58957290649414, 18.1538143157959, 18.718055725097656, 19.282299041748047]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 13.0, 27.0, 35.0, 46.0, 67.0, 103.0, 139.0, 215.0, 301.0, 528.0, 787.0, 1148.0, 1703.0, 2766.0, 4323.0, 6707.0, 10810.0, 17829.0, 30597.0, 55231.0, 111427.0, 288500.0, 1226827.0, 1727739.0, 404846.0, 142383.0, 68294.0, 36281.0, 20978.0, 12485.0, 7812.0, 4947.0, 3020.0, 2001.0, 1208.0, 830.0, 532.0, 285.0, 197.0, 114.0, 73.0, 51.0, 23.0, 22.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.265625, -27.412841796875, -26.56005859375, -25.707275390625, -24.8544921875, -24.001708984375, -23.14892578125, -22.296142578125, -21.443359375, -20.590576171875, -19.73779296875, -18.885009765625, -18.0322265625, -17.179443359375, -16.32666015625, -15.473876953125, -14.62109375, -13.768310546875, -12.91552734375, -12.062744140625, -11.2099609375, -10.357177734375, -9.50439453125, -8.651611328125, -7.798828125, -6.946044921875, -6.09326171875, -5.240478515625, -4.3876953125, -3.534912109375, -2.68212890625, -1.829345703125, -0.9765625, -0.123779296875, 0.72900390625, 1.581787109375, 2.4345703125, 3.287353515625, 4.14013671875, 4.992919921875, 5.845703125, 6.698486328125, 7.55126953125, 8.404052734375, 9.2568359375, 10.109619140625, 10.96240234375, 11.815185546875, 12.66796875, 13.520751953125, 14.37353515625, 15.226318359375, 16.0791015625, 16.931884765625, 17.78466796875, 18.637451171875, 19.490234375, 20.343017578125, 21.19580078125, 22.048583984375, 22.9013671875, 23.754150390625, 24.60693359375, 25.459716796875, 26.3125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 5.0, 9.0, 11.0, 15.0, 14.0, 24.0, 30.0, 25.0, 28.0, 25.0, 35.0, 34.0, 35.0, 46.0, 43.0, 46.0, 52.0, 36.0, 38.0, 53.0, 46.0, 44.0, 46.0, 38.0, 29.0, 33.0, 27.0, 26.0, 18.0, 17.0, 18.0, 12.0, 11.0, 5.0, 7.0, 8.0, 4.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.2802734375, -9.943359375, -9.6064453125, -9.26953125, -8.9326171875, -8.595703125, -8.2587890625, -7.921875, -7.5849609375, -7.248046875, -6.9111328125, -6.57421875, -6.2373046875, -5.900390625, -5.5634765625, -5.2265625, -4.8896484375, -4.552734375, -4.2158203125, -3.87890625, -3.5419921875, -3.205078125, -2.8681640625, -2.53125, -2.1943359375, -1.857421875, -1.5205078125, -1.18359375, -0.8466796875, -0.509765625, -0.1728515625, 0.1640625, 0.5009765625, 0.837890625, 1.1748046875, 1.51171875, 1.8486328125, 2.185546875, 2.5224609375, 2.859375, 3.1962890625, 3.533203125, 3.8701171875, 4.20703125, 4.5439453125, 4.880859375, 5.2177734375, 5.5546875, 5.8916015625, 6.228515625, 6.5654296875, 6.90234375, 7.2392578125, 7.576171875, 7.9130859375, 8.25, 8.5869140625, 8.923828125, 9.2607421875, 9.59765625, 9.9345703125, 10.271484375, 10.6083984375, 10.9453125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 26.0, 21.0, 31.0, 49.0, 66.0, 90.0, 125.0, 177.0, 248.0, 369.0, 574.0, 828.0, 1190.0, 1831.0, 2733.0, 4467.0, 7000.0, 11807.0, 20697.0, 38613.0, 79645.0, 186859.0, 558586.0, 1944172.0, 865237.0, 255500.0, 101664.0, 48415.0, 25300.0, 14357.0, 8622.0, 5280.0, 3297.0, 2191.0, 1382.0, 908.0, 620.0, 444.0, 281.0, 167.0, 126.0, 84.0, 72.0, 35.0, 39.0, 16.0, 13.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0], "bins": [-25.84375, -25.09814453125, -24.3525390625, -23.60693359375, -22.861328125, -22.11572265625, -21.3701171875, -20.62451171875, -19.87890625, -19.13330078125, -18.3876953125, -17.64208984375, -16.896484375, -16.15087890625, -15.4052734375, -14.65966796875, -13.9140625, -13.16845703125, -12.4228515625, -11.67724609375, -10.931640625, -10.18603515625, -9.4404296875, -8.69482421875, -7.94921875, -7.20361328125, -6.4580078125, -5.71240234375, -4.966796875, -4.22119140625, -3.4755859375, -2.72998046875, -1.984375, -1.23876953125, -0.4931640625, 0.25244140625, 0.998046875, 1.74365234375, 2.4892578125, 3.23486328125, 3.98046875, 4.72607421875, 5.4716796875, 6.21728515625, 6.962890625, 7.70849609375, 8.4541015625, 9.19970703125, 9.9453125, 10.69091796875, 11.4365234375, 12.18212890625, 12.927734375, 13.67333984375, 14.4189453125, 15.16455078125, 15.91015625, 16.65576171875, 17.4013671875, 18.14697265625, 18.892578125, 19.63818359375, 20.3837890625, 21.12939453125, 21.875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 18.0, 13.0, 23.0, 17.0, 30.0, 34.0, 41.0, 49.0, 79.0, 72.0, 96.0, 119.0, 117.0, 158.0, 207.0, 243.0, 314.0, 309.0, 321.0, 329.0, 232.0, 214.0, 172.0, 142.0, 109.0, 100.0, 83.0, 74.0, 56.0, 44.0, 37.0, 26.0, 21.0, 22.0, 16.0, 18.0, 17.0, 18.0, 18.0, 9.0, 10.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.921875, -4.76043701171875, -4.5989990234375, -4.43756103515625, -4.276123046875, -4.11468505859375, -3.9532470703125, -3.79180908203125, -3.63037109375, -3.46893310546875, -3.3074951171875, -3.14605712890625, -2.984619140625, -2.82318115234375, -2.6617431640625, -2.50030517578125, -2.3388671875, -2.17742919921875, -2.0159912109375, -1.85455322265625, -1.693115234375, -1.53167724609375, -1.3702392578125, -1.20880126953125, -1.04736328125, -0.88592529296875, -0.7244873046875, -0.56304931640625, -0.401611328125, -0.24017333984375, -0.0787353515625, 0.08270263671875, 0.244140625, 0.40557861328125, 0.5670166015625, 0.72845458984375, 0.889892578125, 1.05133056640625, 1.2127685546875, 1.37420654296875, 1.53564453125, 1.69708251953125, 1.8585205078125, 2.01995849609375, 2.181396484375, 2.34283447265625, 2.5042724609375, 2.66571044921875, 2.8271484375, 2.98858642578125, 3.1500244140625, 3.31146240234375, 3.472900390625, 3.63433837890625, 3.7957763671875, 3.95721435546875, 4.11865234375, 4.28009033203125, 4.4415283203125, 4.60296630859375, 4.764404296875, 4.92584228515625, 5.0872802734375, 5.24871826171875, 5.41015625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 8.0, 18.0, 20.0, 20.0, 34.0, 57.0, 63.0, 137.0, 148.0, 157.0, 82.0, 73.0, 54.0, 38.0, 17.0, 12.0, 10.0, 4.0, 11.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.900720596313477, -24.07403564453125, -23.24734878540039, -22.420663833618164, -21.593978881835938, -20.767292022705078, -19.94060707092285, -19.113922119140625, -18.287235260009766, -17.46055030822754, -16.63386344909668, -15.807178497314453, -14.980493545532227, -14.153807640075684, -13.32712173461914, -12.500436782836914, -11.673751831054688, -10.847065925598145, -10.020380973815918, -9.193695068359375, -8.367010116577148, -7.5403242111206055, -6.7136383056640625, -5.886952877044678, -5.060267448425293, -4.233582019805908, -3.4068963527679443, -2.5802106857299805, -1.7535252571105957, -0.9268398284912109, -0.10015392303466797, 0.7265315055847168, 1.5532188415527344, 2.379904270172119, 3.206589937210083, 4.033275604248047, 4.859961032867432, 5.686646461486816, 6.513332366943359, 7.340017795562744, 8.166703224182129, 8.993389129638672, 9.820074081420898, 10.646759986877441, 11.473445892333984, 12.300130844116211, 13.126816749572754, 13.953502655029297, 14.780187606811523, 15.606873512268066, 16.43355941772461, 17.260244369506836, 18.086929321289062, 18.913616180419922, 19.74030113220215, 20.566986083984375, 21.393672943115234, 22.22035789489746, 23.04704475402832, 23.873729705810547, 24.700414657592773, 25.527099609375, 26.35378646850586, 27.180471420288086, 28.007156372070312]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 2.0, 8.0, 10.0, 9.0, 9.0, 8.0, 26.0, 12.0, 16.0, 23.0, 25.0, 27.0, 28.0, 28.0, 31.0, 30.0, 31.0, 28.0, 41.0, 41.0, 44.0, 35.0, 40.0, 38.0, 32.0, 33.0, 41.0, 35.0, 23.0, 26.0, 31.0, 27.0, 28.0, 14.0, 21.0, 14.0, 12.0, 11.0, 9.0, 8.0, 7.0, 5.0, 8.0, 2.0, 9.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.787965774536133, -9.46242904663086, -9.136892318725586, -8.811356544494629, -8.485819816589355, -8.160283088684082, -7.834746837615967, -7.509210586547852, -7.183673858642578, -6.858137130737305, -6.5326008796691895, -6.207064628601074, -5.881527900695801, -5.555991172790527, -5.230454921722412, -4.904918670654297, -4.579381942749023, -4.25384521484375, -3.9283089637756348, -3.6027724742889404, -3.277235984802246, -2.9516994953155518, -2.6261630058288574, -2.300626516342163, -1.9750900268554688, -1.6495535373687744, -1.32401704788208, -0.9984805583953857, -0.6729440689086914, -0.34740757942199707, -0.021871089935302734, 0.3036653995513916, 0.6292018890380859, 0.9547383785247803, 1.2802748680114746, 1.605811357498169, 1.9313478469848633, 2.2568843364715576, 2.582420825958252, 2.9079573154449463, 3.2334938049316406, 3.559030294418335, 3.8845667839050293, 4.2101030349731445, 4.535639762878418, 4.861176490783691, 5.186712741851807, 5.512248992919922, 5.837785720825195, 6.163322448730469, 6.488858699798584, 6.814394950866699, 7.139931678771973, 7.465468406677246, 7.791004657745361, 8.116540908813477, 8.44207763671875, 8.767614364624023, 9.093151092529297, 9.418686866760254, 9.744223594665527, 10.0697603225708, 10.395296096801758, 10.720832824707031, 11.046369552612305]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 4.0, 7.0, 9.0, 15.0, 22.0, 48.0, 65.0, 75.0, 117.0, 146.0, 239.0, 343.0, 512.0, 795.0, 1124.0, 1668.0, 2663.0, 4103.0, 6646.0, 11252.0, 20200.0, 39471.0, 89296.0, 295751.0, 371620.0, 103205.0, 44104.0, 22699.0, 12194.0, 7340.0, 4492.0, 2789.0, 1868.0, 1195.0, 825.0, 536.0, 359.0, 266.0, 155.0, 109.0, 72.0, 53.0, 42.0, 25.0, 11.0, 11.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.7822265625, -16.205078125, -15.6279296875, -15.05078125, -14.4736328125, -13.896484375, -13.3193359375, -12.7421875, -12.1650390625, -11.587890625, -11.0107421875, -10.43359375, -9.8564453125, -9.279296875, -8.7021484375, -8.125, -7.5478515625, -6.970703125, -6.3935546875, -5.81640625, -5.2392578125, -4.662109375, -4.0849609375, -3.5078125, -2.9306640625, -2.353515625, -1.7763671875, -1.19921875, -0.6220703125, -0.044921875, 0.5322265625, 1.109375, 1.6865234375, 2.263671875, 2.8408203125, 3.41796875, 3.9951171875, 4.572265625, 5.1494140625, 5.7265625, 6.3037109375, 6.880859375, 7.4580078125, 8.03515625, 8.6123046875, 9.189453125, 9.7666015625, 10.34375, 10.9208984375, 11.498046875, 12.0751953125, 12.65234375, 13.2294921875, 13.806640625, 14.3837890625, 14.9609375, 15.5380859375, 16.115234375, 16.6923828125, 17.26953125, 17.8466796875, 18.423828125, 19.0009765625, 19.578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 9.0, 15.0, 18.0, 15.0, 16.0, 16.0, 27.0, 18.0, 24.0, 28.0, 30.0, 35.0, 41.0, 43.0, 42.0, 40.0, 37.0, 47.0, 44.0, 40.0, 43.0, 47.0, 31.0, 37.0, 37.0, 29.0, 25.0, 17.0, 21.0, 23.0, 7.0, 16.0, 8.0, 6.0, 9.0, 9.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-12.1171875, -11.7724609375, -11.427734375, -11.0830078125, -10.73828125, -10.3935546875, -10.048828125, -9.7041015625, -9.359375, -9.0146484375, -8.669921875, -8.3251953125, -7.98046875, -7.6357421875, -7.291015625, -6.9462890625, -6.6015625, -6.2568359375, -5.912109375, -5.5673828125, -5.22265625, -4.8779296875, -4.533203125, -4.1884765625, -3.84375, -3.4990234375, -3.154296875, -2.8095703125, -2.46484375, -2.1201171875, -1.775390625, -1.4306640625, -1.0859375, -0.7412109375, -0.396484375, -0.0517578125, 0.29296875, 0.6376953125, 0.982421875, 1.3271484375, 1.671875, 2.0166015625, 2.361328125, 2.7060546875, 3.05078125, 3.3955078125, 3.740234375, 4.0849609375, 4.4296875, 4.7744140625, 5.119140625, 5.4638671875, 5.80859375, 6.1533203125, 6.498046875, 6.8427734375, 7.1875, 7.5322265625, 7.876953125, 8.2216796875, 8.56640625, 8.9111328125, 9.255859375, 9.6005859375, 9.9453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 5.0, 6.0, 11.0, 18.0, 36.0, 44.0, 52.0, 51.0, 99.0, 127.0, 185.0, 211.0, 317.0, 432.0, 566.0, 798.0, 1106.0, 1760.0, 2744.0, 4486.0, 8241.0, 16833.0, 47299.0, 604867.0, 287673.0, 36929.0, 14268.0, 7244.0, 4036.0, 2541.0, 1653.0, 1098.0, 773.0, 514.0, 431.0, 306.0, 207.0, 156.0, 116.0, 68.0, 65.0, 53.0, 35.0, 23.0, 19.0, 10.0, 17.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-27.515625, -26.625244140625, -25.73486328125, -24.844482421875, -23.9541015625, -23.063720703125, -22.17333984375, -21.282958984375, -20.392578125, -19.502197265625, -18.61181640625, -17.721435546875, -16.8310546875, -15.940673828125, -15.05029296875, -14.159912109375, -13.26953125, -12.379150390625, -11.48876953125, -10.598388671875, -9.7080078125, -8.817626953125, -7.92724609375, -7.036865234375, -6.146484375, -5.256103515625, -4.36572265625, -3.475341796875, -2.5849609375, -1.694580078125, -0.80419921875, 0.086181640625, 0.9765625, 1.866943359375, 2.75732421875, 3.647705078125, 4.5380859375, 5.428466796875, 6.31884765625, 7.209228515625, 8.099609375, 8.989990234375, 9.88037109375, 10.770751953125, 11.6611328125, 12.551513671875, 13.44189453125, 14.332275390625, 15.22265625, 16.113037109375, 17.00341796875, 17.893798828125, 18.7841796875, 19.674560546875, 20.56494140625, 21.455322265625, 22.345703125, 23.236083984375, 24.12646484375, 25.016845703125, 25.9072265625, 26.797607421875, 27.68798828125, 28.578369140625, 29.46875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 4.0, 14.0, 11.0, 15.0, 12.0, 20.0, 23.0, 29.0, 32.0, 30.0, 30.0, 40.0, 46.0, 34.0, 48.0, 59.0, 48.0, 48.0, 33.0, 42.0, 42.0, 41.0, 41.0, 35.0, 35.0, 30.0, 22.0, 27.0, 15.0, 16.0, 9.0, 8.0, 12.0, 3.0, 6.0, 8.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.0859375, -8.78173828125, -8.4775390625, -8.17333984375, -7.869140625, -7.56494140625, -7.2607421875, -6.95654296875, -6.65234375, -6.34814453125, -6.0439453125, -5.73974609375, -5.435546875, -5.13134765625, -4.8271484375, -4.52294921875, -4.21875, -3.91455078125, -3.6103515625, -3.30615234375, -3.001953125, -2.69775390625, -2.3935546875, -2.08935546875, -1.78515625, -1.48095703125, -1.1767578125, -0.87255859375, -0.568359375, -0.26416015625, 0.0400390625, 0.34423828125, 0.6484375, 0.95263671875, 1.2568359375, 1.56103515625, 1.865234375, 2.16943359375, 2.4736328125, 2.77783203125, 3.08203125, 3.38623046875, 3.6904296875, 3.99462890625, 4.298828125, 4.60302734375, 4.9072265625, 5.21142578125, 5.515625, 5.81982421875, 6.1240234375, 6.42822265625, 6.732421875, 7.03662109375, 7.3408203125, 7.64501953125, 7.94921875, 8.25341796875, 8.5576171875, 8.86181640625, 9.166015625, 9.47021484375, 9.7744140625, 10.07861328125, 10.3828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 6.0, 13.0, 12.0, 11.0, 8.0, 21.0, 31.0, 39.0, 63.0, 51.0, 103.0, 155.0, 187.0, 303.0, 465.0, 663.0, 1044.0, 1803.0, 3252.0, 6575.0, 15694.0, 48434.0, 608509.0, 295336.0, 38981.0, 13473.0, 5859.0, 2971.0, 1625.0, 966.0, 587.0, 377.0, 282.0, 166.0, 127.0, 90.0, 79.0, 44.0, 32.0, 26.0, 30.0, 22.0, 11.0, 5.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-15.875, -15.361572265625, -14.84814453125, -14.334716796875, -13.8212890625, -13.307861328125, -12.79443359375, -12.281005859375, -11.767578125, -11.254150390625, -10.74072265625, -10.227294921875, -9.7138671875, -9.200439453125, -8.68701171875, -8.173583984375, -7.66015625, -7.146728515625, -6.63330078125, -6.119873046875, -5.6064453125, -5.093017578125, -4.57958984375, -4.066162109375, -3.552734375, -3.039306640625, -2.52587890625, -2.012451171875, -1.4990234375, -0.985595703125, -0.47216796875, 0.041259765625, 0.5546875, 1.068115234375, 1.58154296875, 2.094970703125, 2.6083984375, 3.121826171875, 3.63525390625, 4.148681640625, 4.662109375, 5.175537109375, 5.68896484375, 6.202392578125, 6.7158203125, 7.229248046875, 7.74267578125, 8.256103515625, 8.76953125, 9.282958984375, 9.79638671875, 10.309814453125, 10.8232421875, 11.336669921875, 11.85009765625, 12.363525390625, 12.876953125, 13.390380859375, 13.90380859375, 14.417236328125, 14.9306640625, 15.444091796875, 15.95751953125, 16.470947265625, 16.984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 6.0, 9.0, 14.0, 15.0, 19.0, 25.0, 42.0, 64.0, 110.0, 164.0, 146.0, 125.0, 88.0, 56.0, 29.0, 29.0, 18.0, 11.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009851455688476562, -0.0009617507457733154, -0.0009383559226989746, -0.0009149610996246338, -0.000891566276550293, -0.0008681714534759521, -0.0008447766304016113, -0.0008213818073272705, -0.0007979869842529297, -0.0007745921611785889, -0.000751197338104248, -0.0007278025150299072, -0.0007044076919555664, -0.0006810128688812256, -0.0006576180458068848, -0.0006342232227325439, -0.0006108283996582031, -0.0005874335765838623, -0.0005640387535095215, -0.0005406439304351807, -0.0005172491073608398, -0.000493854284286499, -0.0004704594612121582, -0.0004470646381378174, -0.00042366981506347656, -0.00040027499198913574, -0.0003768801689147949, -0.0003534853458404541, -0.0003300905227661133, -0.00030669569969177246, -0.00028330087661743164, -0.0002599060535430908, -0.00023651123046875, -0.00021311640739440918, -0.00018972158432006836, -0.00016632676124572754, -0.00014293193817138672, -0.0001195371150970459, -9.614229202270508e-05, -7.274746894836426e-05, -4.935264587402344e-05, -2.5957822799682617e-05, -2.562999725341797e-06, 2.0831823348999023e-05, 4.4226646423339844e-05, 6.762146949768066e-05, 9.101629257202148e-05, 0.0001144111156463623, 0.00013780593872070312, 0.00016120076179504395, 0.00018459558486938477, 0.00020799040794372559, 0.0002313852310180664, 0.0002547800540924072, 0.00027817487716674805, 0.00030156970024108887, 0.0003249645233154297, 0.0003483593463897705, 0.00037175416946411133, 0.00039514899253845215, 0.00041854381561279297, 0.0004419386386871338, 0.0004653334617614746, 0.0004887282848358154, 0.0005121231079101562]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 14.0, 22.0, 27.0, 29.0, 42.0, 67.0, 97.0, 123.0, 208.0, 281.0, 431.0, 673.0, 1047.0, 1745.0, 2975.0, 5470.0, 10687.0, 24638.0, 71593.0, 522950.0, 305914.0, 57497.0, 20710.0, 9386.0, 4831.0, 2703.0, 1575.0, 973.0, 632.0, 384.0, 259.0, 162.0, 112.0, 76.0, 61.0, 42.0, 36.0, 12.0, 17.0, 14.0, 10.0, 7.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.9141845703125, -9.531494140625, -9.1488037109375, -8.76611328125, -8.3834228515625, -8.000732421875, -7.6180419921875, -7.2353515625, -6.8526611328125, -6.469970703125, -6.0872802734375, -5.70458984375, -5.3218994140625, -4.939208984375, -4.5565185546875, -4.173828125, -3.7911376953125, -3.408447265625, -3.0257568359375, -2.64306640625, -2.2603759765625, -1.877685546875, -1.4949951171875, -1.1123046875, -0.7296142578125, -0.346923828125, 0.0357666015625, 0.41845703125, 0.8011474609375, 1.183837890625, 1.5665283203125, 1.94921875, 2.3319091796875, 2.714599609375, 3.0972900390625, 3.47998046875, 3.8626708984375, 4.245361328125, 4.6280517578125, 5.0107421875, 5.3934326171875, 5.776123046875, 6.1588134765625, 6.54150390625, 6.9241943359375, 7.306884765625, 7.6895751953125, 8.072265625, 8.4549560546875, 8.837646484375, 9.2203369140625, 9.60302734375, 9.9857177734375, 10.368408203125, 10.7510986328125, 11.1337890625, 11.5164794921875, 11.899169921875, 12.2818603515625, 12.66455078125, 13.0472412109375, 13.429931640625, 13.8126220703125, 14.1953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 7.0, 15.0, 22.0, 21.0, 22.0, 36.0, 70.0, 80.0, 90.0, 117.0, 128.0, 86.0, 50.0, 47.0, 38.0, 27.0, 14.0, 11.0, 12.0, 9.0, 9.0, 11.0, 10.0, 5.0, 5.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.19921875, -2.13592529296875, -2.0726318359375, -2.00933837890625, -1.946044921875, -1.88275146484375, -1.8194580078125, -1.75616455078125, -1.69287109375, -1.62957763671875, -1.5662841796875, -1.50299072265625, -1.439697265625, -1.37640380859375, -1.3131103515625, -1.24981689453125, -1.1865234375, -1.12322998046875, -1.0599365234375, -0.99664306640625, -0.933349609375, -0.87005615234375, -0.8067626953125, -0.74346923828125, -0.68017578125, -0.61688232421875, -0.5535888671875, -0.49029541015625, -0.427001953125, -0.36370849609375, -0.3004150390625, -0.23712158203125, -0.173828125, -0.11053466796875, -0.0472412109375, 0.01605224609375, 0.079345703125, 0.14263916015625, 0.2059326171875, 0.26922607421875, 0.33251953125, 0.39581298828125, 0.4591064453125, 0.52239990234375, 0.585693359375, 0.64898681640625, 0.7122802734375, 0.77557373046875, 0.8388671875, 0.90216064453125, 0.9654541015625, 1.02874755859375, 1.092041015625, 1.15533447265625, 1.2186279296875, 1.28192138671875, 1.34521484375, 1.40850830078125, 1.4718017578125, 1.53509521484375, 1.598388671875, 1.66168212890625, 1.7249755859375, 1.78826904296875, 1.8515625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 21.0, 32.0, 42.0, 65.0, 84.0, 164.0, 195.0, 130.0, 78.0, 49.0, 39.0, 18.0, 13.0, 13.0, 11.0, 6.0, 3.0, 7.0, 8.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.304847717285156, -29.42697525024414, -28.549100875854492, -27.671228408813477, -26.793354034423828, -25.915481567382812, -25.037609100341797, -24.15973663330078, -23.281862258911133, -22.403989791870117, -21.52611541748047, -20.648242950439453, -19.770370483398438, -18.89249610900879, -18.014623641967773, -17.136749267578125, -16.25887680053711, -15.381003379821777, -14.503129959106445, -13.62525749206543, -12.747384071350098, -11.869510650634766, -10.99163818359375, -10.113764762878418, -9.235891342163086, -8.358017921447754, -7.48014497756958, -6.602272033691406, -5.724398612976074, -4.846525192260742, -3.9686522483825684, -3.0907793045043945, -2.2129058837890625, -1.3350327014923096, -0.45715951919555664, 0.4207136631011963, 1.2985868453979492, 2.1764602661132812, 3.054333209991455, 3.932206153869629, 4.810079574584961, 5.687952995300293, 6.565825939178467, 7.443698883056641, 8.321572303771973, 9.199445724487305, 10.07731819152832, 10.955191612243652, 11.833065032958984, 12.710938453674316, 13.588811874389648, 14.466684341430664, 15.344557762145996, 16.222431182861328, 17.100303649902344, 17.97817611694336, 18.856050491333008, 19.733922958374023, 20.611797332763672, 21.489669799804688, 22.367542266845703, 23.24541664123535, 24.123289108276367, 25.001163482666016, 25.87903594970703]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 6.0, 9.0, 16.0, 2.0, 20.0, 12.0, 15.0, 18.0, 20.0, 23.0, 26.0, 29.0, 28.0, 26.0, 30.0, 25.0, 41.0, 40.0, 38.0, 28.0, 39.0, 45.0, 35.0, 26.0, 43.0, 43.0, 32.0, 23.0, 33.0, 20.0, 31.0, 24.0, 16.0, 28.0, 9.0, 15.0, 9.0, 8.0, 7.0, 10.0, 7.0, 6.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.379477500915527, -9.082643508911133, -8.785808563232422, -8.488974571228027, -8.192140579223633, -7.895305633544922, -7.598471641540527, -7.301637172698975, -7.004802703857422, -6.707968235015869, -6.411133766174316, -6.114299774169922, -5.817465305328369, -5.520630836486816, -5.223796844482422, -4.926962375640869, -4.630127906799316, -4.333293437957764, -4.036458969116211, -3.7396249771118164, -3.4427905082702637, -3.145956039428711, -2.8491218090057373, -2.5522875785827637, -2.255453109741211, -1.9586187601089478, -1.6617844104766846, -1.3649500608444214, -1.0681157112121582, -0.771281361579895, -0.47444701194763184, -0.1776127815246582, 0.11922264099121094, 0.4160569906234741, 0.7128913402557373, 1.0097256898880005, 1.3065600395202637, 1.6033943891525269, 1.90022873878479, 2.1970629692077637, 2.4938974380493164, 2.790731906890869, 3.0875661373138428, 3.3844003677368164, 3.681234836578369, 3.978069305419922, 4.274903297424316, 4.571737766265869, 4.868572235107422, 5.165406703948975, 5.462241172790527, 5.759075164794922, 6.055909633636475, 6.352744102478027, 6.649578094482422, 6.946412563323975, 7.243247032165527, 7.54008150100708, 7.836915969848633, 8.133749961853027, 8.430583953857422, 8.727418899536133, 9.024252891540527, 9.321086883544922, 9.617921829223633]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 11.0, 5.0, 19.0, 22.0, 33.0, 75.0, 99.0, 182.0, 279.0, 419.0, 634.0, 1049.0, 1658.0, 2949.0, 4881.0, 8537.0, 14727.0, 25828.0, 47280.0, 87402.0, 163468.0, 261290.0, 194359.0, 104631.0, 56407.0, 30639.0, 17293.0, 9960.0, 5601.0, 3429.0, 2095.0, 1279.0, 749.0, 479.0, 307.0, 193.0, 101.0, 70.0, 46.0, 24.0, 24.0, 10.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.49169921875, -16.9208984375, -16.35009765625, -15.779296875, -15.20849609375, -14.6376953125, -14.06689453125, -13.49609375, -12.92529296875, -12.3544921875, -11.78369140625, -11.212890625, -10.64208984375, -10.0712890625, -9.50048828125, -8.9296875, -8.35888671875, -7.7880859375, -7.21728515625, -6.646484375, -6.07568359375, -5.5048828125, -4.93408203125, -4.36328125, -3.79248046875, -3.2216796875, -2.65087890625, -2.080078125, -1.50927734375, -0.9384765625, -0.36767578125, 0.203125, 0.77392578125, 1.3447265625, 1.91552734375, 2.486328125, 3.05712890625, 3.6279296875, 4.19873046875, 4.76953125, 5.34033203125, 5.9111328125, 6.48193359375, 7.052734375, 7.62353515625, 8.1943359375, 8.76513671875, 9.3359375, 9.90673828125, 10.4775390625, 11.04833984375, 11.619140625, 12.18994140625, 12.7607421875, 13.33154296875, 13.90234375, 14.47314453125, 15.0439453125, 15.61474609375, 16.185546875, 16.75634765625, 17.3271484375, 17.89794921875, 18.46875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 12.0, 9.0, 10.0, 16.0, 24.0, 22.0, 27.0, 35.0, 35.0, 15.0, 36.0, 46.0, 46.0, 40.0, 44.0, 39.0, 48.0, 45.0, 39.0, 40.0, 49.0, 35.0, 45.0, 34.0, 27.0, 24.0, 25.0, 21.0, 12.0, 18.0, 11.0, 12.0, 4.0, 9.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.065673828125, -9.73291015625, -9.400146484375, -9.0673828125, -8.734619140625, -8.40185546875, -8.069091796875, -7.736328125, -7.403564453125, -7.07080078125, -6.738037109375, -6.4052734375, -6.072509765625, -5.73974609375, -5.406982421875, -5.07421875, -4.741455078125, -4.40869140625, -4.075927734375, -3.7431640625, -3.410400390625, -3.07763671875, -2.744873046875, -2.412109375, -2.079345703125, -1.74658203125, -1.413818359375, -1.0810546875, -0.748291015625, -0.41552734375, -0.082763671875, 0.25, 0.582763671875, 0.91552734375, 1.248291015625, 1.5810546875, 1.913818359375, 2.24658203125, 2.579345703125, 2.912109375, 3.244873046875, 3.57763671875, 3.910400390625, 4.2431640625, 4.575927734375, 4.90869140625, 5.241455078125, 5.57421875, 5.906982421875, 6.23974609375, 6.572509765625, 6.9052734375, 7.238037109375, 7.57080078125, 7.903564453125, 8.236328125, 8.569091796875, 8.90185546875, 9.234619140625, 9.5673828125, 9.900146484375, 10.23291015625, 10.565673828125, 10.8984375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 6.0, 6.0, 7.0, 8.0, 6.0, 14.0, 22.0, 38.0, 50.0, 81.0, 122.0, 175.0, 278.0, 402.0, 639.0, 1018.0, 1637.0, 2646.0, 4541.0, 7525.0, 13721.0, 25395.0, 49484.0, 100307.0, 212716.0, 305634.0, 160262.0, 76556.0, 37930.0, 20392.0, 11075.0, 6220.0, 3673.0, 2208.0, 1381.0, 845.0, 537.0, 340.0, 216.0, 160.0, 93.0, 50.0, 47.0, 34.0, 22.0, 19.0, 7.0, 10.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-20.140625, -19.517333984375, -18.89404296875, -18.270751953125, -17.6474609375, -17.024169921875, -16.40087890625, -15.777587890625, -15.154296875, -14.531005859375, -13.90771484375, -13.284423828125, -12.6611328125, -12.037841796875, -11.41455078125, -10.791259765625, -10.16796875, -9.544677734375, -8.92138671875, -8.298095703125, -7.6748046875, -7.051513671875, -6.42822265625, -5.804931640625, -5.181640625, -4.558349609375, -3.93505859375, -3.311767578125, -2.6884765625, -2.065185546875, -1.44189453125, -0.818603515625, -0.1953125, 0.427978515625, 1.05126953125, 1.674560546875, 2.2978515625, 2.921142578125, 3.54443359375, 4.167724609375, 4.791015625, 5.414306640625, 6.03759765625, 6.660888671875, 7.2841796875, 7.907470703125, 8.53076171875, 9.154052734375, 9.77734375, 10.400634765625, 11.02392578125, 11.647216796875, 12.2705078125, 12.893798828125, 13.51708984375, 14.140380859375, 14.763671875, 15.386962890625, 16.01025390625, 16.633544921875, 17.2568359375, 17.880126953125, 18.50341796875, 19.126708984375, 19.75]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 16.0, 11.0, 20.0, 17.0, 28.0, 24.0, 17.0, 24.0, 26.0, 35.0, 29.0, 34.0, 26.0, 44.0, 44.0, 44.0, 41.0, 46.0, 30.0, 45.0, 43.0, 39.0, 29.0, 35.0, 30.0, 28.0, 31.0, 15.0, 20.0, 26.0, 16.0, 18.0, 5.0, 9.0, 9.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.53228759765625, -6.3067626953125, -6.08123779296875, -5.855712890625, -5.63018798828125, -5.4046630859375, -5.17913818359375, -4.95361328125, -4.72808837890625, -4.5025634765625, -4.27703857421875, -4.051513671875, -3.82598876953125, -3.6004638671875, -3.37493896484375, -3.1494140625, -2.92388916015625, -2.6983642578125, -2.47283935546875, -2.247314453125, -2.02178955078125, -1.7962646484375, -1.57073974609375, -1.34521484375, -1.11968994140625, -0.8941650390625, -0.66864013671875, -0.443115234375, -0.21759033203125, 0.0079345703125, 0.23345947265625, 0.458984375, 0.68450927734375, 0.9100341796875, 1.13555908203125, 1.361083984375, 1.58660888671875, 1.8121337890625, 2.03765869140625, 2.26318359375, 2.48870849609375, 2.7142333984375, 2.93975830078125, 3.165283203125, 3.39080810546875, 3.6163330078125, 3.84185791015625, 4.0673828125, 4.29290771484375, 4.5184326171875, 4.74395751953125, 4.969482421875, 5.19500732421875, 5.4205322265625, 5.64605712890625, 5.87158203125, 6.09710693359375, 6.3226318359375, 6.54815673828125, 6.773681640625, 6.99920654296875, 7.2247314453125, 7.45025634765625, 7.67578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 7.0, 6.0, 12.0, 21.0, 25.0, 37.0, 38.0, 59.0, 97.0, 149.0, 200.0, 347.0, 593.0, 1133.0, 2039.0, 4007.0, 8862.0, 22683.0, 77740.0, 634395.0, 224232.0, 43794.0, 15091.0, 6335.0, 2898.0, 1570.0, 873.0, 509.0, 280.0, 179.0, 98.0, 70.0, 51.0, 35.0, 19.0, 19.0, 10.0, 11.0, 12.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.875, -41.3857421875, -39.896484375, -38.4072265625, -36.91796875, -35.4287109375, -33.939453125, -32.4501953125, -30.9609375, -29.4716796875, -27.982421875, -26.4931640625, -25.00390625, -23.5146484375, -22.025390625, -20.5361328125, -19.046875, -17.5576171875, -16.068359375, -14.5791015625, -13.08984375, -11.6005859375, -10.111328125, -8.6220703125, -7.1328125, -5.6435546875, -4.154296875, -2.6650390625, -1.17578125, 0.3134765625, 1.802734375, 3.2919921875, 4.78125, 6.2705078125, 7.759765625, 9.2490234375, 10.73828125, 12.2275390625, 13.716796875, 15.2060546875, 16.6953125, 18.1845703125, 19.673828125, 21.1630859375, 22.65234375, 24.1416015625, 25.630859375, 27.1201171875, 28.609375, 30.0986328125, 31.587890625, 33.0771484375, 34.56640625, 36.0556640625, 37.544921875, 39.0341796875, 40.5234375, 42.0126953125, 43.501953125, 44.9912109375, 46.48046875, 47.9697265625, 49.458984375, 50.9482421875, 52.4375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 11.0, 8.0, 5.0, 15.0, 17.0, 30.0, 31.0, 45.0, 64.0, 72.0, 113.0, 150.0, 121.0, 80.0, 66.0, 44.0, 39.0, 20.0, 16.0, 16.0, 13.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001186370849609375, -0.0011431872844696045, -0.001100003719329834, -0.0010568201541900635, -0.001013636589050293, -0.0009704530239105225, -0.000927269458770752, -0.0008840858936309814, -0.0008409023284912109, -0.0007977187633514404, -0.0007545351982116699, -0.0007113516330718994, -0.0006681680679321289, -0.0006249845027923584, -0.0005818009376525879, -0.0005386173725128174, -0.0004954338073730469, -0.00045225024223327637, -0.00040906667709350586, -0.00036588311195373535, -0.00032269954681396484, -0.00027951598167419434, -0.00023633241653442383, -0.00019314885139465332, -0.0001499652862548828, -0.0001067817211151123, -6.35981559753418e-05, -2.041459083557129e-05, 2.276897430419922e-05, 6.595253944396973e-05, 0.00010913610458374023, 0.00015231966972351074, 0.00019550323486328125, 0.00023868680000305176, 0.00028187036514282227, 0.0003250539302825928, 0.0003682374954223633, 0.0004114210605621338, 0.0004546046257019043, 0.0004977881908416748, 0.0005409717559814453, 0.0005841553211212158, 0.0006273388862609863, 0.0006705224514007568, 0.0007137060165405273, 0.0007568895816802979, 0.0008000731468200684, 0.0008432567119598389, 0.0008864402770996094, 0.0009296238422393799, 0.0009728074073791504, 0.001015990972518921, 0.0010591745376586914, 0.001102358102798462, 0.0011455416679382324, 0.001188725233078003, 0.0012319087982177734, 0.001275092363357544, 0.0013182759284973145, 0.001361459493637085, 0.0014046430587768555, 0.001447826623916626, 0.0014910101890563965, 0.001534193754196167, 0.0015773773193359375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 10.0, 15.0, 15.0, 17.0, 27.0, 34.0, 50.0, 68.0, 88.0, 110.0, 163.0, 247.0, 394.0, 569.0, 932.0, 1527.0, 2720.0, 5403.0, 12294.0, 37752.0, 223061.0, 658021.0, 69424.0, 19214.0, 7604.0, 3613.0, 1942.0, 1089.0, 658.0, 424.0, 312.0, 199.0, 143.0, 110.0, 70.0, 57.0, 38.0, 24.0, 23.0, 16.0, 11.0, 20.0, 9.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-42.6875, -41.3623046875, -40.037109375, -38.7119140625, -37.38671875, -36.0615234375, -34.736328125, -33.4111328125, -32.0859375, -30.7607421875, -29.435546875, -28.1103515625, -26.78515625, -25.4599609375, -24.134765625, -22.8095703125, -21.484375, -20.1591796875, -18.833984375, -17.5087890625, -16.18359375, -14.8583984375, -13.533203125, -12.2080078125, -10.8828125, -9.5576171875, -8.232421875, -6.9072265625, -5.58203125, -4.2568359375, -2.931640625, -1.6064453125, -0.28125, 1.0439453125, 2.369140625, 3.6943359375, 5.01953125, 6.3447265625, 7.669921875, 8.9951171875, 10.3203125, 11.6455078125, 12.970703125, 14.2958984375, 15.62109375, 16.9462890625, 18.271484375, 19.5966796875, 20.921875, 22.2470703125, 23.572265625, 24.8974609375, 26.22265625, 27.5478515625, 28.873046875, 30.1982421875, 31.5234375, 32.8486328125, 34.173828125, 35.4990234375, 36.82421875, 38.1494140625, 39.474609375, 40.7998046875, 42.125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 17.0, 26.0, 45.0, 74.0, 103.0, 126.0, 146.0, 108.0, 102.0, 72.0, 36.0, 31.0, 23.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.4927978515625, -8.180908203125, -7.8690185546875, -7.55712890625, -7.2452392578125, -6.933349609375, -6.6214599609375, -6.3095703125, -5.9976806640625, -5.685791015625, -5.3739013671875, -5.06201171875, -4.7501220703125, -4.438232421875, -4.1263427734375, -3.814453125, -3.5025634765625, -3.190673828125, -2.8787841796875, -2.56689453125, -2.2550048828125, -1.943115234375, -1.6312255859375, -1.3193359375, -1.0074462890625, -0.695556640625, -0.3836669921875, -0.07177734375, 0.2401123046875, 0.552001953125, 0.8638916015625, 1.17578125, 1.4876708984375, 1.799560546875, 2.1114501953125, 2.42333984375, 2.7352294921875, 3.047119140625, 3.3590087890625, 3.6708984375, 3.9827880859375, 4.294677734375, 4.6065673828125, 4.91845703125, 5.2303466796875, 5.542236328125, 5.8541259765625, 6.166015625, 6.4779052734375, 6.789794921875, 7.1016845703125, 7.41357421875, 7.7254638671875, 8.037353515625, 8.3492431640625, 8.6611328125, 8.9730224609375, 9.284912109375, 9.5968017578125, 9.90869140625, 10.2205810546875, 10.532470703125, 10.8443603515625, 11.15625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 7.0, 6.0, 10.0, 30.0, 51.0, 95.0, 151.0, 252.0, 146.0, 79.0, 53.0, 28.0, 20.0, 17.0, 11.0, 12.0, 7.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.832868576049805, -18.856258392333984, -17.879648208618164, -16.903038024902344, -15.926427841186523, -14.949817657470703, -13.9732084274292, -12.996598243713379, -12.019988059997559, -11.043377876281738, -10.066767692565918, -9.090158462524414, -8.113548278808594, -7.136937618255615, -6.160327911376953, -5.183717727661133, -4.2071075439453125, -3.230497360229492, -2.253887414932251, -1.2772774696350098, -0.30066728591918945, 0.6759428977966309, 1.652552604675293, 2.6291627883911133, 3.6057729721069336, 4.582383155822754, 5.558993339538574, 6.535603046417236, 7.512213230133057, 8.488822937011719, 9.465433120727539, 10.44204330444336, 11.418651580810547, 12.395261764526367, 13.371871948242188, 14.348482131958008, 15.325092315673828, 16.30170249938965, 17.27831268310547, 18.254920959472656, 19.23153305053711, 20.20814323425293, 21.18475341796875, 22.16136360168457, 23.13797378540039, 24.11458396911621, 25.09119415283203, 26.06780242919922, 27.04441261291504, 28.02102279663086, 28.99763298034668, 29.9742431640625, 30.95085334777832, 31.92746353149414, 32.90407180786133, 33.88068389892578, 34.85729217529297, 35.833900451660156, 36.81051254272461, 37.7871208190918, 38.76373291015625, 39.74034118652344, 40.71695327758789, 41.69356155395508, 42.67017364501953]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 2.0, 4.0, 4.0, 11.0, 9.0, 22.0, 13.0, 21.0, 24.0, 21.0, 16.0, 27.0, 20.0, 32.0, 37.0, 31.0, 32.0, 45.0, 37.0, 37.0, 46.0, 41.0, 39.0, 48.0, 33.0, 34.0, 40.0, 33.0, 28.0, 29.0, 17.0, 28.0, 18.0, 20.0, 18.0, 10.0, 17.0, 7.0, 16.0, 8.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.943132400512695, -9.624908447265625, -9.306684494018555, -8.988460540771484, -8.670236587524414, -8.352012634277344, -8.033788681030273, -7.715564250946045, -7.397340297698975, -7.079116344451904, -6.760892391204834, -6.442668437957764, -6.124444007873535, -5.806220054626465, -5.4879961013793945, -5.169772148132324, -4.851548194885254, -4.533324241638184, -4.215100288391113, -3.896876096725464, -3.5786521434783936, -3.2604281902313232, -2.942203998565674, -2.6239800453186035, -2.305756092071533, -1.987532138824463, -1.669308066368103, -1.3510839939117432, -1.0328600406646729, -0.7146360874176025, -0.3964120149612427, -0.07818794250488281, 0.2400369644165039, 0.558260977268219, 0.8764849901199341, 1.194709062576294, 1.5129330158233643, 1.8311569690704346, 2.149381160736084, 2.4676051139831543, 2.7858290672302246, 3.104053020477295, 3.4222769737243652, 3.7405011653900146, 4.058725357055664, 4.376949310302734, 4.695173263549805, 5.013397216796875, 5.331621170043945, 5.649845123291016, 5.968069076538086, 6.286293029785156, 6.604516983032227, 6.922740936279297, 7.240965366363525, 7.559189319610596, 7.877413272857666, 8.195637702941895, 8.513861656188965, 8.832085609436035, 9.150309562683105, 9.468533515930176, 9.786757469177246, 10.104981422424316, 10.423205375671387]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 25.0, 25.0, 40.0, 66.0, 84.0, 145.0, 252.0, 361.0, 521.0, 821.0, 1260.0, 2031.0, 2996.0, 4596.0, 7522.0, 12416.0, 21371.0, 39895.0, 79237.0, 179758.0, 609342.0, 2079330.0, 755067.0, 205157.0, 87872.0, 43628.0, 23415.0, 13371.0, 8288.0, 5105.0, 3459.0, 2131.0, 1504.0, 1032.0, 658.0, 443.0, 325.0, 206.0, 145.0, 107.0, 92.0, 52.0, 45.0, 18.0, 13.0, 13.0, 6.0, 11.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.390625, -13.86865234375, -13.3466796875, -12.82470703125, -12.302734375, -11.78076171875, -11.2587890625, -10.73681640625, -10.21484375, -9.69287109375, -9.1708984375, -8.64892578125, -8.126953125, -7.60498046875, -7.0830078125, -6.56103515625, -6.0390625, -5.51708984375, -4.9951171875, -4.47314453125, -3.951171875, -3.42919921875, -2.9072265625, -2.38525390625, -1.86328125, -1.34130859375, -0.8193359375, -0.29736328125, 0.224609375, 0.74658203125, 1.2685546875, 1.79052734375, 2.3125, 2.83447265625, 3.3564453125, 3.87841796875, 4.400390625, 4.92236328125, 5.4443359375, 5.96630859375, 6.48828125, 7.01025390625, 7.5322265625, 8.05419921875, 8.576171875, 9.09814453125, 9.6201171875, 10.14208984375, 10.6640625, 11.18603515625, 11.7080078125, 12.22998046875, 12.751953125, 13.27392578125, 13.7958984375, 14.31787109375, 14.83984375, 15.36181640625, 15.8837890625, 16.40576171875, 16.927734375, 17.44970703125, 17.9716796875, 18.49365234375, 19.015625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 10.0, 5.0, 8.0, 15.0, 12.0, 19.0, 12.0, 27.0, 36.0, 23.0, 17.0, 30.0, 26.0, 41.0, 33.0, 54.0, 44.0, 46.0, 65.0, 51.0, 36.0, 36.0, 35.0, 42.0, 36.0, 37.0, 31.0, 27.0, 23.0, 20.0, 13.0, 12.0, 19.0, 10.0, 8.0, 11.0, 11.0, 5.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.58203125, -5.38720703125, -5.1923828125, -4.99755859375, -4.802734375, -4.60791015625, -4.4130859375, -4.21826171875, -4.0234375, -3.82861328125, -3.6337890625, -3.43896484375, -3.244140625, -3.04931640625, -2.8544921875, -2.65966796875, -2.46484375, -2.27001953125, -2.0751953125, -1.88037109375, -1.685546875, -1.49072265625, -1.2958984375, -1.10107421875, -0.90625, -0.71142578125, -0.5166015625, -0.32177734375, -0.126953125, 0.06787109375, 0.2626953125, 0.45751953125, 0.65234375, 0.84716796875, 1.0419921875, 1.23681640625, 1.431640625, 1.62646484375, 1.8212890625, 2.01611328125, 2.2109375, 2.40576171875, 2.6005859375, 2.79541015625, 2.990234375, 3.18505859375, 3.3798828125, 3.57470703125, 3.76953125, 3.96435546875, 4.1591796875, 4.35400390625, 4.548828125, 4.74365234375, 4.9384765625, 5.13330078125, 5.328125, 5.52294921875, 5.7177734375, 5.91259765625, 6.107421875, 6.30224609375, 6.4970703125, 6.69189453125, 6.88671875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 11.0, 11.0, 10.0, 9.0, 23.0, 21.0, 44.0, 48.0, 82.0, 107.0, 179.0, 238.0, 399.0, 493.0, 786.0, 1263.0, 1722.0, 3006.0, 4725.0, 7690.0, 13209.0, 23375.0, 43683.0, 90008.0, 213553.0, 634261.0, 1931264.0, 765849.0, 246246.0, 101044.0, 48710.0, 25515.0, 14184.0, 8490.0, 5105.0, 3036.0, 2033.0, 1230.0, 858.0, 598.0, 350.0, 291.0, 166.0, 115.0, 76.0, 42.0, 45.0, 26.0, 14.0, 17.0, 11.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0546875, -12.627685546875, -12.20068359375, -11.773681640625, -11.3466796875, -10.919677734375, -10.49267578125, -10.065673828125, -9.638671875, -9.211669921875, -8.78466796875, -8.357666015625, -7.9306640625, -7.503662109375, -7.07666015625, -6.649658203125, -6.22265625, -5.795654296875, -5.36865234375, -4.941650390625, -4.5146484375, -4.087646484375, -3.66064453125, -3.233642578125, -2.806640625, -2.379638671875, -1.95263671875, -1.525634765625, -1.0986328125, -0.671630859375, -0.24462890625, 0.182373046875, 0.609375, 1.036376953125, 1.46337890625, 1.890380859375, 2.3173828125, 2.744384765625, 3.17138671875, 3.598388671875, 4.025390625, 4.452392578125, 4.87939453125, 5.306396484375, 5.7333984375, 6.160400390625, 6.58740234375, 7.014404296875, 7.44140625, 7.868408203125, 8.29541015625, 8.722412109375, 9.1494140625, 9.576416015625, 10.00341796875, 10.430419921875, 10.857421875, 11.284423828125, 11.71142578125, 12.138427734375, 12.5654296875, 12.992431640625, 13.41943359375, 13.846435546875, 14.2734375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 17.0, 13.0, 20.0, 39.0, 32.0, 45.0, 45.0, 69.0, 98.0, 106.0, 126.0, 163.0, 201.0, 229.0, 280.0, 319.0, 385.0, 314.0, 299.0, 229.0, 200.0, 139.0, 109.0, 110.0, 78.0, 83.0, 56.0, 53.0, 36.0, 39.0, 18.0, 24.0, 16.0, 14.0, 10.0, 4.0, 5.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.48046875, -3.373748779296875, -3.26702880859375, -3.160308837890625, -3.0535888671875, -2.946868896484375, -2.84014892578125, -2.733428955078125, -2.626708984375, -2.519989013671875, -2.41326904296875, -2.306549072265625, -2.1998291015625, -2.093109130859375, -1.98638916015625, -1.879669189453125, -1.77294921875, -1.666229248046875, -1.55950927734375, -1.452789306640625, -1.3460693359375, -1.239349365234375, -1.13262939453125, -1.025909423828125, -0.919189453125, -0.812469482421875, -0.70574951171875, -0.599029541015625, -0.4923095703125, -0.385589599609375, -0.27886962890625, -0.172149658203125, -0.0654296875, 0.041290283203125, 0.14801025390625, 0.254730224609375, 0.3614501953125, 0.468170166015625, 0.57489013671875, 0.681610107421875, 0.788330078125, 0.895050048828125, 1.00177001953125, 1.108489990234375, 1.2152099609375, 1.321929931640625, 1.42864990234375, 1.535369873046875, 1.64208984375, 1.748809814453125, 1.85552978515625, 1.962249755859375, 2.0689697265625, 2.175689697265625, 2.28240966796875, 2.389129638671875, 2.495849609375, 2.602569580078125, 2.70928955078125, 2.816009521484375, 2.9227294921875, 3.029449462890625, 3.13616943359375, 3.242889404296875, 3.349609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 11.0, 11.0, 13.0, 14.0, 16.0, 32.0, 31.0, 41.0, 71.0, 91.0, 151.0, 143.0, 105.0, 72.0, 42.0, 47.0, 31.0, 16.0, 12.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.33967399597168, -9.929840087890625, -9.52000617980957, -9.110173225402832, -8.700339317321777, -8.290505409240723, -7.880671501159668, -7.4708380699157715, -7.061004638671875, -6.65117073059082, -6.241337299346924, -5.831503391265869, -5.421669960021973, -5.011836051940918, -4.602002143859863, -4.192168712615967, -3.782334804534912, -3.3725011348724365, -2.962667465209961, -2.5528335571289062, -2.1430001258850098, -1.733166217803955, -1.3233325481414795, -0.9134988784790039, -0.5036652088165283, -0.09383150935173035, 0.3160021901130676, 0.725835919380188, 1.1356695890426636, 1.5455033779144287, 1.9553370475769043, 2.36517071723938, 2.7750043869018555, 3.184838056564331, 3.5946717262268066, 4.004505634307861, 4.414339065551758, 4.8241729736328125, 5.234006881713867, 5.643840312957764, 6.05367374420166, 6.463507652282715, 6.873341083526611, 7.283174991607666, 7.6930084228515625, 8.102842330932617, 8.512676239013672, 8.922510147094727, 9.332344055175781, 9.742177963256836, 10.15201187133789, 10.561844825744629, 10.971678733825684, 11.381512641906738, 11.791346549987793, 12.201179504394531, 12.611013412475586, 13.02084732055664, 13.430681228637695, 13.840514183044434, 14.250348091125488, 14.660181999206543, 15.070015907287598, 15.479848861694336, 15.88968276977539]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 13.0, 13.0, 14.0, 19.0, 26.0, 30.0, 26.0, 35.0, 25.0, 48.0, 47.0, 36.0, 36.0, 45.0, 51.0, 39.0, 43.0, 42.0, 51.0, 51.0, 32.0, 39.0, 37.0, 22.0, 32.0, 20.0, 21.0, 19.0, 17.0, 13.0, 8.0, 13.0, 8.0, 2.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.224446773529053, -6.994480133056641, -6.7645134925842285, -6.534546852111816, -6.304580211639404, -6.074613571166992, -5.84464693069458, -5.614680290222168, -5.384713649749756, -5.154747009277344, -4.924780368804932, -4.6948137283325195, -4.464847087860107, -4.234880447387695, -4.004913806915283, -3.774947166442871, -3.544980525970459, -3.315013885498047, -3.0850472450256348, -2.8550806045532227, -2.6251139640808105, -2.3951473236083984, -2.1651806831359863, -1.9352140426635742, -1.705247402191162, -1.47528076171875, -1.245314121246338, -1.0153474807739258, -0.7853808403015137, -0.5554141998291016, -0.32544755935668945, -0.09548091888427734, 0.13448524475097656, 0.36445188522338867, 0.5944185256958008, 0.8243851661682129, 1.054351806640625, 1.284318447113037, 1.5142850875854492, 1.7442517280578613, 1.9742183685302734, 2.2041850090026855, 2.4341516494750977, 2.6641182899475098, 2.894084930419922, 3.124051570892334, 3.354018211364746, 3.583984851837158, 3.8139514923095703, 4.043918132781982, 4.2738847732543945, 4.503851413726807, 4.733818054199219, 4.963784694671631, 5.193751335144043, 5.423717975616455, 5.653684616088867, 5.883651256561279, 6.113617897033691, 6.3435845375061035, 6.573551177978516, 6.803517818450928, 7.03348445892334, 7.263451099395752, 7.493417739868164]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 8.0, 8.0, 15.0, 22.0, 31.0, 42.0, 54.0, 75.0, 118.0, 160.0, 197.0, 295.0, 484.0, 649.0, 990.0, 1435.0, 2305.0, 3680.0, 5982.0, 10098.0, 18823.0, 37817.0, 87605.0, 293486.0, 386140.0, 104457.0, 43158.0, 21200.0, 11294.0, 6487.0, 3961.0, 2484.0, 1661.0, 1010.0, 699.0, 468.0, 332.0, 236.0, 161.0, 121.0, 92.0, 58.0, 38.0, 34.0, 18.0, 14.0, 9.0, 9.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.2890625, -10.937255859375, -10.58544921875, -10.233642578125, -9.8818359375, -9.530029296875, -9.17822265625, -8.826416015625, -8.474609375, -8.122802734375, -7.77099609375, -7.419189453125, -7.0673828125, -6.715576171875, -6.36376953125, -6.011962890625, -5.66015625, -5.308349609375, -4.95654296875, -4.604736328125, -4.2529296875, -3.901123046875, -3.54931640625, -3.197509765625, -2.845703125, -2.493896484375, -2.14208984375, -1.790283203125, -1.4384765625, -1.086669921875, -0.73486328125, -0.383056640625, -0.03125, 0.320556640625, 0.67236328125, 1.024169921875, 1.3759765625, 1.727783203125, 2.07958984375, 2.431396484375, 2.783203125, 3.135009765625, 3.48681640625, 3.838623046875, 4.1904296875, 4.542236328125, 4.89404296875, 5.245849609375, 5.59765625, 5.949462890625, 6.30126953125, 6.653076171875, 7.0048828125, 7.356689453125, 7.70849609375, 8.060302734375, 8.412109375, 8.763916015625, 9.11572265625, 9.467529296875, 9.8193359375, 10.171142578125, 10.52294921875, 10.874755859375, 11.2265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 4.0, 10.0, 6.0, 7.0, 15.0, 21.0, 18.0, 19.0, 27.0, 28.0, 24.0, 37.0, 40.0, 40.0, 41.0, 35.0, 46.0, 39.0, 39.0, 41.0, 44.0, 45.0, 48.0, 44.0, 34.0, 34.0, 30.0, 22.0, 24.0, 13.0, 26.0, 18.0, 14.0, 14.0, 10.0, 13.0, 10.0, 8.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-7.62890625, -7.41058349609375, -7.1922607421875, -6.97393798828125, -6.755615234375, -6.53729248046875, -6.3189697265625, -6.10064697265625, -5.88232421875, -5.66400146484375, -5.4456787109375, -5.22735595703125, -5.009033203125, -4.79071044921875, -4.5723876953125, -4.35406494140625, -4.1357421875, -3.91741943359375, -3.6990966796875, -3.48077392578125, -3.262451171875, -3.04412841796875, -2.8258056640625, -2.60748291015625, -2.38916015625, -2.17083740234375, -1.9525146484375, -1.73419189453125, -1.515869140625, -1.29754638671875, -1.0792236328125, -0.86090087890625, -0.642578125, -0.42425537109375, -0.2059326171875, 0.01239013671875, 0.230712890625, 0.44903564453125, 0.6673583984375, 0.88568115234375, 1.10400390625, 1.32232666015625, 1.5406494140625, 1.75897216796875, 1.977294921875, 2.19561767578125, 2.4139404296875, 2.63226318359375, 2.8505859375, 3.06890869140625, 3.2872314453125, 3.50555419921875, 3.723876953125, 3.94219970703125, 4.1605224609375, 4.37884521484375, 4.59716796875, 4.81549072265625, 5.0338134765625, 5.25213623046875, 5.470458984375, 5.68878173828125, 5.9071044921875, 6.12542724609375, 6.34375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 17.0, 15.0, 11.0, 21.0, 27.0, 42.0, 51.0, 76.0, 119.0, 151.0, 214.0, 317.0, 418.0, 723.0, 1034.0, 1720.0, 2860.0, 5598.0, 11496.0, 31428.0, 279446.0, 645453.0, 39282.0, 13173.0, 6137.0, 3307.0, 1830.0, 1206.0, 709.0, 490.0, 342.0, 236.0, 160.0, 134.0, 99.0, 40.0, 41.0, 43.0, 25.0, 15.0, 16.0, 11.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.296875, -23.5625, -22.828125, -22.09375, -21.359375, -20.625, -19.890625, -19.15625, -18.421875, -17.6875, -16.953125, -16.21875, -15.484375, -14.75, -14.015625, -13.28125, -12.546875, -11.8125, -11.078125, -10.34375, -9.609375, -8.875, -8.140625, -7.40625, -6.671875, -5.9375, -5.203125, -4.46875, -3.734375, -3.0, -2.265625, -1.53125, -0.796875, -0.0625, 0.671875, 1.40625, 2.140625, 2.875, 3.609375, 4.34375, 5.078125, 5.8125, 6.546875, 7.28125, 8.015625, 8.75, 9.484375, 10.21875, 10.953125, 11.6875, 12.421875, 13.15625, 13.890625, 14.625, 15.359375, 16.09375, 16.828125, 17.5625, 18.296875, 19.03125, 19.765625, 20.5, 21.234375, 21.96875, 22.703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 5.0, 2.0, 16.0, 17.0, 8.0, 20.0, 20.0, 30.0, 32.0, 36.0, 42.0, 51.0, 63.0, 48.0, 50.0, 54.0, 61.0, 54.0, 74.0, 44.0, 41.0, 45.0, 35.0, 20.0, 26.0, 15.0, 15.0, 14.0, 15.0, 12.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.01953125, -6.81781005859375, -6.6160888671875, -6.41436767578125, -6.212646484375, -6.01092529296875, -5.8092041015625, -5.60748291015625, -5.40576171875, -5.20404052734375, -5.0023193359375, -4.80059814453125, -4.598876953125, -4.39715576171875, -4.1954345703125, -3.99371337890625, -3.7919921875, -3.59027099609375, -3.3885498046875, -3.18682861328125, -2.985107421875, -2.78338623046875, -2.5816650390625, -2.37994384765625, -2.17822265625, -1.97650146484375, -1.7747802734375, -1.57305908203125, -1.371337890625, -1.16961669921875, -0.9678955078125, -0.76617431640625, -0.564453125, -0.36273193359375, -0.1610107421875, 0.04071044921875, 0.242431640625, 0.44415283203125, 0.6458740234375, 0.84759521484375, 1.04931640625, 1.25103759765625, 1.4527587890625, 1.65447998046875, 1.856201171875, 2.05792236328125, 2.2596435546875, 2.46136474609375, 2.6630859375, 2.86480712890625, 3.0665283203125, 3.26824951171875, 3.469970703125, 3.67169189453125, 3.8734130859375, 4.07513427734375, 4.27685546875, 4.47857666015625, 4.6802978515625, 4.88201904296875, 5.083740234375, 5.28546142578125, 5.4871826171875, 5.68890380859375, 5.890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 9.0, 7.0, 13.0, 15.0, 15.0, 27.0, 34.0, 40.0, 71.0, 70.0, 133.0, 146.0, 230.0, 351.0, 438.0, 618.0, 886.0, 1212.0, 1741.0, 2670.0, 4253.0, 6984.0, 12766.0, 25435.0, 68367.0, 590181.0, 235765.0, 47886.0, 20418.0, 10543.0, 5883.0, 3644.0, 2310.0, 1573.0, 1111.0, 745.0, 556.0, 398.0, 249.0, 212.0, 169.0, 130.0, 70.0, 51.0, 50.0, 35.0, 19.0, 9.0, 5.0, 3.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.96484375, -3.8363037109375, -3.707763671875, -3.5792236328125, -3.45068359375, -3.3221435546875, -3.193603515625, -3.0650634765625, -2.9365234375, -2.8079833984375, -2.679443359375, -2.5509033203125, -2.42236328125, -2.2938232421875, -2.165283203125, -2.0367431640625, -1.908203125, -1.7796630859375, -1.651123046875, -1.5225830078125, -1.39404296875, -1.2655029296875, -1.136962890625, -1.0084228515625, -0.8798828125, -0.7513427734375, -0.622802734375, -0.4942626953125, -0.36572265625, -0.2371826171875, -0.108642578125, 0.0198974609375, 0.1484375, 0.2769775390625, 0.405517578125, 0.5340576171875, 0.66259765625, 0.7911376953125, 0.919677734375, 1.0482177734375, 1.1767578125, 1.3052978515625, 1.433837890625, 1.5623779296875, 1.69091796875, 1.8194580078125, 1.947998046875, 2.0765380859375, 2.205078125, 2.3336181640625, 2.462158203125, 2.5906982421875, 2.71923828125, 2.8477783203125, 2.976318359375, 3.1048583984375, 3.2333984375, 3.3619384765625, 3.490478515625, 3.6190185546875, 3.74755859375, 3.8760986328125, 4.004638671875, 4.1331787109375, 4.26171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 5.0, 9.0, 7.0, 6.0, 14.0, 16.0, 21.0, 31.0, 26.0, 54.0, 64.0, 119.0, 105.0, 120.0, 84.0, 70.0, 71.0, 43.0, 35.0, 17.0, 20.0, 9.0, 12.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.0001408495008945465, -0.00013578683137893677, -0.00013072416186332703, -0.00012566149234771729, -0.00012059882283210754, -0.0001155361533164978, -0.00011047348380088806, -0.00010541081428527832, -0.00010034814476966858, -9.528547525405884e-05, -9.02228057384491e-05, -8.516013622283936e-05, -8.009746670722961e-05, -7.503479719161987e-05, -6.997212767601013e-05, -6.490945816040039e-05, -5.984678864479065e-05, -5.478411912918091e-05, -4.972144961357117e-05, -4.4658780097961426e-05, -3.9596110582351685e-05, -3.453344106674194e-05, -2.9470771551132202e-05, -2.440810203552246e-05, -1.934543251991272e-05, -1.4282763004302979e-05, -9.220093488693237e-06, -4.157423973083496e-06, 9.052455425262451e-07, 5.967915058135986e-06, 1.1030584573745728e-05, 1.609325408935547e-05, 2.115592360496521e-05, 2.621859312057495e-05, 3.128126263618469e-05, 3.6343932151794434e-05, 4.1406601667404175e-05, 4.6469271183013916e-05, 5.153194069862366e-05, 5.65946102142334e-05, 6.165727972984314e-05, 6.671994924545288e-05, 7.178261876106262e-05, 7.684528827667236e-05, 8.19079577922821e-05, 8.697062730789185e-05, 9.203329682350159e-05, 9.709596633911133e-05, 0.00010215863585472107, 0.00010722130537033081, 0.00011228397488594055, 0.00011734664440155029, 0.00012240931391716003, 0.00012747198343276978, 0.00013253465294837952, 0.00013759732246398926, 0.000142659991979599, 0.00014772266149520874, 0.00015278533101081848, 0.00015784800052642822, 0.00016291067004203796, 0.0001679733395576477, 0.00017303600907325745, 0.0001780986785888672]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 14.0, 18.0, 29.0, 39.0, 62.0, 94.0, 166.0, 254.0, 398.0, 649.0, 1065.0, 1696.0, 3011.0, 5824.0, 12082.0, 28608.0, 92836.0, 623794.0, 198155.0, 45032.0, 17015.0, 7999.0, 4180.0, 2185.0, 1230.0, 793.0, 458.0, 307.0, 187.0, 120.0, 67.0, 52.0, 38.0, 25.0, 20.0, 14.0, 11.0, 6.0, 4.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3359375, -5.1728515625, -5.009765625, -4.8466796875, -4.68359375, -4.5205078125, -4.357421875, -4.1943359375, -4.03125, -3.8681640625, -3.705078125, -3.5419921875, -3.37890625, -3.2158203125, -3.052734375, -2.8896484375, -2.7265625, -2.5634765625, -2.400390625, -2.2373046875, -2.07421875, -1.9111328125, -1.748046875, -1.5849609375, -1.421875, -1.2587890625, -1.095703125, -0.9326171875, -0.76953125, -0.6064453125, -0.443359375, -0.2802734375, -0.1171875, 0.0458984375, 0.208984375, 0.3720703125, 0.53515625, 0.6982421875, 0.861328125, 1.0244140625, 1.1875, 1.3505859375, 1.513671875, 1.6767578125, 1.83984375, 2.0029296875, 2.166015625, 2.3291015625, 2.4921875, 2.6552734375, 2.818359375, 2.9814453125, 3.14453125, 3.3076171875, 3.470703125, 3.6337890625, 3.796875, 3.9599609375, 4.123046875, 4.2861328125, 4.44921875, 4.6123046875, 4.775390625, 4.9384765625, 5.1015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 2.0, 2.0, 6.0, 7.0, 23.0, 28.0, 32.0, 56.0, 74.0, 128.0, 170.0, 154.0, 102.0, 59.0, 29.0, 27.0, 17.0, 12.0, 18.0, 8.0, 11.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1720428466796875, -1.135101318359375, -1.0981597900390625, -1.06121826171875, -1.0242767333984375, -0.987335205078125, -0.9503936767578125, -0.9134521484375, -0.8765106201171875, -0.839569091796875, -0.8026275634765625, -0.76568603515625, -0.7287445068359375, -0.691802978515625, -0.6548614501953125, -0.617919921875, -0.5809783935546875, -0.544036865234375, -0.5070953369140625, -0.47015380859375, -0.4332122802734375, -0.396270751953125, -0.3593292236328125, -0.3223876953125, -0.2854461669921875, -0.248504638671875, -0.2115631103515625, -0.17462158203125, -0.1376800537109375, -0.100738525390625, -0.0637969970703125, -0.02685546875, 0.0100860595703125, 0.047027587890625, 0.0839691162109375, 0.12091064453125, 0.1578521728515625, 0.194793701171875, 0.2317352294921875, 0.2686767578125, 0.3056182861328125, 0.342559814453125, 0.3795013427734375, 0.41644287109375, 0.4533843994140625, 0.490325927734375, 0.5272674560546875, 0.564208984375, 0.6011505126953125, 0.638092041015625, 0.6750335693359375, 0.71197509765625, 0.7489166259765625, 0.785858154296875, 0.8227996826171875, 0.8597412109375, 0.8966827392578125, 0.933624267578125, 0.9705657958984375, 1.00750732421875, 1.0444488525390625, 1.081390380859375, 1.1183319091796875, 1.1552734375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 15.0, 7.0, 17.0, 20.0, 27.0, 31.0, 51.0, 84.0, 113.0, 166.0, 136.0, 80.0, 75.0, 48.0, 27.0, 25.0, 14.0, 12.0, 16.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.902300834655762, -8.493037223815918, -8.083773612976074, -7.674509525299072, -7.2652459144592285, -6.855982303619385, -6.446718215942383, -6.037454605102539, -5.628190994262695, -5.218927383422852, -4.809663772583008, -4.400399684906006, -3.991136074066162, -3.5818724632263184, -3.1726086139678955, -2.7633447647094727, -2.354081153869629, -1.9448174238204956, -1.5355536937713623, -1.126289963722229, -0.7170262336730957, -0.30776262283325195, 0.1015012264251709, 0.5107650756835938, 0.9200286865234375, 1.3292924165725708, 1.738556146621704, 2.147819995880127, 2.5570836067199707, 2.9663472175598145, 3.3756110668182373, 3.78487491607666, 4.1941375732421875, 4.603401184082031, 5.012664794921875, 5.421928882598877, 5.831192493438721, 6.2404561042785645, 6.649720191955566, 7.05898380279541, 7.468247413635254, 7.877511024475098, 8.286774635314941, 8.696038246154785, 9.105302810668945, 9.514566421508789, 9.923830032348633, 10.333093643188477, 10.74235725402832, 11.151620864868164, 11.560884475708008, 11.970148086547852, 12.379411697387695, 12.788675308227539, 13.1979398727417, 13.607203483581543, 14.016467094421387, 14.42573070526123, 14.834994316101074, 15.244257926940918, 15.653522491455078, 16.062786102294922, 16.472049713134766, 16.88131332397461, 17.290576934814453]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 18.0, 14.0, 17.0, 27.0, 26.0, 28.0, 45.0, 28.0, 45.0, 51.0, 31.0, 42.0, 43.0, 52.0, 40.0, 41.0, 44.0, 51.0, 39.0, 40.0, 38.0, 30.0, 36.0, 21.0, 18.0, 24.0, 16.0, 19.0, 10.0, 8.0, 9.0, 8.0, 2.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.872030258178711, -6.651519298553467, -6.4310078620910645, -6.21049690246582, -5.989985466003418, -5.769474506378174, -5.54896354675293, -5.328452110290527, -5.107941150665283, -4.887430191040039, -4.666918754577637, -4.446407794952393, -4.225896835327148, -4.005385398864746, -3.784874439239502, -3.5643632411956787, -3.3438520431518555, -3.1233408451080322, -2.902829647064209, -2.682318687438965, -2.4618074893951416, -2.2412962913513184, -2.020785331726074, -1.800274133682251, -1.5797629356384277, -1.3592517375946045, -1.1387406587600708, -0.9182295203208923, -0.6977183818817139, -0.4772071838378906, -0.25669610500335693, -0.03618502616882324, 0.1843266487121582, 0.40483778715133667, 0.6253489255905151, 0.8458600640296936, 1.066371202468872, 1.2868824005126953, 1.507393479347229, 1.7279045581817627, 1.948415756225586, 2.168926954269409, 2.3894381523132324, 2.6099491119384766, 2.8304603099823, 3.050971508026123, 3.271482467651367, 3.4919936656951904, 3.7125048637390137, 3.933016061782837, 4.15352725982666, 4.374038219451904, 4.594549179077148, 4.815060615539551, 5.035571575164795, 5.256082534790039, 5.476593971252441, 5.6971049308776855, 5.917616367340088, 6.138127326965332, 6.358638763427734, 6.5791497230529785, 6.799660682678223, 7.020172119140625, 7.240683078765869]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 8.0, 17.0, 15.0, 23.0, 39.0, 55.0, 74.0, 123.0, 141.0, 236.0, 329.0, 485.0, 696.0, 1045.0, 1679.0, 2440.0, 3942.0, 6431.0, 10530.0, 18086.0, 31305.0, 56133.0, 103250.0, 199925.0, 267994.0, 154507.0, 80975.0, 44524.0, 25168.0, 14735.0, 8747.0, 5343.0, 3293.0, 2127.0, 1314.0, 901.0, 572.0, 404.0, 286.0, 180.0, 140.0, 104.0, 65.0, 44.0, 32.0, 34.0, 26.0, 13.0, 12.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.7427978515625, -10.399658203125, -10.0565185546875, -9.71337890625, -9.3702392578125, -9.027099609375, -8.6839599609375, -8.3408203125, -7.9976806640625, -7.654541015625, -7.3114013671875, -6.96826171875, -6.6251220703125, -6.281982421875, -5.9388427734375, -5.595703125, -5.2525634765625, -4.909423828125, -4.5662841796875, -4.22314453125, -3.8800048828125, -3.536865234375, -3.1937255859375, -2.8505859375, -2.5074462890625, -2.164306640625, -1.8211669921875, -1.47802734375, -1.1348876953125, -0.791748046875, -0.4486083984375, -0.10546875, 0.2376708984375, 0.580810546875, 0.9239501953125, 1.26708984375, 1.6102294921875, 1.953369140625, 2.2965087890625, 2.6396484375, 2.9827880859375, 3.325927734375, 3.6690673828125, 4.01220703125, 4.3553466796875, 4.698486328125, 5.0416259765625, 5.384765625, 5.7279052734375, 6.071044921875, 6.4141845703125, 6.75732421875, 7.1004638671875, 7.443603515625, 7.7867431640625, 8.1298828125, 8.4730224609375, 8.816162109375, 9.1593017578125, 9.50244140625, 9.8455810546875, 10.188720703125, 10.5318603515625, 10.875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 10.0, 10.0, 10.0, 15.0, 14.0, 20.0, 33.0, 31.0, 30.0, 34.0, 39.0, 33.0, 29.0, 29.0, 41.0, 44.0, 49.0, 38.0, 41.0, 41.0, 36.0, 40.0, 30.0, 28.0, 35.0, 25.0, 30.0, 13.0, 24.0, 21.0, 15.0, 10.0, 14.0, 15.0, 11.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-5.1015625, -4.933349609375, -4.76513671875, -4.596923828125, -4.4287109375, -4.260498046875, -4.09228515625, -3.924072265625, -3.755859375, -3.587646484375, -3.41943359375, -3.251220703125, -3.0830078125, -2.914794921875, -2.74658203125, -2.578369140625, -2.41015625, -2.241943359375, -2.07373046875, -1.905517578125, -1.7373046875, -1.569091796875, -1.40087890625, -1.232666015625, -1.064453125, -0.896240234375, -0.72802734375, -0.559814453125, -0.3916015625, -0.223388671875, -0.05517578125, 0.113037109375, 0.28125, 0.449462890625, 0.61767578125, 0.785888671875, 0.9541015625, 1.122314453125, 1.29052734375, 1.458740234375, 1.626953125, 1.795166015625, 1.96337890625, 2.131591796875, 2.2998046875, 2.468017578125, 2.63623046875, 2.804443359375, 2.97265625, 3.140869140625, 3.30908203125, 3.477294921875, 3.6455078125, 3.813720703125, 3.98193359375, 4.150146484375, 4.318359375, 4.486572265625, 4.65478515625, 4.822998046875, 4.9912109375, 5.159423828125, 5.32763671875, 5.495849609375, 5.6640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 11.0, 18.0, 14.0, 34.0, 32.0, 41.0, 64.0, 88.0, 129.0, 181.0, 264.0, 364.0, 542.0, 853.0, 1293.0, 1999.0, 3331.0, 5845.0, 10546.0, 18626.0, 36097.0, 71298.0, 155039.0, 300670.0, 227399.0, 104043.0, 50388.0, 25960.0, 13745.0, 7878.0, 4440.0, 2550.0, 1540.0, 1068.0, 665.0, 450.0, 308.0, 211.0, 139.0, 116.0, 73.0, 48.0, 31.0, 22.0, 24.0, 25.0, 16.0, 6.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.1328125, -10.770751953125, -10.40869140625, -10.046630859375, -9.6845703125, -9.322509765625, -8.96044921875, -8.598388671875, -8.236328125, -7.874267578125, -7.51220703125, -7.150146484375, -6.7880859375, -6.426025390625, -6.06396484375, -5.701904296875, -5.33984375, -4.977783203125, -4.61572265625, -4.253662109375, -3.8916015625, -3.529541015625, -3.16748046875, -2.805419921875, -2.443359375, -2.081298828125, -1.71923828125, -1.357177734375, -0.9951171875, -0.633056640625, -0.27099609375, 0.091064453125, 0.453125, 0.815185546875, 1.17724609375, 1.539306640625, 1.9013671875, 2.263427734375, 2.62548828125, 2.987548828125, 3.349609375, 3.711669921875, 4.07373046875, 4.435791015625, 4.7978515625, 5.159912109375, 5.52197265625, 5.884033203125, 6.24609375, 6.608154296875, 6.97021484375, 7.332275390625, 7.6943359375, 8.056396484375, 8.41845703125, 8.780517578125, 9.142578125, 9.504638671875, 9.86669921875, 10.228759765625, 10.5908203125, 10.952880859375, 11.31494140625, 11.677001953125, 12.0390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 13.0, 4.0, 11.0, 4.0, 8.0, 10.0, 12.0, 24.0, 16.0, 22.0, 19.0, 19.0, 23.0, 37.0, 34.0, 38.0, 29.0, 43.0, 42.0, 38.0, 47.0, 46.0, 41.0, 46.0, 31.0, 40.0, 32.0, 50.0, 33.0, 19.0, 30.0, 21.0, 15.0, 21.0, 15.0, 11.0, 10.0, 9.0, 9.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.71484375, -3.597900390625, -3.48095703125, -3.364013671875, -3.2470703125, -3.130126953125, -3.01318359375, -2.896240234375, -2.779296875, -2.662353515625, -2.54541015625, -2.428466796875, -2.3115234375, -2.194580078125, -2.07763671875, -1.960693359375, -1.84375, -1.726806640625, -1.60986328125, -1.492919921875, -1.3759765625, -1.259033203125, -1.14208984375, -1.025146484375, -0.908203125, -0.791259765625, -0.67431640625, -0.557373046875, -0.4404296875, -0.323486328125, -0.20654296875, -0.089599609375, 0.02734375, 0.144287109375, 0.26123046875, 0.378173828125, 0.4951171875, 0.612060546875, 0.72900390625, 0.845947265625, 0.962890625, 1.079833984375, 1.19677734375, 1.313720703125, 1.4306640625, 1.547607421875, 1.66455078125, 1.781494140625, 1.8984375, 2.015380859375, 2.13232421875, 2.249267578125, 2.3662109375, 2.483154296875, 2.60009765625, 2.717041015625, 2.833984375, 2.950927734375, 3.06787109375, 3.184814453125, 3.3017578125, 3.418701171875, 3.53564453125, 3.652587890625, 3.76953125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 13.0, 12.0, 15.0, 20.0, 30.0, 43.0, 73.0, 95.0, 111.0, 166.0, 234.0, 388.0, 507.0, 755.0, 1236.0, 1969.0, 3330.0, 6306.0, 13720.0, 35796.0, 150316.0, 704587.0, 81422.0, 24609.0, 10168.0, 5060.0, 2807.0, 1587.0, 1011.0, 655.0, 441.0, 302.0, 219.0, 147.0, 100.0, 77.0, 58.0, 37.0, 32.0, 25.0, 21.0, 11.0, 3.0, 12.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.25, -17.71826171875, -17.1865234375, -16.65478515625, -16.123046875, -15.59130859375, -15.0595703125, -14.52783203125, -13.99609375, -13.46435546875, -12.9326171875, -12.40087890625, -11.869140625, -11.33740234375, -10.8056640625, -10.27392578125, -9.7421875, -9.21044921875, -8.6787109375, -8.14697265625, -7.615234375, -7.08349609375, -6.5517578125, -6.02001953125, -5.48828125, -4.95654296875, -4.4248046875, -3.89306640625, -3.361328125, -2.82958984375, -2.2978515625, -1.76611328125, -1.234375, -0.70263671875, -0.1708984375, 0.36083984375, 0.892578125, 1.42431640625, 1.9560546875, 2.48779296875, 3.01953125, 3.55126953125, 4.0830078125, 4.61474609375, 5.146484375, 5.67822265625, 6.2099609375, 6.74169921875, 7.2734375, 7.80517578125, 8.3369140625, 8.86865234375, 9.400390625, 9.93212890625, 10.4638671875, 10.99560546875, 11.52734375, 12.05908203125, 12.5908203125, 13.12255859375, 13.654296875, 14.18603515625, 14.7177734375, 15.24951171875, 15.78125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 13.0, 13.0, 9.0, 17.0, 28.0, 28.0, 42.0, 57.0, 88.0, 127.0, 159.0, 110.0, 71.0, 48.0, 39.0, 32.0, 21.0, 19.0, 24.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006008148193359375, -0.0005842819809913635, -0.0005677491426467896, -0.0005512163043022156, -0.0005346834659576416, -0.0005181506276130676, -0.0005016177892684937, -0.0004850849509239197, -0.0004685521125793457, -0.00045201927423477173, -0.00043548643589019775, -0.0004189535975456238, -0.0004024207592010498, -0.00038588792085647583, -0.00036935508251190186, -0.0003528222441673279, -0.0003362894058227539, -0.00031975656747817993, -0.00030322372913360596, -0.000286690890789032, -0.000270158052444458, -0.00025362521409988403, -0.00023709237575531006, -0.00022055953741073608, -0.0002040266990661621, -0.00018749386072158813, -0.00017096102237701416, -0.00015442818403244019, -0.0001378953456878662, -0.00012136250734329224, -0.00010482966899871826, -8.829683065414429e-05, -7.176399230957031e-05, -5.523115396499634e-05, -3.869831562042236e-05, -2.216547727584839e-05, -5.632638931274414e-06, 1.090019941329956e-05, 2.7433037757873535e-05, 4.396587610244751e-05, 6.0498714447021484e-05, 7.703155279159546e-05, 9.356439113616943e-05, 0.00011009722948074341, 0.00012663006782531738, 0.00014316290616989136, 0.00015969574451446533, 0.0001762285828590393, 0.00019276142120361328, 0.00020929425954818726, 0.00022582709789276123, 0.0002423599362373352, 0.0002588927745819092, 0.00027542561292648315, 0.00029195845127105713, 0.0003084912896156311, 0.0003250241279602051, 0.00034155696630477905, 0.00035808980464935303, 0.000374622642993927, 0.000391155481338501, 0.00040768831968307495, 0.0004242211580276489, 0.0004407539963722229, 0.0004572868347167969]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 5.0, 10.0, 17.0, 12.0, 19.0, 37.0, 38.0, 67.0, 84.0, 108.0, 151.0, 244.0, 291.0, 398.0, 618.0, 889.0, 1366.0, 2024.0, 3263.0, 5738.0, 11132.0, 27406.0, 104196.0, 736967.0, 100635.0, 26631.0, 11155.0, 5501.0, 3137.0, 2036.0, 1341.0, 896.0, 610.0, 422.0, 292.0, 214.0, 166.0, 125.0, 77.0, 55.0, 49.0, 35.0, 22.0, 16.0, 16.0, 11.0, 8.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3515625, -12.8988037109375, -12.446044921875, -11.9932861328125, -11.54052734375, -11.0877685546875, -10.635009765625, -10.1822509765625, -9.7294921875, -9.2767333984375, -8.823974609375, -8.3712158203125, -7.91845703125, -7.4656982421875, -7.012939453125, -6.5601806640625, -6.107421875, -5.6546630859375, -5.201904296875, -4.7491455078125, -4.29638671875, -3.8436279296875, -3.390869140625, -2.9381103515625, -2.4853515625, -2.0325927734375, -1.579833984375, -1.1270751953125, -0.67431640625, -0.2215576171875, 0.231201171875, 0.6839599609375, 1.13671875, 1.5894775390625, 2.042236328125, 2.4949951171875, 2.94775390625, 3.4005126953125, 3.853271484375, 4.3060302734375, 4.7587890625, 5.2115478515625, 5.664306640625, 6.1170654296875, 6.56982421875, 7.0225830078125, 7.475341796875, 7.9281005859375, 8.380859375, 8.8336181640625, 9.286376953125, 9.7391357421875, 10.19189453125, 10.6446533203125, 11.097412109375, 11.5501708984375, 12.0029296875, 12.4556884765625, 12.908447265625, 13.3612060546875, 13.81396484375, 14.2667236328125, 14.719482421875, 15.1722412109375, 15.625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 7.0, 10.0, 12.0, 21.0, 25.0, 29.0, 42.0, 59.0, 85.0, 254.0, 145.0, 81.0, 52.0, 43.0, 32.0, 17.0, 17.0, 5.0, 9.0, 6.0, 3.0, 2.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.748046875, -3.640716552734375, -3.53338623046875, -3.426055908203125, -3.3187255859375, -3.211395263671875, -3.10406494140625, -2.996734619140625, -2.889404296875, -2.782073974609375, -2.67474365234375, -2.567413330078125, -2.4600830078125, -2.352752685546875, -2.24542236328125, -2.138092041015625, -2.03076171875, -1.923431396484375, -1.81610107421875, -1.708770751953125, -1.6014404296875, -1.494110107421875, -1.38677978515625, -1.279449462890625, -1.172119140625, -1.064788818359375, -0.95745849609375, -0.850128173828125, -0.7427978515625, -0.635467529296875, -0.52813720703125, -0.420806884765625, -0.3134765625, -0.206146240234375, -0.09881591796875, 0.008514404296875, 0.1158447265625, 0.223175048828125, 0.33050537109375, 0.437835693359375, 0.545166015625, 0.652496337890625, 0.75982666015625, 0.867156982421875, 0.9744873046875, 1.081817626953125, 1.18914794921875, 1.296478271484375, 1.40380859375, 1.511138916015625, 1.61846923828125, 1.725799560546875, 1.8331298828125, 1.940460205078125, 2.04779052734375, 2.155120849609375, 2.262451171875, 2.369781494140625, 2.47711181640625, 2.584442138671875, 2.6917724609375, 2.799102783203125, 2.90643310546875, 3.013763427734375, 3.12109375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 2.0, 9.0, 8.0, 9.0, 7.0, 17.0, 25.0, 60.0, 84.0, 102.0, 167.0, 135.0, 97.0, 69.0, 59.0, 40.0, 27.0, 15.0, 13.0, 9.0, 8.0, 5.0, 7.0, 3.0, 2.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.680816650390625, -6.3064093589782715, -5.932002067565918, -5.557595252990723, -5.183187961578369, -4.808780670166016, -4.43437385559082, -4.059966564178467, -3.6855592727661133, -3.3111519813537598, -2.9367449283599854, -2.562337875366211, -2.1879305839538574, -1.8135234117507935, -1.4391162395477295, -1.064709186553955, -0.6903018951416016, -0.3158947229385376, 0.05851244926452637, 0.43291962146759033, 0.8073267936706543, 1.1817339658737183, 1.5561411380767822, 1.9305481910705566, 2.30495548248291, 2.6793627738952637, 3.053769826889038, 3.4281768798828125, 3.802584171295166, 4.1769914627075195, 4.551398277282715, 4.925805568695068, 5.300212860107422, 5.674620151519775, 6.049027442932129, 6.423434257507324, 6.797841548919678, 7.172248840332031, 7.546655654907227, 7.92106294631958, 8.295470237731934, 8.669877052307129, 9.04428482055664, 9.418691635131836, 9.793098449707031, 10.167506217956543, 10.541913032531738, 10.91632080078125, 11.290727615356445, 11.66513442993164, 12.039542198181152, 12.413949012756348, 12.78835678100586, 13.162763595581055, 13.53717041015625, 13.911577224731445, 14.285984992980957, 14.660391807556152, 15.034799575805664, 15.40920639038086, 15.783613204956055, 16.15802001953125, 16.532428741455078, 16.906835556030273, 17.28124237060547]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 9.0, 11.0, 15.0, 17.0, 15.0, 22.0, 26.0, 27.0, 34.0, 35.0, 40.0, 45.0, 49.0, 45.0, 44.0, 54.0, 57.0, 48.0, 43.0, 39.0, 40.0, 39.0, 38.0, 27.0, 29.0, 24.0, 20.0, 16.0, 15.0, 15.0, 3.0, 20.0, 12.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.094730854034424, -6.886653900146484, -6.678576946258545, -6.4704999923706055, -6.262423038482666, -6.054346084594727, -5.846269130706787, -5.638192176818848, -5.430115222930908, -5.222038269042969, -5.013961315155029, -4.80588436126709, -4.59780740737915, -4.389730453491211, -4.1816534996032715, -3.973576545715332, -3.7654998302459717, -3.5574228763580322, -3.3493459224700928, -3.1412689685821533, -2.933192014694214, -2.7251152992248535, -2.517038345336914, -2.3089613914489746, -2.100884437561035, -1.8928074836730957, -1.6847305297851562, -1.4766535758972168, -1.2685766220092773, -1.0604997873306274, -0.852422833442688, -0.6443458795547485, -0.43626880645751953, -0.22819186747074127, -0.020114928483963013, 0.18796199560165405, 0.3960389494895935, 0.6041158437728882, 0.8121927976608276, 1.020269751548767, 1.2283467054367065, 1.436423659324646, 1.6445006132125854, 1.8525774478912354, 2.060654401779175, 2.2687313556671143, 2.4768083095550537, 2.684885263442993, 2.8929622173309326, 3.101039171218872, 3.3091161251068115, 3.517193078994751, 3.7252700328826904, 3.933346748352051, 4.14142370223999, 4.34950065612793, 4.557577610015869, 4.765654563903809, 4.973731517791748, 5.1818084716796875, 5.389885425567627, 5.597962379455566, 5.806039333343506, 6.014116287231445, 6.222193241119385]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 18.0, 18.0, 22.0, 36.0, 47.0, 68.0, 113.0, 156.0, 234.0, 318.0, 475.0, 589.0, 905.0, 1310.0, 1800.0, 2619.0, 3698.0, 5136.0, 7947.0, 12060.0, 19170.0, 31702.0, 57005.0, 111665.0, 269215.0, 1007126.0, 1769679.0, 520359.0, 172109.0, 81100.0, 43905.0, 26109.0, 16199.0, 10289.0, 6686.0, 4425.0, 3107.0, 2141.0, 1422.0, 1019.0, 749.0, 506.0, 360.0, 233.0, 149.0, 111.0, 66.0, 42.0, 22.0, 18.0, 6.0, 4.0, 5.0, 3.0, 1.0], "bins": [-8.984375, -8.72967529296875, -8.4749755859375, -8.22027587890625, -7.965576171875, -7.71087646484375, -7.4561767578125, -7.20147705078125, -6.94677734375, -6.69207763671875, -6.4373779296875, -6.18267822265625, -5.927978515625, -5.67327880859375, -5.4185791015625, -5.16387939453125, -4.9091796875, -4.65447998046875, -4.3997802734375, -4.14508056640625, -3.890380859375, -3.63568115234375, -3.3809814453125, -3.12628173828125, -2.87158203125, -2.61688232421875, -2.3621826171875, -2.10748291015625, -1.852783203125, -1.59808349609375, -1.3433837890625, -1.08868408203125, -0.833984375, -0.57928466796875, -0.3245849609375, -0.06988525390625, 0.184814453125, 0.43951416015625, 0.6942138671875, 0.94891357421875, 1.20361328125, 1.45831298828125, 1.7130126953125, 1.96771240234375, 2.222412109375, 2.47711181640625, 2.7318115234375, 2.98651123046875, 3.2412109375, 3.49591064453125, 3.7506103515625, 4.00531005859375, 4.260009765625, 4.51470947265625, 4.7694091796875, 5.02410888671875, 5.27880859375, 5.53350830078125, 5.7882080078125, 6.04290771484375, 6.297607421875, 6.55230712890625, 6.8070068359375, 7.06170654296875, 7.31640625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 7.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 10.0, 17.0, 10.0, 10.0, 17.0, 20.0, 16.0, 34.0, 24.0, 46.0, 33.0, 48.0, 48.0, 34.0, 51.0, 47.0, 39.0, 55.0, 38.0, 48.0, 47.0, 39.0, 32.0, 29.0, 23.0, 24.0, 22.0, 18.0, 20.0, 15.0, 16.0, 10.0, 12.0, 6.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.203125, -4.087738037109375, -3.97235107421875, -3.856964111328125, -3.7415771484375, -3.626190185546875, -3.51080322265625, -3.395416259765625, -3.280029296875, -3.164642333984375, -3.04925537109375, -2.933868408203125, -2.8184814453125, -2.703094482421875, -2.58770751953125, -2.472320556640625, -2.35693359375, -2.241546630859375, -2.12615966796875, -2.010772705078125, -1.8953857421875, -1.779998779296875, -1.66461181640625, -1.549224853515625, -1.433837890625, -1.318450927734375, -1.20306396484375, -1.087677001953125, -0.9722900390625, -0.856903076171875, -0.74151611328125, -0.626129150390625, -0.5107421875, -0.395355224609375, -0.27996826171875, -0.164581298828125, -0.0491943359375, 0.066192626953125, 0.18157958984375, 0.296966552734375, 0.412353515625, 0.527740478515625, 0.64312744140625, 0.758514404296875, 0.8739013671875, 0.989288330078125, 1.10467529296875, 1.220062255859375, 1.33544921875, 1.450836181640625, 1.56622314453125, 1.681610107421875, 1.7969970703125, 1.912384033203125, 2.02777099609375, 2.143157958984375, 2.258544921875, 2.373931884765625, 2.48931884765625, 2.604705810546875, 2.7200927734375, 2.835479736328125, 2.95086669921875, 3.066253662109375, 3.181640625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 9.0, 14.0, 16.0, 17.0, 30.0, 42.0, 62.0, 87.0, 126.0, 154.0, 237.0, 332.0, 475.0, 722.0, 1010.0, 1487.0, 2286.0, 3540.0, 5790.0, 9070.0, 15136.0, 27225.0, 51256.0, 103669.0, 232490.0, 633073.0, 1755765.0, 811744.0, 282608.0, 121337.0, 58596.0, 30550.0, 17224.0, 10142.0, 6193.0, 3906.0, 2528.0, 1706.0, 1108.0, 746.0, 554.0, 369.0, 251.0, 171.0, 126.0, 91.0, 67.0, 50.0, 29.0, 27.0, 8.0, 14.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0], "bins": [-7.58203125, -7.3494873046875, -7.116943359375, -6.8843994140625, -6.65185546875, -6.4193115234375, -6.186767578125, -5.9542236328125, -5.7216796875, -5.4891357421875, -5.256591796875, -5.0240478515625, -4.79150390625, -4.5589599609375, -4.326416015625, -4.0938720703125, -3.861328125, -3.6287841796875, -3.396240234375, -3.1636962890625, -2.93115234375, -2.6986083984375, -2.466064453125, -2.2335205078125, -2.0009765625, -1.7684326171875, -1.535888671875, -1.3033447265625, -1.07080078125, -0.8382568359375, -0.605712890625, -0.3731689453125, -0.140625, 0.0919189453125, 0.324462890625, 0.5570068359375, 0.78955078125, 1.0220947265625, 1.254638671875, 1.4871826171875, 1.7197265625, 1.9522705078125, 2.184814453125, 2.4173583984375, 2.64990234375, 2.8824462890625, 3.114990234375, 3.3475341796875, 3.580078125, 3.8126220703125, 4.045166015625, 4.2777099609375, 4.51025390625, 4.7427978515625, 4.975341796875, 5.2078857421875, 5.4404296875, 5.6729736328125, 5.905517578125, 6.1380615234375, 6.37060546875, 6.6031494140625, 6.835693359375, 7.0682373046875, 7.30078125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 9.0, 14.0, 10.0, 16.0, 21.0, 25.0, 51.0, 57.0, 37.0, 62.0, 83.0, 110.0, 125.0, 120.0, 165.0, 234.0, 217.0, 277.0, 285.0, 328.0, 310.0, 260.0, 223.0, 185.0, 155.0, 127.0, 86.0, 86.0, 68.0, 58.0, 47.0, 39.0, 37.0, 19.0, 23.0, 22.0, 10.0, 9.0, 10.0, 13.0, 13.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.875, -1.81561279296875, -1.7562255859375, -1.69683837890625, -1.637451171875, -1.57806396484375, -1.5186767578125, -1.45928955078125, -1.39990234375, -1.34051513671875, -1.2811279296875, -1.22174072265625, -1.162353515625, -1.10296630859375, -1.0435791015625, -0.98419189453125, -0.9248046875, -0.86541748046875, -0.8060302734375, -0.74664306640625, -0.687255859375, -0.62786865234375, -0.5684814453125, -0.50909423828125, -0.44970703125, -0.39031982421875, -0.3309326171875, -0.27154541015625, -0.212158203125, -0.15277099609375, -0.0933837890625, -0.03399658203125, 0.025390625, 0.08477783203125, 0.1441650390625, 0.20355224609375, 0.262939453125, 0.32232666015625, 0.3817138671875, 0.44110107421875, 0.50048828125, 0.55987548828125, 0.6192626953125, 0.67864990234375, 0.738037109375, 0.79742431640625, 0.8568115234375, 0.91619873046875, 0.9755859375, 1.03497314453125, 1.0943603515625, 1.15374755859375, 1.213134765625, 1.27252197265625, 1.3319091796875, 1.39129638671875, 1.45068359375, 1.51007080078125, 1.5694580078125, 1.62884521484375, 1.688232421875, 1.74761962890625, 1.8070068359375, 1.86639404296875, 1.92578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 7.0, 11.0, 16.0, 16.0, 25.0, 54.0, 72.0, 110.0, 129.0, 161.0, 129.0, 76.0, 51.0, 50.0, 21.0, 15.0, 10.0, 5.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27719783782959, -5.997032642364502, -5.716867923736572, -5.436702728271484, -5.156538009643555, -4.876372814178467, -4.596207618713379, -4.316042900085449, -4.0358781814575195, -3.7557132244110107, -3.475548267364502, -3.195383071899414, -2.9152183532714844, -2.6350531578063965, -2.3548882007598877, -2.074723243713379, -1.794558048248291, -1.5143930912017822, -1.2342281341552734, -0.9540630578994751, -0.6738981008529663, -0.3937331438064575, -0.11356806755065918, 0.1665968894958496, 0.4467618465423584, 0.7269268035888672, 1.007091760635376, 1.2872568368911743, 1.567421793937683, 1.847586750984192, 2.1277518272399902, 2.407916784286499, 2.688081741333008, 2.9682466983795166, 3.2484116554260254, 3.5285768508911133, 3.808741569519043, 4.088906764984131, 4.369071960449219, 4.649236679077148, 4.929401397705078, 5.209566593170166, 5.489731311798096, 5.769896507263184, 6.050061225891113, 6.330226421356201, 6.610391616821289, 6.890556335449219, 7.170721530914307, 7.4508867263793945, 7.731051445007324, 8.011216163635254, 8.2913818359375, 8.57154655456543, 8.85171127319336, 9.131875991821289, 9.412041664123535, 9.692206382751465, 9.972372055053711, 10.25253677368164, 10.53270149230957, 10.8128662109375, 11.093031883239746, 11.373196601867676, 11.653361320495605]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 8.0, 10.0, 6.0, 6.0, 13.0, 9.0, 12.0, 23.0, 21.0, 31.0, 26.0, 28.0, 35.0, 33.0, 41.0, 37.0, 38.0, 48.0, 33.0, 30.0, 36.0, 61.0, 32.0, 34.0, 37.0, 33.0, 38.0, 24.0, 28.0, 28.0, 17.0, 20.0, 13.0, 21.0, 16.0, 9.0, 13.0, 10.0, 3.0, 11.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.869497537612915, -3.750976085662842, -3.6324548721313477, -3.5139334201812744, -3.395411968231201, -3.276890754699707, -3.158369302749634, -3.0398478507995605, -2.9213266372680664, -2.802805185317993, -2.684283971786499, -2.565762519836426, -2.4472413063049316, -2.3287198543548584, -2.210198402404785, -2.091677188873291, -1.9731557369232178, -1.854634404182434, -1.7361130714416504, -1.6175916194915771, -1.4990702867507935, -1.3805489540100098, -1.2620275020599365, -1.1435061693191528, -1.0249848365783691, -0.9064635038375854, -0.787942111492157, -0.6694207191467285, -0.5508993864059448, -0.43237805366516113, -0.31385666131973267, -0.1953352689743042, -0.07681393623352051, 0.04170742630958557, 0.16022878885269165, 0.27875015139579773, 0.3972715139389038, 0.5157928466796875, 0.634314239025116, 0.7528356313705444, 0.8713569641113281, 0.9898782968521118, 1.1083996295928955, 1.2269210815429688, 1.3454424142837524, 1.4639637470245361, 1.5824851989746094, 1.701006531715393, 1.8195278644561768, 1.9380491971969604, 2.056570529937744, 2.1750919818878174, 2.2936134338378906, 2.4121346473693848, 2.530656099319458, 2.6491775512695312, 2.7676987648010254, 2.8862202167510986, 3.0047414302825928, 3.123262882232666, 3.24178409576416, 3.3603055477142334, 3.4788269996643066, 3.597348213195801, 3.715869665145874]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 4.0, 3.0, 9.0, 15.0, 15.0, 24.0, 34.0, 40.0, 51.0, 87.0, 85.0, 119.0, 164.0, 220.0, 308.0, 416.0, 529.0, 777.0, 1052.0, 1618.0, 2125.0, 3176.0, 4784.0, 7396.0, 11812.0, 19333.0, 34665.0, 69995.0, 199289.0, 433435.0, 129065.0, 53467.0, 28075.0, 16231.0, 9943.0, 6369.0, 4070.0, 2823.0, 1956.0, 1403.0, 990.0, 708.0, 488.0, 368.0, 248.0, 181.0, 131.0, 136.0, 82.0, 62.0, 56.0, 41.0, 29.0, 22.0, 9.0, 10.0, 10.0, 4.0, 1.0, 6.0, 2.0], "bins": [-4.65625, -4.51220703125, -4.3681640625, -4.22412109375, -4.080078125, -3.93603515625, -3.7919921875, -3.64794921875, -3.50390625, -3.35986328125, -3.2158203125, -3.07177734375, -2.927734375, -2.78369140625, -2.6396484375, -2.49560546875, -2.3515625, -2.20751953125, -2.0634765625, -1.91943359375, -1.775390625, -1.63134765625, -1.4873046875, -1.34326171875, -1.19921875, -1.05517578125, -0.9111328125, -0.76708984375, -0.623046875, -0.47900390625, -0.3349609375, -0.19091796875, -0.046875, 0.09716796875, 0.2412109375, 0.38525390625, 0.529296875, 0.67333984375, 0.8173828125, 0.96142578125, 1.10546875, 1.24951171875, 1.3935546875, 1.53759765625, 1.681640625, 1.82568359375, 1.9697265625, 2.11376953125, 2.2578125, 2.40185546875, 2.5458984375, 2.68994140625, 2.833984375, 2.97802734375, 3.1220703125, 3.26611328125, 3.41015625, 3.55419921875, 3.6982421875, 3.84228515625, 3.986328125, 4.13037109375, 4.2744140625, 4.41845703125, 4.5625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 13.0, 8.0, 12.0, 18.0, 26.0, 19.0, 23.0, 22.0, 28.0, 40.0, 36.0, 41.0, 36.0, 57.0, 45.0, 33.0, 38.0, 44.0, 53.0, 40.0, 36.0, 37.0, 40.0, 21.0, 29.0, 25.0, 21.0, 18.0, 17.0, 15.0, 15.0, 22.0, 4.0, 12.0, 7.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-4.55859375, -4.4288330078125, -4.299072265625, -4.1693115234375, -4.03955078125, -3.9097900390625, -3.780029296875, -3.6502685546875, -3.5205078125, -3.3907470703125, -3.260986328125, -3.1312255859375, -3.00146484375, -2.8717041015625, -2.741943359375, -2.6121826171875, -2.482421875, -2.3526611328125, -2.222900390625, -2.0931396484375, -1.96337890625, -1.8336181640625, -1.703857421875, -1.5740966796875, -1.4443359375, -1.3145751953125, -1.184814453125, -1.0550537109375, -0.92529296875, -0.7955322265625, -0.665771484375, -0.5360107421875, -0.40625, -0.2764892578125, -0.146728515625, -0.0169677734375, 0.11279296875, 0.2425537109375, 0.372314453125, 0.5020751953125, 0.6318359375, 0.7615966796875, 0.891357421875, 1.0211181640625, 1.15087890625, 1.2806396484375, 1.410400390625, 1.5401611328125, 1.669921875, 1.7996826171875, 1.929443359375, 2.0592041015625, 2.18896484375, 2.3187255859375, 2.448486328125, 2.5782470703125, 2.7080078125, 2.8377685546875, 2.967529296875, 3.0972900390625, 3.22705078125, 3.3568115234375, 3.486572265625, 3.6163330078125, 3.74609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 12.0, 18.0, 27.0, 22.0, 52.0, 56.0, 92.0, 115.0, 198.0, 288.0, 386.0, 577.0, 807.0, 1215.0, 2005.0, 3149.0, 5792.0, 11552.0, 28233.0, 161965.0, 741420.0, 53675.0, 17173.0, 8051.0, 4357.0, 2571.0, 1568.0, 1018.0, 621.0, 476.0, 307.0, 214.0, 158.0, 115.0, 78.0, 59.0, 35.0, 27.0, 15.0, 18.0, 10.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.3515625, -9.0703125, -8.7890625, -8.5078125, -8.2265625, -7.9453125, -7.6640625, -7.3828125, -7.1015625, -6.8203125, -6.5390625, -6.2578125, -5.9765625, -5.6953125, -5.4140625, -5.1328125, -4.8515625, -4.5703125, -4.2890625, -4.0078125, -3.7265625, -3.4453125, -3.1640625, -2.8828125, -2.6015625, -2.3203125, -2.0390625, -1.7578125, -1.4765625, -1.1953125, -0.9140625, -0.6328125, -0.3515625, -0.0703125, 0.2109375, 0.4921875, 0.7734375, 1.0546875, 1.3359375, 1.6171875, 1.8984375, 2.1796875, 2.4609375, 2.7421875, 3.0234375, 3.3046875, 3.5859375, 3.8671875, 4.1484375, 4.4296875, 4.7109375, 4.9921875, 5.2734375, 5.5546875, 5.8359375, 6.1171875, 6.3984375, 6.6796875, 6.9609375, 7.2421875, 7.5234375, 7.8046875, 8.0859375, 8.3671875, 8.6484375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 10.0, 12.0, 9.0, 15.0, 17.0, 26.0, 21.0, 22.0, 33.0, 30.0, 25.0, 45.0, 27.0, 24.0, 44.0, 51.0, 44.0, 40.0, 38.0, 40.0, 39.0, 46.0, 34.0, 34.0, 34.0, 36.0, 23.0, 23.0, 17.0, 23.0, 13.0, 14.0, 13.0, 8.0, 12.0, 7.0, 6.0, 4.0, 7.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.027313232421875, -2.93353271484375, -2.839752197265625, -2.7459716796875, -2.652191162109375, -2.55841064453125, -2.464630126953125, -2.370849609375, -2.277069091796875, -2.18328857421875, -2.089508056640625, -1.9957275390625, -1.901947021484375, -1.80816650390625, -1.714385986328125, -1.62060546875, -1.526824951171875, -1.43304443359375, -1.339263916015625, -1.2454833984375, -1.151702880859375, -1.05792236328125, -0.964141845703125, -0.870361328125, -0.776580810546875, -0.68280029296875, -0.589019775390625, -0.4952392578125, -0.401458740234375, -0.30767822265625, -0.213897705078125, -0.1201171875, -0.026336669921875, 0.06744384765625, 0.161224365234375, 0.2550048828125, 0.348785400390625, 0.44256591796875, 0.536346435546875, 0.630126953125, 0.723907470703125, 0.81768798828125, 0.911468505859375, 1.0052490234375, 1.099029541015625, 1.19281005859375, 1.286590576171875, 1.38037109375, 1.474151611328125, 1.56793212890625, 1.661712646484375, 1.7554931640625, 1.849273681640625, 1.94305419921875, 2.036834716796875, 2.130615234375, 2.224395751953125, 2.31817626953125, 2.411956787109375, 2.5057373046875, 2.599517822265625, 2.69329833984375, 2.787078857421875, 2.880859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 12.0, 14.0, 24.0, 28.0, 59.0, 72.0, 124.0, 190.0, 274.0, 441.0, 792.0, 1355.0, 2533.0, 5299.0, 11792.0, 35875.0, 287800.0, 629035.0, 46289.0, 14141.0, 5843.0, 2765.0, 1500.0, 869.0, 515.0, 340.0, 181.0, 148.0, 75.0, 41.0, 31.0, 21.0, 21.0, 8.0, 4.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.302734375, -3.202911376953125, -3.10308837890625, -3.003265380859375, -2.9034423828125, -2.803619384765625, -2.70379638671875, -2.603973388671875, -2.504150390625, -2.404327392578125, -2.30450439453125, -2.204681396484375, -2.1048583984375, -2.005035400390625, -1.90521240234375, -1.805389404296875, -1.70556640625, -1.605743408203125, -1.50592041015625, -1.406097412109375, -1.3062744140625, -1.206451416015625, -1.10662841796875, -1.006805419921875, -0.906982421875, -0.807159423828125, -0.70733642578125, -0.607513427734375, -0.5076904296875, -0.407867431640625, -0.30804443359375, -0.208221435546875, -0.1083984375, -0.008575439453125, 0.09124755859375, 0.191070556640625, 0.2908935546875, 0.390716552734375, 0.49053955078125, 0.590362548828125, 0.690185546875, 0.790008544921875, 0.88983154296875, 0.989654541015625, 1.0894775390625, 1.189300537109375, 1.28912353515625, 1.388946533203125, 1.48876953125, 1.588592529296875, 1.68841552734375, 1.788238525390625, 1.8880615234375, 1.987884521484375, 2.08770751953125, 2.187530517578125, 2.287353515625, 2.387176513671875, 2.48699951171875, 2.586822509765625, 2.6866455078125, 2.786468505859375, 2.88629150390625, 2.986114501953125, 3.0859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 4.0, 5.0, 5.0, 4.0, 6.0, 11.0, 13.0, 15.0, 12.0, 22.0, 33.0, 45.0, 57.0, 67.0, 72.0, 96.0, 126.0, 79.0, 76.0, 57.0, 42.0, 29.0, 22.0, 29.0, 18.0, 10.0, 11.0, 5.0, 7.0, 2.0, 7.0, 5.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011610984802246094, -0.00011289399117231369, -0.00010967813432216644, -0.0001064622774720192, -0.00010324642062187195, -0.0001000305637717247, -9.681470692157745e-05, -9.35988500714302e-05, -9.038299322128296e-05, -8.716713637113571e-05, -8.395127952098846e-05, -8.073542267084122e-05, -7.751956582069397e-05, -7.430370897054672e-05, -7.108785212039948e-05, -6.787199527025223e-05, -6.465613842010498e-05, -6.144028156995773e-05, -5.8224424719810486e-05, -5.500856786966324e-05, -5.179271101951599e-05, -4.8576854169368744e-05, -4.5360997319221497e-05, -4.214514046907425e-05, -3.8929283618927e-05, -3.5713426768779755e-05, -3.249756991863251e-05, -2.928171306848526e-05, -2.6065856218338013e-05, -2.2849999368190765e-05, -1.9634142518043518e-05, -1.641828566789627e-05, -1.3202428817749023e-05, -9.986571967601776e-06, -6.770715117454529e-06, -3.5548582673072815e-06, -3.390014171600342e-07, 2.876855432987213e-06, 6.0927122831344604e-06, 9.308569133281708e-06, 1.2524425983428955e-05, 1.5740282833576202e-05, 1.895613968372345e-05, 2.2171996533870697e-05, 2.5387853384017944e-05, 2.860371023416519e-05, 3.181956708431244e-05, 3.5035423934459686e-05, 3.8251280784606934e-05, 4.146713763475418e-05, 4.468299448490143e-05, 4.7898851335048676e-05, 5.111470818519592e-05, 5.433056503534317e-05, 5.754642188549042e-05, 6.0762278735637665e-05, 6.397813558578491e-05, 6.719399243593216e-05, 7.04098492860794e-05, 7.362570613622665e-05, 7.68415629863739e-05, 8.005741983652115e-05, 8.32732766866684e-05, 8.648913353681564e-05, 8.970499038696289e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 13.0, 9.0, 18.0, 27.0, 29.0, 46.0, 65.0, 87.0, 108.0, 180.0, 205.0, 304.0, 477.0, 774.0, 1110.0, 1780.0, 2877.0, 4964.0, 8851.0, 17682.0, 42098.0, 137679.0, 569491.0, 168555.0, 48097.0, 19396.0, 9785.0, 5172.0, 3167.0, 1868.0, 1156.0, 728.0, 510.0, 383.0, 241.0, 165.0, 127.0, 101.0, 65.0, 53.0, 30.0, 23.0, 14.0, 11.0, 10.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.87890625, -1.8193817138671875, -1.759857177734375, -1.7003326416015625, -1.64080810546875, -1.5812835693359375, -1.521759033203125, -1.4622344970703125, -1.4027099609375, -1.3431854248046875, -1.283660888671875, -1.2241363525390625, -1.16461181640625, -1.1050872802734375, -1.045562744140625, -0.9860382080078125, -0.926513671875, -0.8669891357421875, -0.807464599609375, -0.7479400634765625, -0.68841552734375, -0.6288909912109375, -0.569366455078125, -0.5098419189453125, -0.4503173828125, -0.3907928466796875, -0.331268310546875, -0.2717437744140625, -0.21221923828125, -0.1526947021484375, -0.093170166015625, -0.0336456298828125, 0.02587890625, 0.0854034423828125, 0.144927978515625, 0.2044525146484375, 0.26397705078125, 0.3235015869140625, 0.383026123046875, 0.4425506591796875, 0.5020751953125, 0.5615997314453125, 0.621124267578125, 0.6806488037109375, 0.74017333984375, 0.7996978759765625, 0.859222412109375, 0.9187469482421875, 0.978271484375, 1.0377960205078125, 1.097320556640625, 1.1568450927734375, 1.21636962890625, 1.2758941650390625, 1.335418701171875, 1.3949432373046875, 1.4544677734375, 1.5139923095703125, 1.573516845703125, 1.6330413818359375, 1.69256591796875, 1.7520904541015625, 1.811614990234375, 1.8711395263671875, 1.9306640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 10.0, 20.0, 26.0, 37.0, 53.0, 55.0, 79.0, 115.0, 134.0, 145.0, 100.0, 66.0, 42.0, 30.0, 22.0, 12.0, 12.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478515625, -0.45975494384765625, -0.4409942626953125, -0.42223358154296875, -0.403472900390625, -0.38471221923828125, -0.3659515380859375, -0.34719085693359375, -0.32843017578125, -0.30966949462890625, -0.2909088134765625, -0.27214813232421875, -0.253387451171875, -0.23462677001953125, -0.2158660888671875, -0.19710540771484375, -0.1783447265625, -0.15958404541015625, -0.1408233642578125, -0.12206268310546875, -0.103302001953125, -0.08454132080078125, -0.0657806396484375, -0.04701995849609375, -0.02825927734375, -0.00949859619140625, 0.0092620849609375, 0.02802276611328125, 0.046783447265625, 0.06554412841796875, 0.0843048095703125, 0.10306549072265625, 0.121826171875, 0.14058685302734375, 0.1593475341796875, 0.17810821533203125, 0.196868896484375, 0.21562957763671875, 0.2343902587890625, 0.25315093994140625, 0.27191162109375, 0.29067230224609375, 0.3094329833984375, 0.32819366455078125, 0.346954345703125, 0.36571502685546875, 0.3844757080078125, 0.40323638916015625, 0.4219970703125, 0.44075775146484375, 0.4595184326171875, 0.47827911376953125, 0.497039794921875, 0.5158004760742188, 0.5345611572265625, 0.5533218383789062, 0.57208251953125, 0.5908432006835938, 0.6096038818359375, 0.6283645629882812, 0.647125244140625, 0.6658859252929688, 0.6846466064453125, 0.7034072875976562, 0.72216796875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 11.0, 14.0, 18.0, 29.0, 29.0, 52.0, 88.0, 126.0, 168.0, 146.0, 109.0, 57.0, 50.0, 37.0, 9.0, 10.0, 11.0, 2.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1531829833984375, -5.871450901031494, -5.589718341827393, -5.307986259460449, -5.026253700256348, -4.744521617889404, -4.462789535522461, -4.181056976318359, -3.899324893951416, -3.6175925731658936, -3.335860252380371, -3.0541281700134277, -2.7723958492279053, -2.490663528442383, -2.2089314460754395, -1.927199125289917, -1.6454668045043945, -1.363734483718872, -1.0820022821426392, -0.8002700209617615, -0.5185377597808838, -0.23680543899536133, 0.04492676258087158, 0.3266589641571045, 0.608391284942627, 0.8901235461235046, 1.1718558073043823, 1.4535880088806152, 1.7353203296661377, 2.01705265045166, 2.2987847328186035, 2.580517053604126, 2.8622493743896484, 3.143981695175171, 3.4257140159606934, 3.7074460983276367, 3.989178419113159, 4.270910739898682, 4.552642822265625, 4.834375381469727, 5.11610746383667, 5.397839546203613, 5.679572105407715, 5.961304187774658, 6.243036270141602, 6.524768829345703, 6.8065009117126465, 7.08823299407959, 7.369965553283691, 7.651697635650635, 7.933430194854736, 8.21516227722168, 8.496894836425781, 8.778627395629883, 9.060359001159668, 9.34209156036377, 9.623823165893555, 9.905555725097656, 10.187287330627441, 10.469019889831543, 10.750752449035645, 11.03248405456543, 11.314216613769531, 11.595949172973633, 11.877681732177734]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 5.0, 7.0, 9.0, 6.0, 9.0, 13.0, 11.0, 20.0, 22.0, 22.0, 24.0, 34.0, 27.0, 34.0, 37.0, 40.0, 40.0, 31.0, 51.0, 33.0, 48.0, 36.0, 41.0, 41.0, 39.0, 35.0, 28.0, 36.0, 26.0, 26.0, 25.0, 17.0, 23.0, 12.0, 22.0, 8.0, 12.0, 10.0, 5.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.9159622192382812, -3.7973082065582275, -3.678654193878174, -3.56000018119812, -3.4413461685180664, -3.322692394256592, -3.204038143157959, -3.0853843688964844, -2.9667303562164307, -2.848076343536377, -2.7294223308563232, -2.6107683181762695, -2.492114305496216, -2.373460292816162, -2.2548065185546875, -2.136152505874634, -2.01749849319458, -1.8988444805145264, -1.7801904678344727, -1.661536455154419, -1.5428825616836548, -1.424228549003601, -1.3055745363235474, -1.1869206428527832, -1.0682663917541504, -0.9496123790740967, -0.8309584259986877, -0.712304413318634, -0.5936504602432251, -0.4749964475631714, -0.3563424348831177, -0.23768848180770874, -0.1190345287322998, -0.0003805384039878845, 0.11827345192432404, 0.23692744970321655, 0.3555814325809479, 0.4742354154586792, 0.5928894281387329, 0.7115433812141418, 0.8301973938941956, 0.9488514065742493, 1.0675053596496582, 1.186159372329712, 1.3048133850097656, 1.4234673976898193, 1.542121410369873, 1.6607753038406372, 1.779429316520691, 1.8980833292007446, 2.016737222671509, 2.1353912353515625, 2.254045248031616, 2.37269926071167, 2.4913532733917236, 2.6100072860717773, 2.728661298751831, 2.8473153114318848, 2.9659693241119385, 3.084623336791992, 3.203277349472046, 3.3219313621520996, 3.440585136413574, 3.559239149093628, 3.6778931617736816]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 15.0, 16.0, 30.0, 35.0, 56.0, 75.0, 119.0, 205.0, 271.0, 396.0, 594.0, 985.0, 1498.0, 2469.0, 4057.0, 6583.0, 11452.0, 20324.0, 37080.0, 71739.0, 143297.0, 266133.0, 231355.0, 116925.0, 59355.0, 31428.0, 17229.0, 9816.0, 5680.0, 3289.0, 2181.0, 1350.0, 864.0, 529.0, 363.0, 229.0, 168.0, 116.0, 74.0, 59.0, 33.0, 21.0, 20.0, 12.0, 2.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0, -7.75653076171875, -7.5130615234375, -7.26959228515625, -7.026123046875, -6.78265380859375, -6.5391845703125, -6.29571533203125, -6.05224609375, -5.80877685546875, -5.5653076171875, -5.32183837890625, -5.078369140625, -4.83489990234375, -4.5914306640625, -4.34796142578125, -4.1044921875, -3.86102294921875, -3.6175537109375, -3.37408447265625, -3.130615234375, -2.88714599609375, -2.6436767578125, -2.40020751953125, -2.15673828125, -1.91326904296875, -1.6697998046875, -1.42633056640625, -1.182861328125, -0.93939208984375, -0.6959228515625, -0.45245361328125, -0.208984375, 0.03448486328125, 0.2779541015625, 0.52142333984375, 0.764892578125, 1.00836181640625, 1.2518310546875, 1.49530029296875, 1.73876953125, 1.98223876953125, 2.2257080078125, 2.46917724609375, 2.712646484375, 2.95611572265625, 3.1995849609375, 3.44305419921875, 3.6865234375, 3.92999267578125, 4.1734619140625, 4.41693115234375, 4.660400390625, 4.90386962890625, 5.1473388671875, 5.39080810546875, 5.63427734375, 5.87774658203125, 6.1212158203125, 6.36468505859375, 6.608154296875, 6.85162353515625, 7.0950927734375, 7.33856201171875, 7.58203125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 4.0, 9.0, 5.0, 6.0, 10.0, 9.0, 12.0, 26.0, 29.0, 25.0, 35.0, 30.0, 43.0, 43.0, 43.0, 52.0, 47.0, 53.0, 39.0, 42.0, 46.0, 43.0, 50.0, 43.0, 41.0, 27.0, 37.0, 22.0, 10.0, 19.0, 17.0, 14.0, 16.0, 12.0, 11.0, 4.0, 1.0, 2.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0], "bins": [-4.296875, -4.178436279296875, -4.05999755859375, -3.941558837890625, -3.8231201171875, -3.704681396484375, -3.58624267578125, -3.467803955078125, -3.349365234375, -3.230926513671875, -3.11248779296875, -2.994049072265625, -2.8756103515625, -2.757171630859375, -2.63873291015625, -2.520294189453125, -2.40185546875, -2.283416748046875, -2.16497802734375, -2.046539306640625, -1.9281005859375, -1.809661865234375, -1.69122314453125, -1.572784423828125, -1.454345703125, -1.335906982421875, -1.21746826171875, -1.099029541015625, -0.9805908203125, -0.862152099609375, -0.74371337890625, -0.625274658203125, -0.5068359375, -0.388397216796875, -0.26995849609375, -0.151519775390625, -0.0330810546875, 0.085357666015625, 0.20379638671875, 0.322235107421875, 0.440673828125, 0.559112548828125, 0.67755126953125, 0.795989990234375, 0.9144287109375, 1.032867431640625, 1.15130615234375, 1.269744873046875, 1.38818359375, 1.506622314453125, 1.62506103515625, 1.743499755859375, 1.8619384765625, 1.980377197265625, 2.09881591796875, 2.217254638671875, 2.335693359375, 2.454132080078125, 2.57257080078125, 2.691009521484375, 2.8094482421875, 2.927886962890625, 3.04632568359375, 3.164764404296875, 3.283203125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 8.0, 17.0, 30.0, 34.0, 44.0, 62.0, 109.0, 168.0, 244.0, 374.0, 626.0, 1060.0, 1752.0, 3157.0, 5828.0, 10776.0, 20750.0, 41289.0, 83778.0, 172074.0, 295555.0, 207243.0, 100964.0, 49337.0, 24931.0, 12751.0, 6744.0, 3587.0, 2037.0, 1231.0, 717.0, 436.0, 299.0, 159.0, 128.0, 74.0, 57.0, 38.0, 28.0, 10.0, 18.0, 6.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.796875, -7.55792236328125, -7.3189697265625, -7.08001708984375, -6.841064453125, -6.60211181640625, -6.3631591796875, -6.12420654296875, -5.88525390625, -5.64630126953125, -5.4073486328125, -5.16839599609375, -4.929443359375, -4.69049072265625, -4.4515380859375, -4.21258544921875, -3.9736328125, -3.73468017578125, -3.4957275390625, -3.25677490234375, -3.017822265625, -2.77886962890625, -2.5399169921875, -2.30096435546875, -2.06201171875, -1.82305908203125, -1.5841064453125, -1.34515380859375, -1.106201171875, -0.86724853515625, -0.6282958984375, -0.38934326171875, -0.150390625, 0.08856201171875, 0.3275146484375, 0.56646728515625, 0.805419921875, 1.04437255859375, 1.2833251953125, 1.52227783203125, 1.76123046875, 2.00018310546875, 2.2391357421875, 2.47808837890625, 2.717041015625, 2.95599365234375, 3.1949462890625, 3.43389892578125, 3.6728515625, 3.91180419921875, 4.1507568359375, 4.38970947265625, 4.628662109375, 4.86761474609375, 5.1065673828125, 5.34552001953125, 5.58447265625, 5.82342529296875, 6.0623779296875, 6.30133056640625, 6.540283203125, 6.77923583984375, 7.0181884765625, 7.25714111328125, 7.49609375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 9.0, 12.0, 15.0, 12.0, 24.0, 15.0, 23.0, 22.0, 21.0, 21.0, 23.0, 27.0, 33.0, 22.0, 36.0, 39.0, 28.0, 41.0, 51.0, 34.0, 38.0, 35.0, 33.0, 40.0, 23.0, 44.0, 32.0, 28.0, 21.0, 30.0, 31.0, 25.0, 16.0, 13.0, 9.0, 11.0, 9.0, 7.0, 8.0, 4.0, 5.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-2.244140625, -2.1786956787109375, -2.113250732421875, -2.0478057861328125, -1.98236083984375, -1.9169158935546875, -1.851470947265625, -1.7860260009765625, -1.7205810546875, -1.6551361083984375, -1.589691162109375, -1.5242462158203125, -1.45880126953125, -1.3933563232421875, -1.327911376953125, -1.2624664306640625, -1.197021484375, -1.1315765380859375, -1.066131591796875, -1.0006866455078125, -0.93524169921875, -0.8697967529296875, -0.804351806640625, -0.7389068603515625, -0.6734619140625, -0.6080169677734375, -0.542572021484375, -0.4771270751953125, -0.41168212890625, -0.3462371826171875, -0.280792236328125, -0.2153472900390625, -0.14990234375, -0.0844573974609375, -0.019012451171875, 0.0464324951171875, 0.11187744140625, 0.1773223876953125, 0.242767333984375, 0.3082122802734375, 0.3736572265625, 0.4391021728515625, 0.504547119140625, 0.5699920654296875, 0.63543701171875, 0.7008819580078125, 0.766326904296875, 0.8317718505859375, 0.897216796875, 0.9626617431640625, 1.028106689453125, 1.0935516357421875, 1.15899658203125, 1.2244415283203125, 1.289886474609375, 1.3553314208984375, 1.4207763671875, 1.4862213134765625, 1.551666259765625, 1.6171112060546875, 1.68255615234375, 1.7480010986328125, 1.813446044921875, 1.8788909912109375, 1.9443359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 18.0, 32.0, 50.0, 56.0, 77.0, 133.0, 176.0, 252.0, 415.0, 592.0, 990.0, 1731.0, 3117.0, 6455.0, 16356.0, 60275.0, 777765.0, 133915.0, 26922.0, 9362.0, 4223.0, 2152.0, 1227.0, 749.0, 493.0, 303.0, 202.0, 154.0, 89.0, 72.0, 55.0, 28.0, 25.0, 17.0, 15.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.1029052734375, -10.729248046875, -10.3555908203125, -9.98193359375, -9.6082763671875, -9.234619140625, -8.8609619140625, -8.4873046875, -8.1136474609375, -7.739990234375, -7.3663330078125, -6.99267578125, -6.6190185546875, -6.245361328125, -5.8717041015625, -5.498046875, -5.1243896484375, -4.750732421875, -4.3770751953125, -4.00341796875, -3.6297607421875, -3.256103515625, -2.8824462890625, -2.5087890625, -2.1351318359375, -1.761474609375, -1.3878173828125, -1.01416015625, -0.6405029296875, -0.266845703125, 0.1068115234375, 0.48046875, 0.8541259765625, 1.227783203125, 1.6014404296875, 1.97509765625, 2.3487548828125, 2.722412109375, 3.0960693359375, 3.4697265625, 3.8433837890625, 4.217041015625, 4.5906982421875, 4.96435546875, 5.3380126953125, 5.711669921875, 6.0853271484375, 6.458984375, 6.8326416015625, 7.206298828125, 7.5799560546875, 7.95361328125, 8.3272705078125, 8.700927734375, 9.0745849609375, 9.4482421875, 9.8218994140625, 10.195556640625, 10.5692138671875, 10.94287109375, 11.3165283203125, 11.690185546875, 12.0638427734375, 12.4375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 7.0, 9.0, 15.0, 24.0, 35.0, 56.0, 121.0, 305.0, 178.0, 100.0, 54.0, 24.0, 26.0, 16.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.0002958327531814575, -0.0002855360507965088, -0.00027523934841156006, -0.00026494264602661133, -0.0002546459436416626, -0.00024434924125671387, -0.00023405253887176514, -0.0002237558364868164, -0.00021345913410186768, -0.00020316243171691895, -0.00019286572933197021, -0.00018256902694702148, -0.00017227232456207275, -0.00016197562217712402, -0.0001516789197921753, -0.00014138221740722656, -0.00013108551502227783, -0.0001207888126373291, -0.00011049211025238037, -0.00010019540786743164, -8.989870548248291e-05, -7.960200309753418e-05, -6.930530071258545e-05, -5.900859832763672e-05, -4.871189594268799e-05, -3.841519355773926e-05, -2.8118491172790527e-05, -1.7821788787841797e-05, -7.525086402893066e-06, 2.771615982055664e-06, 1.3068318367004395e-05, 2.3365020751953125e-05, 3.3661723136901855e-05, 4.3958425521850586e-05, 5.4255127906799316e-05, 6.455183029174805e-05, 7.484853267669678e-05, 8.514523506164551e-05, 9.544193744659424e-05, 0.00010573863983154297, 0.0001160353422164917, 0.00012633204460144043, 0.00013662874698638916, 0.0001469254493713379, 0.00015722215175628662, 0.00016751885414123535, 0.00017781555652618408, 0.0001881122589111328, 0.00019840896129608154, 0.00020870566368103027, 0.000219002366065979, 0.00022929906845092773, 0.00023959577083587646, 0.0002498924732208252, 0.0002601891756057739, 0.00027048587799072266, 0.0002807825803756714, 0.0002910792827606201, 0.00030137598514556885, 0.0003116726875305176, 0.0003219693899154663, 0.00033226609230041504, 0.00034256279468536377, 0.0003528594970703125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 5.0, 6.0, 10.0, 11.0, 17.0, 16.0, 21.0, 36.0, 41.0, 67.0, 90.0, 121.0, 171.0, 265.0, 360.0, 540.0, 854.0, 1313.0, 2226.0, 4006.0, 8235.0, 21063.0, 84566.0, 804702.0, 81216.0, 20488.0, 8088.0, 3926.0, 2159.0, 1303.0, 841.0, 551.0, 359.0, 265.0, 172.0, 114.0, 93.0, 68.0, 43.0, 39.0, 26.0, 23.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.1640625, -10.8204345703125, -10.476806640625, -10.1331787109375, -9.78955078125, -9.4459228515625, -9.102294921875, -8.7586669921875, -8.4150390625, -8.0714111328125, -7.727783203125, -7.3841552734375, -7.04052734375, -6.6968994140625, -6.353271484375, -6.0096435546875, -5.666015625, -5.3223876953125, -4.978759765625, -4.6351318359375, -4.29150390625, -3.9478759765625, -3.604248046875, -3.2606201171875, -2.9169921875, -2.5733642578125, -2.229736328125, -1.8861083984375, -1.54248046875, -1.1988525390625, -0.855224609375, -0.5115966796875, -0.16796875, 0.1756591796875, 0.519287109375, 0.8629150390625, 1.20654296875, 1.5501708984375, 1.893798828125, 2.2374267578125, 2.5810546875, 2.9246826171875, 3.268310546875, 3.6119384765625, 3.95556640625, 4.2991943359375, 4.642822265625, 4.9864501953125, 5.330078125, 5.6737060546875, 6.017333984375, 6.3609619140625, 6.70458984375, 7.0482177734375, 7.391845703125, 7.7354736328125, 8.0791015625, 8.4227294921875, 8.766357421875, 9.1099853515625, 9.45361328125, 9.7972412109375, 10.140869140625, 10.4844970703125, 10.828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 12.0, 17.0, 23.0, 26.0, 36.0, 81.0, 122.0, 359.0, 99.0, 56.0, 40.0, 27.0, 23.0, 13.0, 10.0, 7.0, 2.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.533203125, -2.4521484375, -2.37109375, -2.2900390625, -2.208984375, -2.1279296875, -2.046875, -1.9658203125, -1.884765625, -1.8037109375, -1.72265625, -1.6416015625, -1.560546875, -1.4794921875, -1.3984375, -1.3173828125, -1.236328125, -1.1552734375, -1.07421875, -0.9931640625, -0.912109375, -0.8310546875, -0.75, -0.6689453125, -0.587890625, -0.5068359375, -0.42578125, -0.3447265625, -0.263671875, -0.1826171875, -0.1015625, -0.0205078125, 0.060546875, 0.1416015625, 0.22265625, 0.3037109375, 0.384765625, 0.4658203125, 0.546875, 0.6279296875, 0.708984375, 0.7900390625, 0.87109375, 0.9521484375, 1.033203125, 1.1142578125, 1.1953125, 1.2763671875, 1.357421875, 1.4384765625, 1.51953125, 1.6005859375, 1.681640625, 1.7626953125, 1.84375, 1.9248046875, 2.005859375, 2.0869140625, 2.16796875, 2.2490234375, 2.330078125, 2.4111328125, 2.4921875, 2.5732421875, 2.654296875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 13.0, 22.0, 41.0, 60.0, 120.0, 159.0, 186.0, 137.0, 72.0, 59.0, 33.0, 27.0, 20.0, 7.0, 9.0, 4.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.377165794372559, -5.079503059387207, -4.7818403244018555, -4.484177589416504, -4.186514854431152, -3.888852119445801, -3.591189384460449, -3.2935266494750977, -2.995863914489746, -2.6982011795043945, -2.400538444519043, -2.1028757095336914, -1.8052129745483398, -1.5075502395629883, -1.2098875045776367, -0.9122247695922852, -0.6145620346069336, -0.31689929962158203, -0.01923656463623047, 0.2784261703491211, 0.5760889053344727, 0.8737516403198242, 1.1714143753051758, 1.4690771102905273, 1.766739845275879, 2.0644025802612305, 2.362065315246582, 2.6597280502319336, 2.957390785217285, 3.2550535202026367, 3.5527162551879883, 3.85037899017334, 4.148042678833008, 4.445705413818359, 4.743368148803711, 5.0410308837890625, 5.338693618774414, 5.636356353759766, 5.934019088745117, 6.231681823730469, 6.52934455871582, 6.827007293701172, 7.124670028686523, 7.422332763671875, 7.719995498657227, 8.017658233642578, 8.31532096862793, 8.612983703613281, 8.910646438598633, 9.208309173583984, 9.505971908569336, 9.803634643554688, 10.101297378540039, 10.39896011352539, 10.696622848510742, 10.994285583496094, 11.291948318481445, 11.589611053466797, 11.887273788452148, 12.1849365234375, 12.482599258422852, 12.780261993408203, 13.077924728393555, 13.375587463378906, 13.673250198364258]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 7.0, 5.0, 7.0, 14.0, 13.0, 15.0, 16.0, 14.0, 32.0, 19.0, 20.0, 30.0, 29.0, 35.0, 41.0, 34.0, 47.0, 34.0, 40.0, 40.0, 51.0, 39.0, 51.0, 43.0, 40.0, 38.0, 31.0, 38.0, 25.0, 27.0, 27.0, 12.0, 9.0, 12.0, 14.0, 14.0, 1.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248772621154785, -3.1344285011291504, -3.0200846195220947, -2.905740737915039, -2.7913966178894043, -2.6770524978637695, -2.562708616256714, -2.448364734649658, -2.3340206146240234, -2.2196764945983887, -2.105332612991333, -1.9909886121749878, -1.8766446113586426, -1.7623006105422974, -1.6479566097259521, -1.533612608909607, -1.4192686080932617, -1.3049246072769165, -1.1905806064605713, -1.076236605644226, -0.9618926048278809, -0.8475486040115356, -0.7332046031951904, -0.6188606023788452, -0.5045166015625, -0.3901726007461548, -0.27582859992980957, -0.16148459911346436, -0.04714059829711914, 0.06720340251922607, 0.1815474033355713, 0.2958914041519165, 0.4102354049682617, 0.5245794057846069, 0.6389234066009521, 0.7532674074172974, 0.8676114082336426, 0.9819554090499878, 1.096299409866333, 1.2106434106826782, 1.3249874114990234, 1.4393314123153687, 1.5536754131317139, 1.668019413948059, 1.7823634147644043, 1.8967074155807495, 2.0110514163970947, 2.1253952980041504, 2.239739418029785, 2.35408353805542, 2.4684274196624756, 2.5827713012695312, 2.697115421295166, 2.811459541320801, 2.9258034229278564, 3.040147304534912, 3.154491424560547, 3.2688355445861816, 3.3831794261932373, 3.497523307800293, 3.6118674278259277, 3.7262115478515625, 3.840555429458618, 3.954899311065674, 4.069243431091309]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 8.0, 15.0, 17.0, 33.0, 41.0, 63.0, 88.0, 139.0, 202.0, 316.0, 411.0, 713.0, 1027.0, 1658.0, 2669.0, 4215.0, 6921.0, 11487.0, 20376.0, 36816.0, 74607.0, 175661.0, 632498.0, 2116664.0, 742092.0, 196056.0, 80664.0, 38875.0, 20490.0, 11620.0, 6658.0, 4135.0, 2502.0, 1623.0, 1016.0, 643.0, 389.0, 301.0, 193.0, 128.0, 77.0, 54.0, 38.0, 31.0, 22.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.6953125, -6.50146484375, -6.3076171875, -6.11376953125, -5.919921875, -5.72607421875, -5.5322265625, -5.33837890625, -5.14453125, -4.95068359375, -4.7568359375, -4.56298828125, -4.369140625, -4.17529296875, -3.9814453125, -3.78759765625, -3.59375, -3.39990234375, -3.2060546875, -3.01220703125, -2.818359375, -2.62451171875, -2.4306640625, -2.23681640625, -2.04296875, -1.84912109375, -1.6552734375, -1.46142578125, -1.267578125, -1.07373046875, -0.8798828125, -0.68603515625, -0.4921875, -0.29833984375, -0.1044921875, 0.08935546875, 0.283203125, 0.47705078125, 0.6708984375, 0.86474609375, 1.05859375, 1.25244140625, 1.4462890625, 1.64013671875, 1.833984375, 2.02783203125, 2.2216796875, 2.41552734375, 2.609375, 2.80322265625, 2.9970703125, 3.19091796875, 3.384765625, 3.57861328125, 3.7724609375, 3.96630859375, 4.16015625, 4.35400390625, 4.5478515625, 4.74169921875, 4.935546875, 5.12939453125, 5.3232421875, 5.51708984375, 5.7109375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 5.0, 14.0, 22.0, 17.0, 17.0, 23.0, 30.0, 23.0, 31.0, 41.0, 40.0, 35.0, 41.0, 52.0, 49.0, 39.0, 53.0, 46.0, 44.0, 43.0, 37.0, 50.0, 29.0, 25.0, 30.0, 27.0, 24.0, 17.0, 11.0, 11.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.67578125, -2.600341796875, -2.52490234375, -2.449462890625, -2.3740234375, -2.298583984375, -2.22314453125, -2.147705078125, -2.072265625, -1.996826171875, -1.92138671875, -1.845947265625, -1.7705078125, -1.695068359375, -1.61962890625, -1.544189453125, -1.46875, -1.393310546875, -1.31787109375, -1.242431640625, -1.1669921875, -1.091552734375, -1.01611328125, -0.940673828125, -0.865234375, -0.789794921875, -0.71435546875, -0.638916015625, -0.5634765625, -0.488037109375, -0.41259765625, -0.337158203125, -0.26171875, -0.186279296875, -0.11083984375, -0.035400390625, 0.0400390625, 0.115478515625, 0.19091796875, 0.266357421875, 0.341796875, 0.417236328125, 0.49267578125, 0.568115234375, 0.6435546875, 0.718994140625, 0.79443359375, 0.869873046875, 0.9453125, 1.020751953125, 1.09619140625, 1.171630859375, 1.2470703125, 1.322509765625, 1.39794921875, 1.473388671875, 1.548828125, 1.624267578125, 1.69970703125, 1.775146484375, 1.8505859375, 1.926025390625, 2.00146484375, 2.076904296875, 2.15234375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 12.0, 14.0, 18.0, 34.0, 40.0, 58.0, 91.0, 110.0, 194.0, 238.0, 436.0, 604.0, 897.0, 1510.0, 2200.0, 3573.0, 5762.0, 9699.0, 16913.0, 30061.0, 57047.0, 117297.0, 266404.0, 745635.0, 1747531.0, 697479.0, 253853.0, 111934.0, 54600.0, 28903.0, 16219.0, 9496.0, 5660.0, 3467.0, 2155.0, 1440.0, 852.0, 639.0, 399.0, 254.0, 166.0, 113.0, 71.0, 68.0, 39.0, 30.0, 17.0, 17.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0], "bins": [-4.93359375, -4.78619384765625, -4.6387939453125, -4.49139404296875, -4.343994140625, -4.19659423828125, -4.0491943359375, -3.90179443359375, -3.75439453125, -3.60699462890625, -3.4595947265625, -3.31219482421875, -3.164794921875, -3.01739501953125, -2.8699951171875, -2.72259521484375, -2.5751953125, -2.42779541015625, -2.2803955078125, -2.13299560546875, -1.985595703125, -1.83819580078125, -1.6907958984375, -1.54339599609375, -1.39599609375, -1.24859619140625, -1.1011962890625, -0.95379638671875, -0.806396484375, -0.65899658203125, -0.5115966796875, -0.36419677734375, -0.216796875, -0.06939697265625, 0.0780029296875, 0.22540283203125, 0.372802734375, 0.52020263671875, 0.6676025390625, 0.81500244140625, 0.96240234375, 1.10980224609375, 1.2572021484375, 1.40460205078125, 1.552001953125, 1.69940185546875, 1.8468017578125, 1.99420166015625, 2.1416015625, 2.28900146484375, 2.4364013671875, 2.58380126953125, 2.731201171875, 2.87860107421875, 3.0260009765625, 3.17340087890625, 3.32080078125, 3.46820068359375, 3.6156005859375, 3.76300048828125, 3.910400390625, 4.05780029296875, 4.2052001953125, 4.35260009765625, 4.5]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 6.0, 8.0, 12.0, 11.0, 15.0, 21.0, 27.0, 25.0, 57.0, 64.0, 77.0, 86.0, 112.0, 131.0, 152.0, 194.0, 215.0, 235.0, 304.0, 317.0, 344.0, 329.0, 250.0, 198.0, 150.0, 153.0, 103.0, 84.0, 76.0, 68.0, 45.0, 34.0, 45.0, 31.0, 16.0, 17.0, 7.0, 13.0, 9.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.11248779296875, -1.0726318359375, -1.03277587890625, -0.992919921875, -0.95306396484375, -0.9132080078125, -0.87335205078125, -0.83349609375, -0.79364013671875, -0.7537841796875, -0.71392822265625, -0.674072265625, -0.63421630859375, -0.5943603515625, -0.55450439453125, -0.5146484375, -0.47479248046875, -0.4349365234375, -0.39508056640625, -0.355224609375, -0.31536865234375, -0.2755126953125, -0.23565673828125, -0.19580078125, -0.15594482421875, -0.1160888671875, -0.07623291015625, -0.036376953125, 0.00347900390625, 0.0433349609375, 0.08319091796875, 0.123046875, 0.16290283203125, 0.2027587890625, 0.24261474609375, 0.282470703125, 0.32232666015625, 0.3621826171875, 0.40203857421875, 0.44189453125, 0.48175048828125, 0.5216064453125, 0.56146240234375, 0.601318359375, 0.64117431640625, 0.6810302734375, 0.72088623046875, 0.7607421875, 0.80059814453125, 0.8404541015625, 0.88031005859375, 0.920166015625, 0.96002197265625, 0.9998779296875, 1.03973388671875, 1.07958984375, 1.11944580078125, 1.1593017578125, 1.19915771484375, 1.239013671875, 1.27886962890625, 1.3187255859375, 1.35858154296875, 1.3984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 10.0, 8.0, 12.0, 25.0, 34.0, 53.0, 77.0, 124.0, 158.0, 149.0, 114.0, 75.0, 45.0, 31.0, 24.0, 21.0, 10.0, 10.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.053717136383057, -6.863794803619385, -6.673872947692871, -6.483950614929199, -6.2940287590026855, -6.104106426239014, -5.9141845703125, -5.724262237548828, -5.534339904785156, -5.344417572021484, -5.154495716094971, -4.964573383331299, -4.774651527404785, -4.584729194641113, -4.394806861877441, -4.204885005950928, -4.014963150024414, -3.8250410556793213, -3.6351189613342285, -3.4451966285705566, -3.255274772644043, -3.065352439880371, -2.8754303455352783, -2.6855082511901855, -2.4955861568450928, -2.3056640625, -2.1157419681549072, -1.925819754600525, -1.7358976602554321, -1.5459755659103394, -1.356053352355957, -1.1661312580108643, -0.9762091636657715, -0.7862870693206787, -0.5963649153709412, -0.4064427614212036, -0.21652066707611084, -0.026598572731018066, 0.16332364082336426, 0.35324573516845703, 0.5431678295135498, 0.7330899238586426, 0.9230120778083801, 1.1129342317581177, 1.3028563261032104, 1.4927784204483032, 1.6827006340026855, 1.8726227283477783, 2.062544822692871, 2.252466917037964, 2.4423890113830566, 2.6323113441467285, 2.822233200073242, 3.012155532836914, 3.202077627182007, 3.3919997215270996, 3.5819218158721924, 3.771843910217285, 3.961766004562378, 4.151688098907471, 4.341610431671143, 4.531532287597656, 4.721454620361328, 4.911376953125, 5.101298809051514]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 15.0, 8.0, 8.0, 14.0, 17.0, 13.0, 19.0, 28.0, 30.0, 26.0, 28.0, 30.0, 35.0, 27.0, 38.0, 44.0, 33.0, 36.0, 45.0, 46.0, 43.0, 39.0, 40.0, 38.0, 29.0, 40.0, 34.0, 25.0, 29.0, 21.0, 21.0, 12.0, 12.0, 12.0, 4.0, 15.0, 7.0, 4.0, 3.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31754469871521, -2.241307258605957, -2.165070056915283, -2.0888326168060303, -2.0125951766967773, -1.9363579750061035, -1.8601205348968506, -1.7838832139968872, -1.7076458930969238, -1.6314085721969604, -1.555171251296997, -1.4789338111877441, -1.4026964902877808, -1.3264591693878174, -1.2502217292785645, -1.173984408378601, -1.0977470874786377, -1.0215097665786743, -0.9452723860740662, -0.869035005569458, -0.7927976846694946, -0.7165603637695312, -0.6403229832649231, -0.5640856027603149, -0.48784828186035156, -0.4116109311580658, -0.33537358045578003, -0.25913622975349426, -0.1828988790512085, -0.10666152834892273, -0.030424177646636963, 0.04581320285797119, 0.12205052375793457, 0.19828787446022034, 0.2745252251625061, 0.35076257586479187, 0.42699992656707764, 0.503237247467041, 0.5794746279716492, 0.6557120084762573, 0.7319493293762207, 0.8081866502761841, 0.8844240307807922, 0.9606614112854004, 1.0368987321853638, 1.1131360530853271, 1.18937349319458, 1.2656108140945435, 1.3418481349945068, 1.4180854558944702, 1.4943227767944336, 1.5705602169036865, 1.64679753780365, 1.7230348587036133, 1.7992722988128662, 1.8755096197128296, 1.951746940612793, 2.027984380722046, 2.1042215824127197, 2.1804590225219727, 2.2566962242126465, 2.3329336643218994, 2.4091711044311523, 2.485408306121826, 2.561645746231079]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 11.0, 16.0, 19.0, 24.0, 44.0, 58.0, 77.0, 92.0, 152.0, 250.0, 339.0, 549.0, 779.0, 1351.0, 1980.0, 3221.0, 5475.0, 9138.0, 16416.0, 31873.0, 72559.0, 262830.0, 451730.0, 101038.0, 40548.0, 20026.0, 11031.0, 6502.0, 3812.0, 2358.0, 1447.0, 926.0, 601.0, 396.0, 277.0, 187.0, 130.0, 88.0, 60.0, 47.0, 24.0, 13.0, 20.0, 6.0, 5.0, 6.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0], "bins": [-3.888671875, -3.77484130859375, -3.6610107421875, -3.54718017578125, -3.433349609375, -3.31951904296875, -3.2056884765625, -3.09185791015625, -2.97802734375, -2.86419677734375, -2.7503662109375, -2.63653564453125, -2.522705078125, -2.40887451171875, -2.2950439453125, -2.18121337890625, -2.0673828125, -1.95355224609375, -1.8397216796875, -1.72589111328125, -1.612060546875, -1.49822998046875, -1.3843994140625, -1.27056884765625, -1.15673828125, -1.04290771484375, -0.9290771484375, -0.81524658203125, -0.701416015625, -0.58758544921875, -0.4737548828125, -0.35992431640625, -0.24609375, -0.13226318359375, -0.0184326171875, 0.09539794921875, 0.209228515625, 0.32305908203125, 0.4368896484375, 0.55072021484375, 0.66455078125, 0.77838134765625, 0.8922119140625, 1.00604248046875, 1.119873046875, 1.23370361328125, 1.3475341796875, 1.46136474609375, 1.5751953125, 1.68902587890625, 1.8028564453125, 1.91668701171875, 2.030517578125, 2.14434814453125, 2.2581787109375, 2.37200927734375, 2.48583984375, 2.59967041015625, 2.7135009765625, 2.82733154296875, 2.941162109375, 3.05499267578125, 3.1688232421875, 3.28265380859375, 3.396484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 5.0, 8.0, 8.0, 15.0, 12.0, 17.0, 14.0, 22.0, 26.0, 22.0, 23.0, 36.0, 38.0, 35.0, 32.0, 45.0, 47.0, 46.0, 55.0, 39.0, 42.0, 43.0, 45.0, 40.0, 40.0, 41.0, 35.0, 30.0, 18.0, 18.0, 13.0, 13.0, 17.0, 11.0, 7.0, 6.0, 5.0, 3.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.642578125, -2.5592041015625, -2.475830078125, -2.3924560546875, -2.30908203125, -2.2257080078125, -2.142333984375, -2.0589599609375, -1.9755859375, -1.8922119140625, -1.808837890625, -1.7254638671875, -1.64208984375, -1.5587158203125, -1.475341796875, -1.3919677734375, -1.30859375, -1.2252197265625, -1.141845703125, -1.0584716796875, -0.97509765625, -0.8917236328125, -0.808349609375, -0.7249755859375, -0.6416015625, -0.5582275390625, -0.474853515625, -0.3914794921875, -0.30810546875, -0.2247314453125, -0.141357421875, -0.0579833984375, 0.025390625, 0.1087646484375, 0.192138671875, 0.2755126953125, 0.35888671875, 0.4422607421875, 0.525634765625, 0.6090087890625, 0.6923828125, 0.7757568359375, 0.859130859375, 0.9425048828125, 1.02587890625, 1.1092529296875, 1.192626953125, 1.2760009765625, 1.359375, 1.4427490234375, 1.526123046875, 1.6094970703125, 1.69287109375, 1.7762451171875, 1.859619140625, 1.9429931640625, 2.0263671875, 2.1097412109375, 2.193115234375, 2.2764892578125, 2.35986328125, 2.4432373046875, 2.526611328125, 2.6099853515625, 2.693359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 15.0, 5.0, 15.0, 14.0, 14.0, 36.0, 52.0, 49.0, 72.0, 109.0, 145.0, 171.0, 299.0, 395.0, 569.0, 842.0, 1129.0, 1825.0, 2834.0, 4808.0, 8978.0, 18834.0, 58930.0, 739252.0, 150877.0, 29333.0, 12249.0, 6250.0, 3568.0, 2200.0, 1387.0, 973.0, 635.0, 467.0, 377.0, 205.0, 176.0, 139.0, 91.0, 59.0, 42.0, 47.0, 29.0, 17.0, 8.0, 10.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-5.86328125, -5.678466796875, -5.49365234375, -5.308837890625, -5.1240234375, -4.939208984375, -4.75439453125, -4.569580078125, -4.384765625, -4.199951171875, -4.01513671875, -3.830322265625, -3.6455078125, -3.460693359375, -3.27587890625, -3.091064453125, -2.90625, -2.721435546875, -2.53662109375, -2.351806640625, -2.1669921875, -1.982177734375, -1.79736328125, -1.612548828125, -1.427734375, -1.242919921875, -1.05810546875, -0.873291015625, -0.6884765625, -0.503662109375, -0.31884765625, -0.134033203125, 0.05078125, 0.235595703125, 0.42041015625, 0.605224609375, 0.7900390625, 0.974853515625, 1.15966796875, 1.344482421875, 1.529296875, 1.714111328125, 1.89892578125, 2.083740234375, 2.2685546875, 2.453369140625, 2.63818359375, 2.822998046875, 3.0078125, 3.192626953125, 3.37744140625, 3.562255859375, 3.7470703125, 3.931884765625, 4.11669921875, 4.301513671875, 4.486328125, 4.671142578125, 4.85595703125, 5.040771484375, 5.2255859375, 5.410400390625, 5.59521484375, 5.780029296875, 5.96484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 14.0, 8.0, 14.0, 12.0, 20.0, 16.0, 32.0, 25.0, 18.0, 28.0, 27.0, 44.0, 33.0, 38.0, 37.0, 38.0, 32.0, 45.0, 49.0, 37.0, 29.0, 38.0, 33.0, 34.0, 32.0, 23.0, 23.0, 29.0, 36.0, 23.0, 19.0, 12.0, 12.0, 13.0, 12.0, 12.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5205841064453125, -1.467926025390625, -1.4152679443359375, -1.36260986328125, -1.3099517822265625, -1.257293701171875, -1.2046356201171875, -1.1519775390625, -1.0993194580078125, -1.046661376953125, -0.9940032958984375, -0.94134521484375, -0.8886871337890625, -0.836029052734375, -0.7833709716796875, -0.730712890625, -0.6780548095703125, -0.625396728515625, -0.5727386474609375, -0.52008056640625, -0.4674224853515625, -0.414764404296875, -0.3621063232421875, -0.3094482421875, -0.2567901611328125, -0.204132080078125, -0.1514739990234375, -0.09881591796875, -0.0461578369140625, 0.006500244140625, 0.0591583251953125, 0.11181640625, 0.1644744873046875, 0.217132568359375, 0.2697906494140625, 0.32244873046875, 0.3751068115234375, 0.427764892578125, 0.4804229736328125, 0.5330810546875, 0.5857391357421875, 0.638397216796875, 0.6910552978515625, 0.74371337890625, 0.7963714599609375, 0.849029541015625, 0.9016876220703125, 0.954345703125, 1.0070037841796875, 1.059661865234375, 1.1123199462890625, 1.16497802734375, 1.2176361083984375, 1.270294189453125, 1.3229522705078125, 1.3756103515625, 1.4282684326171875, 1.480926513671875, 1.5335845947265625, 1.58624267578125, 1.6389007568359375, 1.691558837890625, 1.7442169189453125, 1.796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 1.0, 5.0, 6.0, 17.0, 19.0, 14.0, 26.0, 49.0, 61.0, 67.0, 129.0, 150.0, 201.0, 288.0, 439.0, 644.0, 1005.0, 1618.0, 2803.0, 5081.0, 10755.0, 27764.0, 132835.0, 755937.0, 70173.0, 19665.0, 8215.0, 4175.0, 2313.0, 1359.0, 862.0, 569.0, 359.0, 259.0, 170.0, 134.0, 102.0, 59.0, 56.0, 55.0, 26.0, 16.0, 18.0, 14.0, 20.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.328125, -1.2882843017578125, -1.248443603515625, -1.2086029052734375, -1.16876220703125, -1.1289215087890625, -1.089080810546875, -1.0492401123046875, -1.0093994140625, -0.9695587158203125, -0.929718017578125, -0.8898773193359375, -0.85003662109375, -0.8101959228515625, -0.770355224609375, -0.7305145263671875, -0.690673828125, -0.6508331298828125, -0.610992431640625, -0.5711517333984375, -0.53131103515625, -0.4914703369140625, -0.451629638671875, -0.4117889404296875, -0.3719482421875, -0.3321075439453125, -0.292266845703125, -0.2524261474609375, -0.21258544921875, -0.1727447509765625, -0.132904052734375, -0.0930633544921875, -0.05322265625, -0.0133819580078125, 0.026458740234375, 0.0662994384765625, 0.10614013671875, 0.1459808349609375, 0.185821533203125, 0.2256622314453125, 0.2655029296875, 0.3053436279296875, 0.345184326171875, 0.3850250244140625, 0.42486572265625, 0.4647064208984375, 0.504547119140625, 0.5443878173828125, 0.584228515625, 0.6240692138671875, 0.663909912109375, 0.7037506103515625, 0.74359130859375, 0.7834320068359375, 0.823272705078125, 0.8631134033203125, 0.9029541015625, 0.9427947998046875, 0.982635498046875, 1.0224761962890625, 1.06231689453125, 1.1021575927734375, 1.141998291015625, 1.1818389892578125, 1.2216796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 4.0, 15.0, 11.0, 13.0, 18.0, 28.0, 59.0, 69.0, 102.0, 128.0, 174.0, 138.0, 85.0, 42.0, 32.0, 27.0, 24.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-05, -4.260055720806122e-05, -4.049763083457947e-05, -3.839470446109772e-05, -3.629177808761597e-05, -3.4188851714134216e-05, -3.2085925340652466e-05, -2.9982998967170715e-05, -2.7880072593688965e-05, -2.5777146220207214e-05, -2.3674219846725464e-05, -2.1571293473243713e-05, -1.9468367099761963e-05, -1.7365440726280212e-05, -1.5262514352798462e-05, -1.3159587979316711e-05, -1.1056661605834961e-05, -8.95373523235321e-06, -6.85080885887146e-06, -4.7478824853897095e-06, -2.644956111907959e-06, -5.420297384262085e-07, 1.560896635055542e-06, 3.6638230085372925e-06, 5.766749382019043e-06, 7.869675755500793e-06, 9.972602128982544e-06, 1.2075528502464294e-05, 1.4178454875946045e-05, 1.6281381249427795e-05, 1.8384307622909546e-05, 2.0487233996391296e-05, 2.2590160369873047e-05, 2.4693086743354797e-05, 2.6796013116836548e-05, 2.88989394903183e-05, 3.100186586380005e-05, 3.31047922372818e-05, 3.520771861076355e-05, 3.73106449842453e-05, 3.941357135772705e-05, 4.15164977312088e-05, 4.361942410469055e-05, 4.57223504781723e-05, 4.782527685165405e-05, 4.99282032251358e-05, 5.2031129598617554e-05, 5.4134055972099304e-05, 5.6236982345581055e-05, 5.8339908719062805e-05, 6.0442835092544556e-05, 6.25457614660263e-05, 6.464868783950806e-05, 6.675161421298981e-05, 6.885454058647156e-05, 7.095746695995331e-05, 7.306039333343506e-05, 7.516331970691681e-05, 7.726624608039856e-05, 7.936917245388031e-05, 8.147209882736206e-05, 8.357502520084381e-05, 8.567795157432556e-05, 8.778087794780731e-05, 8.988380432128906e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 12.0, 12.0, 18.0, 37.0, 48.0, 56.0, 104.0, 128.0, 181.0, 309.0, 400.0, 615.0, 1037.0, 1663.0, 2752.0, 5009.0, 9841.0, 21180.0, 54558.0, 208490.0, 569720.0, 105692.0, 34855.0, 14618.0, 7335.0, 3790.0, 2238.0, 1331.0, 868.0, 543.0, 359.0, 244.0, 146.0, 94.0, 85.0, 49.0, 41.0, 33.0, 20.0, 12.0, 4.0, 6.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.16796875, -1.1338958740234375, -1.099822998046875, -1.0657501220703125, -1.03167724609375, -0.9976043701171875, -0.963531494140625, -0.9294586181640625, -0.8953857421875, -0.8613128662109375, -0.827239990234375, -0.7931671142578125, -0.75909423828125, -0.7250213623046875, -0.690948486328125, -0.6568756103515625, -0.622802734375, -0.5887298583984375, -0.554656982421875, -0.5205841064453125, -0.48651123046875, -0.4524383544921875, -0.418365478515625, -0.3842926025390625, -0.3502197265625, -0.3161468505859375, -0.282073974609375, -0.2480010986328125, -0.21392822265625, -0.1798553466796875, -0.145782470703125, -0.1117095947265625, -0.07763671875, -0.0435638427734375, -0.009490966796875, 0.0245819091796875, 0.05865478515625, 0.0927276611328125, 0.126800537109375, 0.1608734130859375, 0.1949462890625, 0.2290191650390625, 0.263092041015625, 0.2971649169921875, 0.33123779296875, 0.3653106689453125, 0.399383544921875, 0.4334564208984375, 0.467529296875, 0.5016021728515625, 0.535675048828125, 0.5697479248046875, 0.60382080078125, 0.6378936767578125, 0.671966552734375, 0.7060394287109375, 0.7401123046875, 0.7741851806640625, 0.808258056640625, 0.8423309326171875, 0.87640380859375, 0.9104766845703125, 0.944549560546875, 0.9786224365234375, 1.0126953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 5.0, 11.0, 21.0, 17.0, 33.0, 42.0, 54.0, 70.0, 90.0, 122.0, 118.0, 114.0, 78.0, 50.0, 41.0, 29.0, 22.0, 9.0, 11.0, 9.0, 11.0, 5.0, 5.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.237060546875, -0.22910308837890625, -0.2211456298828125, -0.21318817138671875, -0.205230712890625, -0.19727325439453125, -0.1893157958984375, -0.18135833740234375, -0.17340087890625, -0.16544342041015625, -0.1574859619140625, -0.14952850341796875, -0.141571044921875, -0.13361358642578125, -0.1256561279296875, -0.11769866943359375, -0.1097412109375, -0.10178375244140625, -0.0938262939453125, -0.08586883544921875, -0.077911376953125, -0.06995391845703125, -0.0619964599609375, -0.05403900146484375, -0.04608154296875, -0.03812408447265625, -0.0301666259765625, -0.02220916748046875, -0.014251708984375, -0.00629425048828125, 0.0016632080078125, 0.00962066650390625, 0.017578125, 0.02553558349609375, 0.0334930419921875, 0.04145050048828125, 0.049407958984375, 0.05736541748046875, 0.0653228759765625, 0.07328033447265625, 0.08123779296875, 0.08919525146484375, 0.0971527099609375, 0.10511016845703125, 0.113067626953125, 0.12102508544921875, 0.1289825439453125, 0.13694000244140625, 0.1448974609375, 0.15285491943359375, 0.1608123779296875, 0.16876983642578125, 0.176727294921875, 0.18468475341796875, 0.1926422119140625, 0.20059967041015625, 0.20855712890625, 0.21651458740234375, 0.2244720458984375, 0.23242950439453125, 0.240386962890625, 0.24834442138671875, 0.2563018798828125, 0.26425933837890625, 0.272216796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 11.0, 13.0, 14.0, 28.0, 30.0, 48.0, 69.0, 119.0, 151.0, 138.0, 119.0, 80.0, 41.0, 40.0, 26.0, 18.0, 15.0, 14.0, 12.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.450377464294434, -6.27675724029541, -6.103137016296387, -5.9295172691345215, -5.755897045135498, -5.582276821136475, -5.408657073974609, -5.235036849975586, -5.0614166259765625, -4.887796401977539, -4.714176177978516, -4.54055643081665, -4.366936206817627, -4.1933159828186035, -4.019696235656738, -3.846076011657715, -3.6724557876586914, -3.498835563659668, -3.3252155780792236, -3.1515955924987793, -2.977975368499756, -2.8043551445007324, -2.630735158920288, -2.4571151733398438, -2.2834949493408203, -2.109874725341797, -1.9362547397613525, -1.7626346349716187, -1.5890145301818848, -1.4153944253921509, -1.241774320602417, -1.068154215812683, -0.8945345878601074, -0.7209144830703735, -0.5472943782806396, -0.37367427349090576, -0.20005416870117188, -0.02643406391143799, 0.1471860408782959, 0.3208061456680298, 0.49442625045776367, 0.6680463552474976, 0.8416664600372314, 1.0152865648269653, 1.1889066696166992, 1.362526774406433, 1.536146879196167, 1.7097669839859009, 1.8833870887756348, 2.057007312774658, 2.2306272983551025, 2.404247283935547, 2.5778675079345703, 2.7514877319335938, 2.925107717514038, 3.0987277030944824, 3.272347927093506, 3.4459681510925293, 3.6195881366729736, 3.793208122253418, 3.9668283462524414, 4.140448570251465, 4.314068794250488, 4.4876885414123535, 4.661308765411377]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 3.0, 5.0, 12.0, 8.0, 9.0, 12.0, 17.0, 15.0, 18.0, 24.0, 27.0, 32.0, 28.0, 29.0, 33.0, 34.0, 40.0, 31.0, 41.0, 34.0, 44.0, 37.0, 54.0, 39.0, 34.0, 39.0, 33.0, 32.0, 41.0, 24.0, 35.0, 23.0, 11.0, 12.0, 20.0, 8.0, 10.0, 10.0, 6.0, 5.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28342342376709, -2.2087173461914062, -2.1340110301971436, -2.05930495262146, -1.9845988750457764, -1.9098926782608032, -1.83518648147583, -1.7604804039001465, -1.6857742071151733, -1.6110680103302002, -1.5363619327545166, -1.4616557359695435, -1.3869495391845703, -1.3122434616088867, -1.2375372648239136, -1.1628310680389404, -1.0881249904632568, -1.0134187936782837, -0.9387127161026001, -0.864006519317627, -0.7893003821372986, -0.7145942449569702, -0.6398880481719971, -0.5651819109916687, -0.49047577381134033, -0.41576963663101196, -0.3410634696483612, -0.26635730266571045, -0.19165116548538208, -0.11694502830505371, -0.042238861322402954, 0.0324673056602478, 0.10717320442199707, 0.18187935650348663, 0.2565855085849762, 0.33129167556762695, 0.4059978127479553, 0.4807039499282837, 0.5554101467132568, 0.6301162838935852, 0.7048224210739136, 0.7795285582542419, 0.8542346954345703, 0.9289408922195435, 1.0036470890045166, 1.0783531665802002, 1.1530593633651733, 1.2277655601501465, 1.30247163772583, 1.3771778345108032, 1.4518839120864868, 1.52659010887146, 1.6012961864471436, 1.6760023832321167, 1.7507085800170898, 1.8254146575927734, 1.9001208543777466, 1.9748270511627197, 2.0495331287384033, 2.124239206314087, 2.1989455223083496, 2.273651599884033, 2.348357677459717, 2.4230639934539795, 2.497770071029663]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 6.0, 2.0, 9.0, 7.0, 23.0, 24.0, 36.0, 55.0, 56.0, 77.0, 129.0, 185.0, 271.0, 354.0, 523.0, 770.0, 1065.0, 1584.0, 2437.0, 3689.0, 5731.0, 8922.0, 14402.0, 22952.0, 38425.0, 65665.0, 113985.0, 192815.0, 223383.0, 143831.0, 81873.0, 47973.0, 28683.0, 17495.0, 10898.0, 6904.0, 4476.0, 2861.0, 1923.0, 1282.0, 811.0, 569.0, 414.0, 287.0, 194.0, 144.0, 101.0, 94.0, 46.0, 34.0, 24.0, 21.0, 13.0, 10.0, 8.0, 2.0, 6.0, 6.0, 1.0, 1.0], "bins": [-3.921875, -3.80010986328125, -3.6783447265625, -3.55657958984375, -3.434814453125, -3.31304931640625, -3.1912841796875, -3.06951904296875, -2.94775390625, -2.82598876953125, -2.7042236328125, -2.58245849609375, -2.460693359375, -2.33892822265625, -2.2171630859375, -2.09539794921875, -1.9736328125, -1.85186767578125, -1.7301025390625, -1.60833740234375, -1.486572265625, -1.36480712890625, -1.2430419921875, -1.12127685546875, -0.99951171875, -0.87774658203125, -0.7559814453125, -0.63421630859375, -0.512451171875, -0.39068603515625, -0.2689208984375, -0.14715576171875, -0.025390625, 0.09637451171875, 0.2181396484375, 0.33990478515625, 0.461669921875, 0.58343505859375, 0.7052001953125, 0.82696533203125, 0.94873046875, 1.07049560546875, 1.1922607421875, 1.31402587890625, 1.435791015625, 1.55755615234375, 1.6793212890625, 1.80108642578125, 1.9228515625, 2.04461669921875, 2.1663818359375, 2.28814697265625, 2.409912109375, 2.53167724609375, 2.6534423828125, 2.77520751953125, 2.89697265625, 3.01873779296875, 3.1405029296875, 3.26226806640625, 3.384033203125, 3.50579833984375, 3.6275634765625, 3.74932861328125, 3.87109375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 8.0, 9.0, 11.0, 11.0, 17.0, 20.0, 25.0, 23.0, 28.0, 36.0, 41.0, 36.0, 34.0, 35.0, 38.0, 44.0, 32.0, 41.0, 47.0, 44.0, 32.0, 49.0, 52.0, 34.0, 38.0, 26.0, 29.0, 22.0, 16.0, 12.0, 18.0, 11.0, 8.0, 8.0, 10.0, 10.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.23828125, -2.168792724609375, -2.09930419921875, -2.029815673828125, -1.9603271484375, -1.890838623046875, -1.82135009765625, -1.751861572265625, -1.682373046875, -1.612884521484375, -1.54339599609375, -1.473907470703125, -1.4044189453125, -1.334930419921875, -1.26544189453125, -1.195953369140625, -1.12646484375, -1.056976318359375, -0.98748779296875, -0.917999267578125, -0.8485107421875, -0.779022216796875, -0.70953369140625, -0.640045166015625, -0.570556640625, -0.501068115234375, -0.43157958984375, -0.362091064453125, -0.2926025390625, -0.223114013671875, -0.15362548828125, -0.084136962890625, -0.0146484375, 0.054840087890625, 0.12432861328125, 0.193817138671875, 0.2633056640625, 0.332794189453125, 0.40228271484375, 0.471771240234375, 0.541259765625, 0.610748291015625, 0.68023681640625, 0.749725341796875, 0.8192138671875, 0.888702392578125, 0.95819091796875, 1.027679443359375, 1.09716796875, 1.166656494140625, 1.23614501953125, 1.305633544921875, 1.3751220703125, 1.444610595703125, 1.51409912109375, 1.583587646484375, 1.653076171875, 1.722564697265625, 1.79205322265625, 1.861541748046875, 1.9310302734375, 2.000518798828125, 2.07000732421875, 2.139495849609375, 2.208984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 11.0, 9.0, 16.0, 17.0, 25.0, 36.0, 54.0, 65.0, 102.0, 175.0, 247.0, 393.0, 618.0, 936.0, 1416.0, 2538.0, 4031.0, 6802.0, 12251.0, 21592.0, 38907.0, 71254.0, 130336.0, 231435.0, 231674.0, 131157.0, 71723.0, 39217.0, 21757.0, 12080.0, 6931.0, 4150.0, 2465.0, 1532.0, 898.0, 587.0, 353.0, 254.0, 158.0, 120.0, 80.0, 50.0, 35.0, 14.0, 22.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-4.5234375, -4.390411376953125, -4.25738525390625, -4.124359130859375, -3.9913330078125, -3.858306884765625, -3.72528076171875, -3.592254638671875, -3.459228515625, -3.326202392578125, -3.19317626953125, -3.060150146484375, -2.9271240234375, -2.794097900390625, -2.66107177734375, -2.528045654296875, -2.39501953125, -2.261993408203125, -2.12896728515625, -1.995941162109375, -1.8629150390625, -1.729888916015625, -1.59686279296875, -1.463836669921875, -1.330810546875, -1.197784423828125, -1.06475830078125, -0.931732177734375, -0.7987060546875, -0.665679931640625, -0.53265380859375, -0.399627685546875, -0.2666015625, -0.133575439453125, -0.00054931640625, 0.132476806640625, 0.2655029296875, 0.398529052734375, 0.53155517578125, 0.664581298828125, 0.797607421875, 0.930633544921875, 1.06365966796875, 1.196685791015625, 1.3297119140625, 1.462738037109375, 1.59576416015625, 1.728790283203125, 1.86181640625, 1.994842529296875, 2.12786865234375, 2.260894775390625, 2.3939208984375, 2.526947021484375, 2.65997314453125, 2.792999267578125, 2.926025390625, 3.059051513671875, 3.19207763671875, 3.325103759765625, 3.4581298828125, 3.591156005859375, 3.72418212890625, 3.857208251953125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 12.0, 13.0, 14.0, 10.0, 20.0, 21.0, 20.0, 26.0, 31.0, 25.0, 30.0, 28.0, 47.0, 41.0, 47.0, 59.0, 42.0, 43.0, 36.0, 52.0, 40.0, 52.0, 36.0, 32.0, 31.0, 31.0, 30.0, 19.0, 23.0, 15.0, 16.0, 6.0, 9.0, 9.0, 6.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-1.826171875, -1.7763519287109375, -1.726531982421875, -1.6767120361328125, -1.62689208984375, -1.5770721435546875, -1.527252197265625, -1.4774322509765625, -1.4276123046875, -1.3777923583984375, -1.327972412109375, -1.2781524658203125, -1.22833251953125, -1.1785125732421875, -1.128692626953125, -1.0788726806640625, -1.029052734375, -0.9792327880859375, -0.929412841796875, -0.8795928955078125, -0.82977294921875, -0.7799530029296875, -0.730133056640625, -0.6803131103515625, -0.6304931640625, -0.5806732177734375, -0.530853271484375, -0.4810333251953125, -0.43121337890625, -0.3813934326171875, -0.331573486328125, -0.2817535400390625, -0.23193359375, -0.1821136474609375, -0.132293701171875, -0.0824737548828125, -0.03265380859375, 0.0171661376953125, 0.066986083984375, 0.1168060302734375, 0.1666259765625, 0.2164459228515625, 0.266265869140625, 0.3160858154296875, 0.36590576171875, 0.4157257080078125, 0.465545654296875, 0.5153656005859375, 0.565185546875, 0.6150054931640625, 0.664825439453125, 0.7146453857421875, 0.76446533203125, 0.8142852783203125, 0.864105224609375, 0.9139251708984375, 0.9637451171875, 1.0135650634765625, 1.063385009765625, 1.1132049560546875, 1.16302490234375, 1.2128448486328125, 1.262664794921875, 1.3124847412109375, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 9.0, 7.0, 9.0, 8.0, 11.0, 26.0, 31.0, 46.0, 53.0, 92.0, 143.0, 188.0, 307.0, 487.0, 743.0, 1299.0, 2405.0, 4842.0, 11627.0, 34040.0, 197593.0, 713796.0, 51936.0, 15547.0, 6292.0, 3019.0, 1568.0, 855.0, 518.0, 346.0, 233.0, 125.0, 109.0, 82.0, 60.0, 34.0, 20.0, 17.0, 13.0, 11.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.00921630859375, -5.7957763671875, -5.58233642578125, -5.368896484375, -5.15545654296875, -4.9420166015625, -4.72857666015625, -4.51513671875, -4.30169677734375, -4.0882568359375, -3.87481689453125, -3.661376953125, -3.44793701171875, -3.2344970703125, -3.02105712890625, -2.8076171875, -2.59417724609375, -2.3807373046875, -2.16729736328125, -1.953857421875, -1.74041748046875, -1.5269775390625, -1.31353759765625, -1.10009765625, -0.88665771484375, -0.6732177734375, -0.45977783203125, -0.246337890625, -0.03289794921875, 0.1805419921875, 0.39398193359375, 0.607421875, 0.82086181640625, 1.0343017578125, 1.24774169921875, 1.461181640625, 1.67462158203125, 1.8880615234375, 2.10150146484375, 2.31494140625, 2.52838134765625, 2.7418212890625, 2.95526123046875, 3.168701171875, 3.38214111328125, 3.5955810546875, 3.80902099609375, 4.0224609375, 4.23590087890625, 4.4493408203125, 4.66278076171875, 4.876220703125, 5.08966064453125, 5.3031005859375, 5.51654052734375, 5.72998046875, 5.94342041015625, 6.1568603515625, 6.37030029296875, 6.583740234375, 6.79718017578125, 7.0106201171875, 7.22406005859375, 7.4375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 1.0, 4.0, 5.0, 8.0, 8.0, 6.0, 20.0, 29.0, 25.0, 37.0, 59.0, 87.0, 153.0, 201.0, 96.0, 69.0, 49.0, 27.0, 28.0, 15.0, 15.0, 12.0, 3.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012969970703125, -0.00012590736150741577, -0.00012211501598358154, -0.00011832267045974731, -0.00011453032493591309, -0.00011073797941207886, -0.00010694563388824463, -0.0001031532883644104, -9.936094284057617e-05, -9.556859731674194e-05, -9.177625179290771e-05, -8.798390626907349e-05, -8.419156074523926e-05, -8.039921522140503e-05, -7.66068696975708e-05, -7.281452417373657e-05, -6.902217864990234e-05, -6.522983312606812e-05, -6.143748760223389e-05, -5.764514207839966e-05, -5.385279655456543e-05, -5.00604510307312e-05, -4.626810550689697e-05, -4.2475759983062744e-05, -3.8683414459228516e-05, -3.489106893539429e-05, -3.109872341156006e-05, -2.730637788772583e-05, -2.35140323638916e-05, -1.9721686840057373e-05, -1.5929341316223145e-05, -1.2136995792388916e-05, -8.344650268554688e-06, -4.552304744720459e-06, -7.599592208862305e-07, 3.032386302947998e-06, 6.8247318267822266e-06, 1.0617077350616455e-05, 1.4409422874450684e-05, 1.8201768398284912e-05, 2.199411392211914e-05, 2.578645944595337e-05, 2.9578804969787598e-05, 3.3371150493621826e-05, 3.7163496017456055e-05, 4.095584154129028e-05, 4.474818706512451e-05, 4.854053258895874e-05, 5.233287811279297e-05, 5.61252236366272e-05, 5.9917569160461426e-05, 6.370991468429565e-05, 6.750226020812988e-05, 7.129460573196411e-05, 7.508695125579834e-05, 7.887929677963257e-05, 8.26716423034668e-05, 8.646398782730103e-05, 9.025633335113525e-05, 9.404867887496948e-05, 9.784102439880371e-05, 0.00010163336992263794, 0.00010542571544647217, 0.0001092180609703064, 0.00011301040649414062]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 8.0, 9.0, 13.0, 21.0, 48.0, 57.0, 73.0, 102.0, 148.0, 190.0, 251.0, 442.0, 629.0, 903.0, 1363.0, 2213.0, 4142.0, 7915.0, 18161.0, 52601.0, 622348.0, 259927.0, 43917.0, 15979.0, 7158.0, 3776.0, 2086.0, 1249.0, 867.0, 577.0, 402.0, 277.0, 208.0, 143.0, 92.0, 70.0, 42.0, 37.0, 22.0, 13.0, 16.0, 12.0, 5.0, 6.0, 8.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.9833984375, -4.822265625, -4.6611328125, -4.5, -4.3388671875, -4.177734375, -4.0166015625, -3.85546875, -3.6943359375, -3.533203125, -3.3720703125, -3.2109375, -3.0498046875, -2.888671875, -2.7275390625, -2.56640625, -2.4052734375, -2.244140625, -2.0830078125, -1.921875, -1.7607421875, -1.599609375, -1.4384765625, -1.27734375, -1.1162109375, -0.955078125, -0.7939453125, -0.6328125, -0.4716796875, -0.310546875, -0.1494140625, 0.01171875, 0.1728515625, 0.333984375, 0.4951171875, 0.65625, 0.8173828125, 0.978515625, 1.1396484375, 1.30078125, 1.4619140625, 1.623046875, 1.7841796875, 1.9453125, 2.1064453125, 2.267578125, 2.4287109375, 2.58984375, 2.7509765625, 2.912109375, 3.0732421875, 3.234375, 3.3955078125, 3.556640625, 3.7177734375, 3.87890625, 4.0400390625, 4.201171875, 4.3623046875, 4.5234375, 4.6845703125, 4.845703125, 5.0068359375, 5.16796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 4.0, 10.0, 7.0, 5.0, 25.0, 23.0, 22.0, 39.0, 50.0, 76.0, 222.0, 208.0, 82.0, 44.0, 51.0, 25.0, 16.0, 19.0, 15.0, 12.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.25, -1.21209716796875, -1.1741943359375, -1.13629150390625, -1.098388671875, -1.06048583984375, -1.0225830078125, -0.98468017578125, -0.94677734375, -0.90887451171875, -0.8709716796875, -0.83306884765625, -0.795166015625, -0.75726318359375, -0.7193603515625, -0.68145751953125, -0.6435546875, -0.60565185546875, -0.5677490234375, -0.52984619140625, -0.491943359375, -0.45404052734375, -0.4161376953125, -0.37823486328125, -0.34033203125, -0.30242919921875, -0.2645263671875, -0.22662353515625, -0.188720703125, -0.15081787109375, -0.1129150390625, -0.07501220703125, -0.037109375, 0.00079345703125, 0.0386962890625, 0.07659912109375, 0.114501953125, 0.15240478515625, 0.1903076171875, 0.22821044921875, 0.26611328125, 0.30401611328125, 0.3419189453125, 0.37982177734375, 0.417724609375, 0.45562744140625, 0.4935302734375, 0.53143310546875, 0.5693359375, 0.60723876953125, 0.6451416015625, 0.68304443359375, 0.720947265625, 0.75885009765625, 0.7967529296875, 0.83465576171875, 0.87255859375, 0.91046142578125, 0.9483642578125, 0.98626708984375, 1.024169921875, 1.06207275390625, 1.0999755859375, 1.13787841796875, 1.17578125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 21.0, 22.0, 29.0, 45.0, 74.0, 118.0, 150.0, 162.0, 89.0, 74.0, 63.0, 33.0, 24.0, 21.0, 16.0, 10.0, 7.0, 6.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.855809688568115, -5.697134017944336, -5.538457870483398, -5.379782199859619, -5.22110652923584, -5.062430381774902, -4.903754711151123, -4.745079040527344, -4.586402893066406, -4.427727222442627, -4.2690510749816895, -4.11037540435791, -3.951699733734131, -3.7930238246917725, -3.634347915649414, -3.4756722450256348, -3.3169965744018555, -3.158320665359497, -2.9996449947357178, -2.8409690856933594, -2.68229341506958, -2.5236175060272217, -2.3649415969848633, -2.206265926361084, -2.0475900173187256, -1.8889142274856567, -1.730238437652588, -1.5715625286102295, -1.4128867387771606, -1.2542109489440918, -1.0955350399017334, -0.9368592500686646, -0.7781839370727539, -0.6195081472396851, -0.46083229780197144, -0.3021564781665802, -0.14348065853118896, 0.015195131301879883, 0.1738709807395935, 0.33254683017730713, 0.491222620010376, 0.6498984098434448, 0.8085742592811584, 0.9672501087188721, 1.125925898551941, 1.2846016883850098, 1.4432775974273682, 1.601953387260437, 1.7606291770935059, 1.9193049669265747, 2.0779807567596436, 2.236656665802002, 2.3953323364257812, 2.5540082454681396, 2.712684154510498, 2.8713598251342773, 3.0300357341766357, 3.188711643218994, 3.3473873138427734, 3.506063222885132, 3.6647391319274902, 3.8234148025512695, 3.982090711593628, 4.140766620635986, 4.299442291259766]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 10.0, 12.0, 11.0, 10.0, 16.0, 8.0, 14.0, 17.0, 21.0, 17.0, 27.0, 28.0, 18.0, 27.0, 34.0, 43.0, 31.0, 32.0, 45.0, 34.0, 39.0, 46.0, 44.0, 60.0, 41.0, 36.0, 29.0, 26.0, 28.0, 27.0, 18.0, 20.0, 22.0, 24.0, 12.0, 8.0, 10.0, 11.0, 10.0, 6.0, 3.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091533660888672, -2.0223774909973145, -1.953221321105957, -1.8840651512145996, -1.8149088621139526, -1.7457526922225952, -1.6765965223312378, -1.6074403524398804, -1.5382840633392334, -1.469127893447876, -1.3999717235565186, -1.3308155536651611, -1.2616592645645142, -1.1925030946731567, -1.1233469247817993, -1.054190754890442, -0.9850345849990845, -0.915878415107727, -0.8467221856117249, -0.7775660157203674, -0.7084097862243652, -0.6392536163330078, -0.5700974464416504, -0.500941276550293, -0.43178504705429077, -0.36262884736061096, -0.29347264766693115, -0.22431647777557373, -0.15516027808189392, -0.08600407838821411, -0.01684790849685669, 0.05230829119682312, 0.12146449089050293, 0.19062069058418274, 0.25977689027786255, 0.32893306016921997, 0.3980892598628998, 0.4672454595565796, 0.536401629447937, 0.6055577993392944, 0.6747140288352966, 0.743870198726654, 0.8130264282226562, 0.8821825981140137, 0.9513387680053711, 1.0204949378967285, 1.089651107788086, 1.158807396888733, 1.2279635667800903, 1.2971197366714478, 1.3662759065628052, 1.4354321956634521, 1.5045883655548096, 1.573744535446167, 1.6429007053375244, 1.7120568752288818, 1.7812130451202393, 1.8503692150115967, 1.919525384902954, 1.9886815547943115, 2.057837724685669, 2.1269941329956055, 2.196150302886963, 2.2653064727783203, 2.3344626426696777]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 11.0, 4.0, 11.0, 14.0, 21.0, 18.0, 36.0, 40.0, 58.0, 77.0, 120.0, 124.0, 212.0, 278.0, 410.0, 539.0, 820.0, 1127.0, 1679.0, 2339.0, 3434.0, 5059.0, 7926.0, 12991.0, 21369.0, 37033.0, 67765.0, 137476.0, 355342.0, 1358594.0, 1470784.0, 387265.0, 145768.0, 72231.0, 39923.0, 23173.0, 14109.0, 8924.0, 5622.0, 3753.0, 2535.0, 1697.0, 1161.0, 776.0, 519.0, 368.0, 269.0, 155.0, 114.0, 76.0, 53.0, 34.0, 20.0, 10.0, 9.0, 3.0, 5.0, 4.0], "bins": [-3.826171875, -3.720001220703125, -3.61383056640625, -3.507659912109375, -3.4014892578125, -3.295318603515625, -3.18914794921875, -3.082977294921875, -2.976806640625, -2.870635986328125, -2.76446533203125, -2.658294677734375, -2.5521240234375, -2.445953369140625, -2.33978271484375, -2.233612060546875, -2.12744140625, -2.021270751953125, -1.91510009765625, -1.808929443359375, -1.7027587890625, -1.596588134765625, -1.49041748046875, -1.384246826171875, -1.278076171875, -1.171905517578125, -1.06573486328125, -0.959564208984375, -0.8533935546875, -0.747222900390625, -0.64105224609375, -0.534881591796875, -0.4287109375, -0.322540283203125, -0.21636962890625, -0.110198974609375, -0.0040283203125, 0.102142333984375, 0.20831298828125, 0.314483642578125, 0.420654296875, 0.526824951171875, 0.63299560546875, 0.739166259765625, 0.8453369140625, 0.951507568359375, 1.05767822265625, 1.163848876953125, 1.27001953125, 1.376190185546875, 1.48236083984375, 1.588531494140625, 1.6947021484375, 1.800872802734375, 1.90704345703125, 2.013214111328125, 2.119384765625, 2.225555419921875, 2.33172607421875, 2.437896728515625, 2.5440673828125, 2.650238037109375, 2.75640869140625, 2.862579345703125, 2.96875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 8.0, 9.0, 9.0, 20.0, 14.0, 18.0, 16.0, 18.0, 26.0, 26.0, 28.0, 28.0, 29.0, 41.0, 31.0, 36.0, 47.0, 41.0, 40.0, 50.0, 54.0, 47.0, 33.0, 46.0, 34.0, 24.0, 21.0, 39.0, 19.0, 20.0, 13.0, 18.0, 12.0, 14.0, 9.0, 8.0, 7.0, 8.0, 1.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.47265625, -1.4268341064453125, -1.381011962890625, -1.3351898193359375, -1.28936767578125, -1.2435455322265625, -1.197723388671875, -1.1519012451171875, -1.1060791015625, -1.0602569580078125, -1.014434814453125, -0.9686126708984375, -0.92279052734375, -0.8769683837890625, -0.831146240234375, -0.7853240966796875, -0.739501953125, -0.6936798095703125, -0.647857666015625, -0.6020355224609375, -0.55621337890625, -0.5103912353515625, -0.464569091796875, -0.4187469482421875, -0.3729248046875, -0.3271026611328125, -0.281280517578125, -0.2354583740234375, -0.18963623046875, -0.1438140869140625, -0.097991943359375, -0.0521697998046875, -0.00634765625, 0.0394744873046875, 0.085296630859375, 0.1311187744140625, 0.17694091796875, 0.2227630615234375, 0.268585205078125, 0.3144073486328125, 0.3602294921875, 0.4060516357421875, 0.451873779296875, 0.4976959228515625, 0.54351806640625, 0.5893402099609375, 0.635162353515625, 0.6809844970703125, 0.726806640625, 0.7726287841796875, 0.818450927734375, 0.8642730712890625, 0.91009521484375, 0.9559173583984375, 1.001739501953125, 1.0475616455078125, 1.0933837890625, 1.1392059326171875, 1.185028076171875, 1.2308502197265625, 1.27667236328125, 1.3224945068359375, 1.368316650390625, 1.4141387939453125, 1.4599609375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 14.0, 14.0, 18.0, 32.0, 49.0, 63.0, 96.0, 140.0, 216.0, 371.0, 525.0, 883.0, 1396.0, 2330.0, 4045.0, 7282.0, 12672.0, 24123.0, 47973.0, 102663.0, 244287.0, 704440.0, 1837808.0, 738313.0, 253524.0, 105628.0, 49453.0, 24760.0, 13334.0, 7223.0, 4244.0, 2438.0, 1472.0, 840.0, 596.0, 345.0, 244.0, 141.0, 98.0, 60.0, 33.0, 32.0, 22.0, 12.0, 9.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.31854248046875, -3.2132568359375, -3.10797119140625, -3.002685546875, -2.89739990234375, -2.7921142578125, -2.68682861328125, -2.58154296875, -2.47625732421875, -2.3709716796875, -2.26568603515625, -2.160400390625, -2.05511474609375, -1.9498291015625, -1.84454345703125, -1.7392578125, -1.63397216796875, -1.5286865234375, -1.42340087890625, -1.318115234375, -1.21282958984375, -1.1075439453125, -1.00225830078125, -0.89697265625, -0.79168701171875, -0.6864013671875, -0.58111572265625, -0.475830078125, -0.37054443359375, -0.2652587890625, -0.15997314453125, -0.0546875, 0.05059814453125, 0.1558837890625, 0.26116943359375, 0.366455078125, 0.47174072265625, 0.5770263671875, 0.68231201171875, 0.78759765625, 0.89288330078125, 0.9981689453125, 1.10345458984375, 1.208740234375, 1.31402587890625, 1.4193115234375, 1.52459716796875, 1.6298828125, 1.73516845703125, 1.8404541015625, 1.94573974609375, 2.051025390625, 2.15631103515625, 2.2615966796875, 2.36688232421875, 2.47216796875, 2.57745361328125, 2.6827392578125, 2.78802490234375, 2.893310546875, 2.99859619140625, 3.1038818359375, 3.20916748046875, 3.314453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 3.0, 7.0, 11.0, 10.0, 13.0, 16.0, 23.0, 24.0, 44.0, 50.0, 46.0, 55.0, 70.0, 105.0, 96.0, 141.0, 174.0, 193.0, 219.0, 243.0, 274.0, 258.0, 284.0, 270.0, 239.0, 209.0, 188.0, 142.0, 131.0, 85.0, 104.0, 57.0, 42.0, 44.0, 35.0, 34.0, 35.0, 20.0, 17.0, 14.0, 7.0, 4.0, 15.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.76171875, -0.7371826171875, -0.712646484375, -0.6881103515625, -0.66357421875, -0.6390380859375, -0.614501953125, -0.5899658203125, -0.5654296875, -0.5408935546875, -0.516357421875, -0.4918212890625, -0.46728515625, -0.4427490234375, -0.418212890625, -0.3936767578125, -0.369140625, -0.3446044921875, -0.320068359375, -0.2955322265625, -0.27099609375, -0.2464599609375, -0.221923828125, -0.1973876953125, -0.1728515625, -0.1483154296875, -0.123779296875, -0.0992431640625, -0.07470703125, -0.0501708984375, -0.025634765625, -0.0010986328125, 0.0234375, 0.0479736328125, 0.072509765625, 0.0970458984375, 0.12158203125, 0.1461181640625, 0.170654296875, 0.1951904296875, 0.2197265625, 0.2442626953125, 0.268798828125, 0.2933349609375, 0.31787109375, 0.3424072265625, 0.366943359375, 0.3914794921875, 0.416015625, 0.4405517578125, 0.465087890625, 0.4896240234375, 0.51416015625, 0.5386962890625, 0.563232421875, 0.5877685546875, 0.6123046875, 0.6368408203125, 0.661376953125, 0.6859130859375, 0.71044921875, 0.7349853515625, 0.759521484375, 0.7840576171875, 0.80859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 14.0, 14.0, 25.0, 44.0, 53.0, 90.0, 126.0, 139.0, 146.0, 100.0, 67.0, 44.0, 34.0, 26.0, 15.0, 12.0, 9.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.113173961639404, -4.994057655334473, -4.874941349029541, -4.755825042724609, -4.636708736419678, -4.517592430114746, -4.3984761238098145, -4.279359817504883, -4.160243511199951, -4.0411272048950195, -3.922010898590088, -3.8028945922851562, -3.6837782859802246, -3.564661979675293, -3.4455456733703613, -3.3264293670654297, -3.207312822341919, -3.0881965160369873, -2.9690802097320557, -2.849963903427124, -2.7308475971221924, -2.6117312908172607, -2.49261474609375, -2.3734984397888184, -2.2543821334838867, -2.135265827178955, -2.0161495208740234, -1.8970332145690918, -1.7779169082641602, -1.6588006019592285, -1.5396841764450073, -1.4205678701400757, -1.3014514446258545, -1.1823351383209229, -1.0632188320159912, -0.9441024661064148, -0.8249861598014832, -0.7058698534965515, -0.5867534875869751, -0.46763718128204346, -0.3485208749771118, -0.22940455377101898, -0.11028823256492615, 0.00882810354232788, 0.12794440984725952, 0.24706071615219116, 0.3661770820617676, 0.4852933883666992, 0.6044096946716309, 0.7235260009765625, 0.8426423072814941, 0.9617586731910706, 1.0808749198913574, 1.199991226196289, 1.3191076517105103, 1.438223958015442, 1.5573402643203735, 1.6764565706253052, 1.7955728769302368, 1.914689302444458, 2.0338056087493896, 2.1529219150543213, 2.272038221359253, 2.3911545276641846, 2.510270833969116]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 6.0, 13.0, 8.0, 8.0, 11.0, 16.0, 25.0, 24.0, 32.0, 37.0, 24.0, 27.0, 35.0, 31.0, 31.0, 39.0, 40.0, 46.0, 51.0, 36.0, 41.0, 51.0, 49.0, 29.0, 39.0, 37.0, 20.0, 22.0, 28.0, 22.0, 21.0, 11.0, 9.0, 14.0, 12.0, 2.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8106961250305176, -1.757601261138916, -1.7045063972473145, -1.651411533355713, -1.5983166694641113, -1.5452218055725098, -1.4921269416809082, -1.4390320777893066, -1.385937213897705, -1.3328423500061035, -1.279747486114502, -1.2266526222229004, -1.1735577583312988, -1.1204628944396973, -1.0673680305480957, -1.0142731666564941, -0.9611783623695374, -0.9080834984779358, -0.8549886345863342, -0.8018937706947327, -0.7487989068031311, -0.6957041025161743, -0.6426092386245728, -0.5895143747329712, -0.5364195108413696, -0.48332464694976807, -0.4302297830581665, -0.37713491916656494, -0.3240400552749634, -0.2709452211856842, -0.21785035729408264, -0.16475549340248108, -0.11166059970855713, -0.058565739542245865, -0.005470879375934601, 0.047623977065086365, 0.10071884095668793, 0.1538136899471283, 0.20690855383872986, 0.2600034177303314, 0.313098281621933, 0.36619314551353455, 0.4192880094051361, 0.4723828434944153, 0.5254777073860168, 0.5785725712776184, 0.63166743516922, 0.6847622990608215, 0.7378571629524231, 0.7909520268440247, 0.8440468907356262, 0.8971417546272278, 0.9502366185188293, 1.0033314228057861, 1.0564262866973877, 1.1095211505889893, 1.1626160144805908, 1.2157108783721924, 1.268805742263794, 1.3219006061553955, 1.374995470046997, 1.4280903339385986, 1.4811851978302002, 1.5342800617218018, 1.5873749256134033]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 5.0, 5.0, 9.0, 22.0, 24.0, 36.0, 43.0, 81.0, 90.0, 140.0, 226.0, 375.0, 568.0, 889.0, 1390.0, 2364.0, 4237.0, 7481.0, 13942.0, 27910.0, 60446.0, 156995.0, 462461.0, 178298.0, 66327.0, 30106.0, 14973.0, 8037.0, 4472.0, 2561.0, 1479.0, 911.0, 548.0, 334.0, 233.0, 169.0, 106.0, 77.0, 44.0, 42.0, 29.0, 18.0, 7.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98046875, -1.9156494140625, -1.850830078125, -1.7860107421875, -1.72119140625, -1.6563720703125, -1.591552734375, -1.5267333984375, -1.4619140625, -1.3970947265625, -1.332275390625, -1.2674560546875, -1.20263671875, -1.1378173828125, -1.072998046875, -1.0081787109375, -0.943359375, -0.8785400390625, -0.813720703125, -0.7489013671875, -0.68408203125, -0.6192626953125, -0.554443359375, -0.4896240234375, -0.4248046875, -0.3599853515625, -0.295166015625, -0.2303466796875, -0.16552734375, -0.1007080078125, -0.035888671875, 0.0289306640625, 0.09375, 0.1585693359375, 0.223388671875, 0.2882080078125, 0.35302734375, 0.4178466796875, 0.482666015625, 0.5474853515625, 0.6123046875, 0.6771240234375, 0.741943359375, 0.8067626953125, 0.87158203125, 0.9364013671875, 1.001220703125, 1.0660400390625, 1.130859375, 1.1956787109375, 1.260498046875, 1.3253173828125, 1.39013671875, 1.4549560546875, 1.519775390625, 1.5845947265625, 1.6494140625, 1.7142333984375, 1.779052734375, 1.8438720703125, 1.90869140625, 1.9735107421875, 2.038330078125, 2.1031494140625, 2.16796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 7.0, 7.0, 10.0, 12.0, 9.0, 20.0, 23.0, 24.0, 22.0, 27.0, 36.0, 40.0, 34.0, 32.0, 42.0, 41.0, 43.0, 47.0, 38.0, 52.0, 41.0, 41.0, 47.0, 34.0, 44.0, 24.0, 27.0, 24.0, 19.0, 22.0, 16.0, 13.0, 10.0, 10.0, 10.0, 7.0, 8.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.9609375, -1.9049072265625, -1.848876953125, -1.7928466796875, -1.73681640625, -1.6807861328125, -1.624755859375, -1.5687255859375, -1.5126953125, -1.4566650390625, -1.400634765625, -1.3446044921875, -1.28857421875, -1.2325439453125, -1.176513671875, -1.1204833984375, -1.064453125, -1.0084228515625, -0.952392578125, -0.8963623046875, -0.84033203125, -0.7843017578125, -0.728271484375, -0.6722412109375, -0.6162109375, -0.5601806640625, -0.504150390625, -0.4481201171875, -0.39208984375, -0.3360595703125, -0.280029296875, -0.2239990234375, -0.16796875, -0.1119384765625, -0.055908203125, 0.0001220703125, 0.05615234375, 0.1121826171875, 0.168212890625, 0.2242431640625, 0.2802734375, 0.3363037109375, 0.392333984375, 0.4483642578125, 0.50439453125, 0.5604248046875, 0.616455078125, 0.6724853515625, 0.728515625, 0.7845458984375, 0.840576171875, 0.8966064453125, 0.95263671875, 1.0086669921875, 1.064697265625, 1.1207275390625, 1.1767578125, 1.2327880859375, 1.288818359375, 1.3448486328125, 1.40087890625, 1.4569091796875, 1.512939453125, 1.5689697265625, 1.625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 10.0, 15.0, 16.0, 25.0, 28.0, 38.0, 35.0, 60.0, 81.0, 100.0, 136.0, 200.0, 279.0, 407.0, 622.0, 930.0, 1583.0, 2407.0, 4140.0, 7568.0, 15832.0, 44352.0, 506330.0, 389035.0, 41194.0, 15235.0, 7333.0, 3953.0, 2289.0, 1415.0, 913.0, 595.0, 389.0, 275.0, 185.0, 131.0, 90.0, 82.0, 58.0, 42.0, 32.0, 29.0, 20.0, 18.0, 3.0, 6.0, 9.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0], "bins": [-3.138671875, -3.037322998046875, -2.93597412109375, -2.834625244140625, -2.7332763671875, -2.631927490234375, -2.53057861328125, -2.429229736328125, -2.327880859375, -2.226531982421875, -2.12518310546875, -2.023834228515625, -1.9224853515625, -1.821136474609375, -1.71978759765625, -1.618438720703125, -1.51708984375, -1.415740966796875, -1.31439208984375, -1.213043212890625, -1.1116943359375, -1.010345458984375, -0.90899658203125, -0.807647705078125, -0.706298828125, -0.604949951171875, -0.50360107421875, -0.402252197265625, -0.3009033203125, -0.199554443359375, -0.09820556640625, 0.003143310546875, 0.1044921875, 0.205841064453125, 0.30718994140625, 0.408538818359375, 0.5098876953125, 0.611236572265625, 0.71258544921875, 0.813934326171875, 0.915283203125, 1.016632080078125, 1.11798095703125, 1.219329833984375, 1.3206787109375, 1.422027587890625, 1.52337646484375, 1.624725341796875, 1.72607421875, 1.827423095703125, 1.92877197265625, 2.030120849609375, 2.1314697265625, 2.232818603515625, 2.33416748046875, 2.435516357421875, 2.536865234375, 2.638214111328125, 2.73956298828125, 2.840911865234375, 2.9422607421875, 3.043609619140625, 3.14495849609375, 3.246307373046875, 3.34765625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 12.0, 6.0, 4.0, 4.0, 13.0, 9.0, 21.0, 19.0, 22.0, 27.0, 21.0, 24.0, 26.0, 36.0, 38.0, 42.0, 38.0, 45.0, 35.0, 47.0, 45.0, 60.0, 37.0, 30.0, 40.0, 38.0, 45.0, 27.0, 27.0, 33.0, 22.0, 22.0, 18.0, 25.0, 16.0, 9.0, 8.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.27520751953125, -1.2349853515625, -1.19476318359375, -1.154541015625, -1.11431884765625, -1.0740966796875, -1.03387451171875, -0.99365234375, -0.95343017578125, -0.9132080078125, -0.87298583984375, -0.832763671875, -0.79254150390625, -0.7523193359375, -0.71209716796875, -0.671875, -0.63165283203125, -0.5914306640625, -0.55120849609375, -0.510986328125, -0.47076416015625, -0.4305419921875, -0.39031982421875, -0.35009765625, -0.30987548828125, -0.2696533203125, -0.22943115234375, -0.189208984375, -0.14898681640625, -0.1087646484375, -0.06854248046875, -0.0283203125, 0.01190185546875, 0.0521240234375, 0.09234619140625, 0.132568359375, 0.17279052734375, 0.2130126953125, 0.25323486328125, 0.29345703125, 0.33367919921875, 0.3739013671875, 0.41412353515625, 0.454345703125, 0.49456787109375, 0.5347900390625, 0.57501220703125, 0.615234375, 0.65545654296875, 0.6956787109375, 0.73590087890625, 0.776123046875, 0.81634521484375, 0.8565673828125, 0.89678955078125, 0.93701171875, 0.97723388671875, 1.0174560546875, 1.05767822265625, 1.097900390625, 1.13812255859375, 1.1783447265625, 1.21856689453125, 1.2587890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 4.0, 4.0, 11.0, 18.0, 23.0, 27.0, 42.0, 73.0, 95.0, 124.0, 173.0, 230.0, 344.0, 497.0, 759.0, 1017.0, 1641.0, 2573.0, 4473.0, 8028.0, 16466.0, 41637.0, 173971.0, 644165.0, 93840.0, 29104.0, 12516.0, 6395.0, 3636.0, 2149.0, 1443.0, 918.0, 607.0, 474.0, 313.0, 210.0, 149.0, 111.0, 90.0, 51.0, 41.0, 25.0, 34.0, 11.0, 12.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.44189453125, -0.42822265625, -0.41455078125, -0.40087890625, -0.38720703125, -0.37353515625, -0.35986328125, -0.34619140625, -0.33251953125, -0.31884765625, -0.30517578125, -0.29150390625, -0.27783203125, -0.26416015625, -0.25048828125, -0.23681640625, -0.22314453125, -0.20947265625, -0.19580078125, -0.18212890625, -0.16845703125, -0.15478515625, -0.14111328125, -0.12744140625, -0.11376953125, -0.10009765625, -0.08642578125, -0.07275390625, -0.05908203125, -0.04541015625, -0.03173828125, -0.01806640625, -0.00439453125, 0.00927734375, 0.02294921875, 0.03662109375, 0.05029296875, 0.06396484375, 0.07763671875, 0.09130859375, 0.10498046875, 0.11865234375, 0.13232421875, 0.14599609375, 0.15966796875, 0.17333984375, 0.18701171875, 0.20068359375, 0.21435546875, 0.22802734375, 0.24169921875, 0.25537109375, 0.26904296875, 0.28271484375, 0.29638671875, 0.31005859375, 0.32373046875, 0.33740234375, 0.35107421875, 0.36474609375, 0.37841796875, 0.39208984375, 0.40576171875, 0.41943359375, 0.43310546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 1.0, 6.0, 1.0, 3.0, 12.0, 6.0, 10.0, 8.0, 14.0, 17.0, 28.0, 39.0, 31.0, 43.0, 69.0, 79.0, 90.0, 103.0, 81.0, 91.0, 69.0, 47.0, 28.0, 32.0, 18.0, 15.0, 12.0, 8.0, 10.0, 9.0, 8.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.7894973754882812e-05, -2.7103349566459656e-05, -2.63117253780365e-05, -2.5520101189613342e-05, -2.4728477001190186e-05, -2.393685281276703e-05, -2.3145228624343872e-05, -2.2353604435920715e-05, -2.156198024749756e-05, -2.0770356059074402e-05, -1.9978731870651245e-05, -1.918710768222809e-05, -1.839548349380493e-05, -1.7603859305381775e-05, -1.6812235116958618e-05, -1.602061092853546e-05, -1.5228986740112305e-05, -1.4437362551689148e-05, -1.3645738363265991e-05, -1.2854114174842834e-05, -1.2062489986419678e-05, -1.1270865797996521e-05, -1.0479241609573364e-05, -9.687617421150208e-06, -8.89599323272705e-06, -8.104369044303894e-06, -7.312744855880737e-06, -6.5211206674575806e-06, -5.729496479034424e-06, -4.937872290611267e-06, -4.14624810218811e-06, -3.3546239137649536e-06, -2.562999725341797e-06, -1.7713755369186401e-06, -9.797513484954834e-07, -1.8812716007232666e-07, 6.034970283508301e-07, 1.3951212167739868e-06, 2.1867454051971436e-06, 2.9783695936203003e-06, 3.769993782043457e-06, 4.561617970466614e-06, 5.3532421588897705e-06, 6.144866347312927e-06, 6.936490535736084e-06, 7.72811472415924e-06, 8.519738912582397e-06, 9.311363101005554e-06, 1.0102987289428711e-05, 1.0894611477851868e-05, 1.1686235666275024e-05, 1.2477859854698181e-05, 1.3269484043121338e-05, 1.4061108231544495e-05, 1.4852732419967651e-05, 1.5644356608390808e-05, 1.6435980796813965e-05, 1.722760498523712e-05, 1.801922917366028e-05, 1.8810853362083435e-05, 1.9602477550506592e-05, 2.039410173892975e-05, 2.1185725927352905e-05, 2.1977350115776062e-05, 2.276897430419922e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 8.0, 11.0, 7.0, 8.0, 9.0, 17.0, 26.0, 42.0, 59.0, 77.0, 115.0, 156.0, 228.0, 319.0, 438.0, 694.0, 996.0, 1540.0, 2298.0, 3825.0, 6169.0, 10870.0, 19524.0, 38698.0, 88250.0, 306167.0, 375445.0, 99542.0, 42010.0, 21210.0, 11611.0, 6761.0, 4007.0, 2516.0, 1627.0, 1015.0, 697.0, 444.0, 342.0, 223.0, 159.0, 114.0, 80.0, 45.0, 48.0, 31.0, 25.0, 18.0, 11.0, 7.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.3271484375, -0.3158912658691406, -0.30463409423828125, -0.2933769226074219, -0.2821197509765625, -0.2708625793457031, -0.25960540771484375, -0.24834823608398438, -0.237091064453125, -0.22583389282226562, -0.21457672119140625, -0.20331954956054688, -0.1920623779296875, -0.18080520629882812, -0.16954803466796875, -0.15829086303710938, -0.14703369140625, -0.13577651977539062, -0.12451934814453125, -0.11326217651367188, -0.1020050048828125, -0.09074783325195312, -0.07949066162109375, -0.06823348999023438, -0.056976318359375, -0.045719146728515625, -0.03446197509765625, -0.023204803466796875, -0.0119476318359375, -0.000690460205078125, 0.01056671142578125, 0.021823883056640625, 0.0330810546875, 0.044338226318359375, 0.05559539794921875, 0.06685256958007812, 0.0781097412109375, 0.08936691284179688, 0.10062408447265625, 0.11188125610351562, 0.123138427734375, 0.13439559936523438, 0.14565277099609375, 0.15690994262695312, 0.1681671142578125, 0.17942428588867188, 0.19068145751953125, 0.20193862915039062, 0.21319580078125, 0.22445297241210938, 0.23571014404296875, 0.24696731567382812, 0.2582244873046875, 0.2694816589355469, 0.28073883056640625, 0.2919960021972656, 0.303253173828125, 0.3145103454589844, 0.32576751708984375, 0.3370246887207031, 0.3482818603515625, 0.3595390319824219, 0.37079620361328125, 0.3820533752441406, 0.393310546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 8.0, 3.0, 5.0, 3.0, 8.0, 12.0, 11.0, 14.0, 15.0, 39.0, 29.0, 35.0, 57.0, 75.0, 98.0, 119.0, 103.0, 83.0, 74.0, 44.0, 37.0, 25.0, 18.0, 26.0, 16.0, 8.0, 7.0, 8.0, 6.0, 6.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.08958816528320312, -0.08634185791015625, -0.08309555053710938, -0.0798492431640625, -0.07660293579101562, -0.07335662841796875, -0.07011032104492188, -0.066864013671875, -0.06361770629882812, -0.06037139892578125, -0.057125091552734375, -0.0538787841796875, -0.050632476806640625, -0.04738616943359375, -0.044139862060546875, -0.0408935546875, -0.037647247314453125, -0.03440093994140625, -0.031154632568359375, -0.0279083251953125, -0.024662017822265625, -0.02141571044921875, -0.018169403076171875, -0.014923095703125, -0.011676788330078125, -0.00843048095703125, -0.005184173583984375, -0.0019378662109375, 0.001308441162109375, 0.00455474853515625, 0.007801055908203125, 0.01104736328125, 0.014293670654296875, 0.01753997802734375, 0.020786285400390625, 0.0240325927734375, 0.027278900146484375, 0.03052520751953125, 0.033771514892578125, 0.037017822265625, 0.040264129638671875, 0.04351043701171875, 0.046756744384765625, 0.0500030517578125, 0.053249359130859375, 0.05649566650390625, 0.059741973876953125, 0.06298828125, 0.06623458862304688, 0.06948089599609375, 0.07272720336914062, 0.0759735107421875, 0.07921981811523438, 0.08246612548828125, 0.08571243286132812, 0.088958740234375, 0.09220504760742188, 0.09545135498046875, 0.09869766235351562, 0.1019439697265625, 0.10519027709960938, 0.10843658447265625, 0.11168289184570312, 0.11492919921875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 12.0, 18.0, 20.0, 37.0, 63.0, 84.0, 123.0, 133.0, 144.0, 124.0, 64.0, 31.0, 40.0, 28.0, 21.0, 8.0, 10.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.878830432891846, -4.762570381164551, -4.646309852600098, -4.530049800872803, -4.41378927230835, -4.297529220581055, -4.181268692016602, -4.065008640289307, -3.9487483501434326, -3.8324880599975586, -3.7162277698516846, -3.5999674797058105, -3.4837074279785156, -3.3674468994140625, -3.2511868476867676, -3.1349265575408936, -3.0186662673950195, -2.9024059772491455, -2.7861456871032715, -2.6698853969573975, -2.5536251068115234, -2.4373650550842285, -2.3211047649383545, -2.2048444747924805, -2.0885841846466064, -1.9723238945007324, -1.8560636043548584, -1.739803433418274, -1.6235431432724, -1.5072828531265259, -1.3910226821899414, -1.2747623920440674, -1.1585018634796143, -1.0422415733337402, -0.925981342792511, -0.8097211122512817, -0.6934608221054077, -0.5772005319595337, -0.46094030141830444, -0.3446800708770752, -0.22841978073120117, -0.11215952038764954, 0.0041007399559021, 0.12036100029945374, 0.23662126064300537, 0.3528815507888794, 0.46914178133010864, 0.5854020118713379, 0.7016623020172119, 0.8179225921630859, 0.9341828227043152, 1.0504430532455444, 1.1667033433914185, 1.2829636335372925, 1.399223804473877, 1.515484094619751, 1.631744384765625, 1.748004674911499, 1.864264965057373, 1.9805251359939575, 2.096785545349121, 2.213045597076416, 2.32930588722229, 2.445566177368164, 2.561826467514038]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 13.0, 8.0, 11.0, 9.0, 7.0, 16.0, 14.0, 20.0, 34.0, 33.0, 30.0, 24.0, 36.0, 31.0, 30.0, 29.0, 35.0, 50.0, 48.0, 43.0, 30.0, 42.0, 56.0, 45.0, 34.0, 32.0, 41.0, 23.0, 19.0, 27.0, 23.0, 18.0, 12.0, 9.0, 12.0, 12.0, 6.0, 7.0, 3.0, 6.0, 8.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7791060209274292, -1.7269487380981445, -1.6747915744781494, -1.6226342916488647, -1.5704771280288696, -1.518319845199585, -1.4661626815795898, -1.4140053987503052, -1.36184823513031, -1.3096909523010254, -1.2575337886810303, -1.2053765058517456, -1.1532193422317505, -1.1010620594024658, -1.0489048957824707, -0.996747612953186, -0.9445903897285461, -0.8924331665039062, -0.8402759432792664, -0.7881187200546265, -0.7359614968299866, -0.6838042736053467, -0.631646990776062, -0.5794898271560669, -0.5273325443267822, -0.47517532110214233, -0.42301809787750244, -0.37086087465286255, -0.31870365142822266, -0.2665463984012604, -0.21438917517662048, -0.1622319519519806, -0.11007475852966309, -0.057917531579732895, -0.005760304629802704, 0.046396926045417786, 0.09855414927005768, 0.15071138739585876, 0.20286861062049866, 0.25502583384513855, 0.30718305706977844, 0.35934028029441833, 0.4114975035190582, 0.4636547565460205, 0.5158119797706604, 0.5679692029953003, 0.6201264262199402, 0.6722836494445801, 0.72444087266922, 0.7765980958938599, 0.8287553191184998, 0.8809125423431396, 0.9330697655677795, 0.9852269887924194, 1.037384271621704, 1.0895414352416992, 1.1416987180709839, 1.1938560009002686, 1.2460131645202637, 1.2981704473495483, 1.3503276109695435, 1.4024848937988281, 1.4546420574188232, 1.506799340248108, 1.558956503868103]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 1.0, 7.0, 5.0, 9.0, 26.0, 30.0, 49.0, 70.0, 112.0, 155.0, 244.0, 385.0, 607.0, 994.0, 1725.0, 2833.0, 4928.0, 8526.0, 15054.0, 26876.0, 49975.0, 96584.0, 183327.0, 266711.0, 181691.0, 95515.0, 49909.0, 26680.0, 14879.0, 8526.0, 4904.0, 2894.0, 1649.0, 953.0, 590.0, 400.0, 268.0, 152.0, 104.0, 64.0, 59.0, 25.0, 15.0, 20.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.0390625, -2.94256591796875, -2.8460693359375, -2.74957275390625, -2.653076171875, -2.55657958984375, -2.4600830078125, -2.36358642578125, -2.26708984375, -2.17059326171875, -2.0740966796875, -1.97760009765625, -1.881103515625, -1.78460693359375, -1.6881103515625, -1.59161376953125, -1.4951171875, -1.39862060546875, -1.3021240234375, -1.20562744140625, -1.109130859375, -1.01263427734375, -0.9161376953125, -0.81964111328125, -0.72314453125, -0.62664794921875, -0.5301513671875, -0.43365478515625, -0.337158203125, -0.24066162109375, -0.1441650390625, -0.04766845703125, 0.048828125, 0.14532470703125, 0.2418212890625, 0.33831787109375, 0.434814453125, 0.53131103515625, 0.6278076171875, 0.72430419921875, 0.82080078125, 0.91729736328125, 1.0137939453125, 1.11029052734375, 1.206787109375, 1.30328369140625, 1.3997802734375, 1.49627685546875, 1.5927734375, 1.68927001953125, 1.7857666015625, 1.88226318359375, 1.978759765625, 2.07525634765625, 2.1717529296875, 2.26824951171875, 2.36474609375, 2.46124267578125, 2.5577392578125, 2.65423583984375, 2.750732421875, 2.84722900390625, 2.9437255859375, 3.04022216796875, 3.13671875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 10.0, 10.0, 16.0, 23.0, 26.0, 30.0, 17.0, 25.0, 26.0, 32.0, 33.0, 36.0, 38.0, 37.0, 39.0, 35.0, 41.0, 26.0, 51.0, 46.0, 42.0, 38.0, 35.0, 27.0, 26.0, 30.0, 24.0, 25.0, 19.0, 15.0, 11.0, 6.0, 16.0, 11.0, 8.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.5498046875, -1.5045013427734375, -1.459197998046875, -1.4138946533203125, -1.36859130859375, -1.3232879638671875, -1.277984619140625, -1.2326812744140625, -1.1873779296875, -1.1420745849609375, -1.096771240234375, -1.0514678955078125, -1.00616455078125, -0.9608612060546875, -0.915557861328125, -0.8702545166015625, -0.824951171875, -0.7796478271484375, -0.734344482421875, -0.6890411376953125, -0.64373779296875, -0.5984344482421875, -0.553131103515625, -0.5078277587890625, -0.4625244140625, -0.4172210693359375, -0.371917724609375, -0.3266143798828125, -0.28131103515625, -0.2360076904296875, -0.190704345703125, -0.1454010009765625, -0.10009765625, -0.0547943115234375, -0.009490966796875, 0.0358123779296875, 0.08111572265625, 0.1264190673828125, 0.171722412109375, 0.2170257568359375, 0.2623291015625, 0.3076324462890625, 0.352935791015625, 0.3982391357421875, 0.44354248046875, 0.4888458251953125, 0.534149169921875, 0.5794525146484375, 0.624755859375, 0.6700592041015625, 0.715362548828125, 0.7606658935546875, 0.80596923828125, 0.8512725830078125, 0.896575927734375, 0.9418792724609375, 0.9871826171875, 1.0324859619140625, 1.077789306640625, 1.1230926513671875, 1.16839599609375, 1.2136993408203125, 1.259002685546875, 1.3043060302734375, 1.349609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 16.0, 27.0, 31.0, 57.0, 66.0, 102.0, 173.0, 265.0, 389.0, 707.0, 1180.0, 2021.0, 3995.0, 7653.0, 15221.0, 30994.0, 64123.0, 135050.0, 281210.0, 263826.0, 124203.0, 59120.0, 28379.0, 14009.0, 7159.0, 3758.0, 2001.0, 1098.0, 629.0, 378.0, 224.0, 152.0, 101.0, 58.0, 52.0, 42.0, 22.0, 14.0, 13.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40625, -3.29962158203125, -3.1929931640625, -3.08636474609375, -2.979736328125, -2.87310791015625, -2.7664794921875, -2.65985107421875, -2.55322265625, -2.44659423828125, -2.3399658203125, -2.23333740234375, -2.126708984375, -2.02008056640625, -1.9134521484375, -1.80682373046875, -1.7001953125, -1.59356689453125, -1.4869384765625, -1.38031005859375, -1.273681640625, -1.16705322265625, -1.0604248046875, -0.95379638671875, -0.84716796875, -0.74053955078125, -0.6339111328125, -0.52728271484375, -0.420654296875, -0.31402587890625, -0.2073974609375, -0.10076904296875, 0.005859375, 0.11248779296875, 0.2191162109375, 0.32574462890625, 0.432373046875, 0.53900146484375, 0.6456298828125, 0.75225830078125, 0.85888671875, 0.96551513671875, 1.0721435546875, 1.17877197265625, 1.285400390625, 1.39202880859375, 1.4986572265625, 1.60528564453125, 1.7119140625, 1.81854248046875, 1.9251708984375, 2.03179931640625, 2.138427734375, 2.24505615234375, 2.3516845703125, 2.45831298828125, 2.56494140625, 2.67156982421875, 2.7781982421875, 2.88482666015625, 2.991455078125, 3.09808349609375, 3.2047119140625, 3.31134033203125, 3.41796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 8.0, 6.0, 12.0, 12.0, 13.0, 18.0, 27.0, 14.0, 15.0, 22.0, 31.0, 23.0, 31.0, 37.0, 26.0, 34.0, 38.0, 46.0, 32.0, 42.0, 43.0, 51.0, 35.0, 33.0, 39.0, 36.0, 29.0, 22.0, 32.0, 28.0, 18.0, 19.0, 16.0, 15.0, 10.0, 10.0, 13.0, 12.0, 5.0, 11.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7533187866210938, -0.7239227294921875, -0.6945266723632812, -0.665130615234375, -0.6357345581054688, -0.6063385009765625, -0.5769424438476562, -0.54754638671875, -0.5181503295898438, -0.4887542724609375, -0.45935821533203125, -0.429962158203125, -0.40056610107421875, -0.3711700439453125, -0.34177398681640625, -0.3123779296875, -0.28298187255859375, -0.2535858154296875, -0.22418975830078125, -0.194793701171875, -0.16539764404296875, -0.1360015869140625, -0.10660552978515625, -0.07720947265625, -0.04781341552734375, -0.0184173583984375, 0.01097869873046875, 0.040374755859375, 0.06977081298828125, 0.0991668701171875, 0.12856292724609375, 0.157958984375, 0.18735504150390625, 0.2167510986328125, 0.24614715576171875, 0.275543212890625, 0.30493927001953125, 0.3343353271484375, 0.36373138427734375, 0.39312744140625, 0.42252349853515625, 0.4519195556640625, 0.48131561279296875, 0.510711669921875, 0.5401077270507812, 0.5695037841796875, 0.5988998413085938, 0.6282958984375, 0.6576919555664062, 0.6870880126953125, 0.7164840698242188, 0.745880126953125, 0.7752761840820312, 0.8046722412109375, 0.8340682983398438, 0.86346435546875, 0.8928604125976562, 0.9222564697265625, 0.9516525268554688, 0.981048583984375, 1.0104446411132812, 1.0398406982421875, 1.0692367553710938, 1.0986328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 3.0, 5.0, 11.0, 6.0, 22.0, 26.0, 37.0, 35.0, 76.0, 118.0, 175.0, 270.0, 425.0, 724.0, 1250.0, 2347.0, 4629.0, 9614.0, 23002.0, 76211.0, 686442.0, 177519.0, 37922.0, 14067.0, 6295.0, 3131.0, 1781.0, 938.0, 534.0, 296.0, 205.0, 143.0, 85.0, 57.0, 63.0, 22.0, 18.0, 17.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.9378662109375, -3.805419921875, -3.6729736328125, -3.54052734375, -3.4080810546875, -3.275634765625, -3.1431884765625, -3.0107421875, -2.8782958984375, -2.745849609375, -2.6134033203125, -2.48095703125, -2.3485107421875, -2.216064453125, -2.0836181640625, -1.951171875, -1.8187255859375, -1.686279296875, -1.5538330078125, -1.42138671875, -1.2889404296875, -1.156494140625, -1.0240478515625, -0.8916015625, -0.7591552734375, -0.626708984375, -0.4942626953125, -0.36181640625, -0.2293701171875, -0.096923828125, 0.0355224609375, 0.16796875, 0.3004150390625, 0.432861328125, 0.5653076171875, 0.69775390625, 0.8302001953125, 0.962646484375, 1.0950927734375, 1.2275390625, 1.3599853515625, 1.492431640625, 1.6248779296875, 1.75732421875, 1.8897705078125, 2.022216796875, 2.1546630859375, 2.287109375, 2.4195556640625, 2.552001953125, 2.6844482421875, 2.81689453125, 2.9493408203125, 3.081787109375, 3.2142333984375, 3.3466796875, 3.4791259765625, 3.611572265625, 3.7440185546875, 3.87646484375, 4.0089111328125, 4.141357421875, 4.2738037109375, 4.40625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 10.0, 4.0, 9.0, 13.0, 24.0, 43.0, 72.0, 114.0, 185.0, 224.0, 116.0, 74.0, 28.0, 21.0, 19.0, 10.0, 8.0, 7.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-05, -8.894316852092743e-05, -8.490309119224548e-05, -8.086301386356354e-05, -7.682293653488159e-05, -7.278285920619965e-05, -6.87427818775177e-05, -6.470270454883575e-05, -6.066262722015381e-05, -5.662254989147186e-05, -5.258247256278992e-05, -4.854239523410797e-05, -4.4502317905426025e-05, -4.046224057674408e-05, -3.6422163248062134e-05, -3.238208591938019e-05, -2.8342008590698242e-05, -2.4301931262016296e-05, -2.026185393333435e-05, -1.6221776604652405e-05, -1.2181699275970459e-05, -8.141621947288513e-06, -4.101544618606567e-06, -6.146728992462158e-08, 3.978610038757324e-06, 8.01868736743927e-06, 1.2058764696121216e-05, 1.609884202480316e-05, 2.0138919353485107e-05, 2.4178996682167053e-05, 2.8219074010849e-05, 3.2259151339530945e-05, 3.629922866821289e-05, 4.0339305996894836e-05, 4.437938332557678e-05, 4.841946065425873e-05, 5.2459537982940674e-05, 5.649961531162262e-05, 6.0539692640304565e-05, 6.457976996898651e-05, 6.861984729766846e-05, 7.26599246263504e-05, 7.670000195503235e-05, 8.07400792837143e-05, 8.478015661239624e-05, 8.882023394107819e-05, 9.286031126976013e-05, 9.690038859844208e-05, 0.00010094046592712402, 0.00010498054325580597, 0.00010902062058448792, 0.00011306069791316986, 0.0001171007752418518, 0.00012114085257053375, 0.0001251809298992157, 0.00012922100722789764, 0.0001332610845565796, 0.00013730116188526154, 0.00014134123921394348, 0.00014538131654262543, 0.00014942139387130737, 0.00015346147119998932, 0.00015750154852867126, 0.0001615416258573532, 0.00016558170318603516]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 12.0, 17.0, 36.0, 36.0, 46.0, 90.0, 127.0, 162.0, 258.0, 394.0, 633.0, 1064.0, 1786.0, 3401.0, 6783.0, 15688.0, 47846.0, 536597.0, 359615.0, 44559.0, 15034.0, 6506.0, 3265.0, 1731.0, 1020.0, 641.0, 413.0, 240.0, 160.0, 107.0, 72.0, 63.0, 42.0, 21.0, 22.0, 19.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.514404296875, -4.36865234375, -4.222900390625, -4.0771484375, -3.931396484375, -3.78564453125, -3.639892578125, -3.494140625, -3.348388671875, -3.20263671875, -3.056884765625, -2.9111328125, -2.765380859375, -2.61962890625, -2.473876953125, -2.328125, -2.182373046875, -2.03662109375, -1.890869140625, -1.7451171875, -1.599365234375, -1.45361328125, -1.307861328125, -1.162109375, -1.016357421875, -0.87060546875, -0.724853515625, -0.5791015625, -0.433349609375, -0.28759765625, -0.141845703125, 0.00390625, 0.149658203125, 0.29541015625, 0.441162109375, 0.5869140625, 0.732666015625, 0.87841796875, 1.024169921875, 1.169921875, 1.315673828125, 1.46142578125, 1.607177734375, 1.7529296875, 1.898681640625, 2.04443359375, 2.190185546875, 2.3359375, 2.481689453125, 2.62744140625, 2.773193359375, 2.9189453125, 3.064697265625, 3.21044921875, 3.356201171875, 3.501953125, 3.647705078125, 3.79345703125, 3.939208984375, 4.0849609375, 4.230712890625, 4.37646484375, 4.522216796875, 4.66796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 14.0, 19.0, 18.0, 35.0, 35.0, 69.0, 105.0, 233.0, 159.0, 91.0, 56.0, 35.0, 30.0, 18.0, 14.0, 11.0, 6.0, 4.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.06219482421875, -1.0277099609375, -0.99322509765625, -0.958740234375, -0.92425537109375, -0.8897705078125, -0.85528564453125, -0.82080078125, -0.78631591796875, -0.7518310546875, -0.71734619140625, -0.682861328125, -0.64837646484375, -0.6138916015625, -0.57940673828125, -0.544921875, -0.51043701171875, -0.4759521484375, -0.44146728515625, -0.406982421875, -0.37249755859375, -0.3380126953125, -0.30352783203125, -0.26904296875, -0.23455810546875, -0.2000732421875, -0.16558837890625, -0.131103515625, -0.09661865234375, -0.0621337890625, -0.02764892578125, 0.0068359375, 0.04132080078125, 0.0758056640625, 0.11029052734375, 0.144775390625, 0.17926025390625, 0.2137451171875, 0.24822998046875, 0.28271484375, 0.31719970703125, 0.3516845703125, 0.38616943359375, 0.420654296875, 0.45513916015625, 0.4896240234375, 0.52410888671875, 0.55859375, 0.59307861328125, 0.6275634765625, 0.66204833984375, 0.696533203125, 0.73101806640625, 0.7655029296875, 0.79998779296875, 0.83447265625, 0.86895751953125, 0.9034423828125, 0.93792724609375, 0.972412109375, 1.00689697265625, 1.0413818359375, 1.07586669921875, 1.1103515625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 9.0, 10.0, 15.0, 24.0, 40.0, 69.0, 65.0, 104.0, 140.0, 116.0, 118.0, 58.0, 49.0, 28.0, 29.0, 24.0, 21.0, 21.0, 13.0, 11.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3150670528411865, -2.224872589111328, -2.134678363800049, -2.0444841384887695, -1.9542896747589111, -1.8640953302383423, -1.7739009857177734, -1.6837066411972046, -1.5935122966766357, -1.503317952156067, -1.413123607635498, -1.3229292631149292, -1.2327349185943604, -1.1425405740737915, -1.0523462295532227, -0.9621518850326538, -0.871957540512085, -0.7817631959915161, -0.6915688514709473, -0.6013745069503784, -0.5111801624298096, -0.4209858179092407, -0.3307914733886719, -0.24059712886810303, -0.15040278434753418, -0.06020843982696533, 0.029985904693603516, 0.12018024921417236, 0.2103745937347412, 0.30056893825531006, 0.3907632827758789, 0.48095762729644775, 0.5711519718170166, 0.6613463163375854, 0.7515406608581543, 0.8417350053787231, 0.931929349899292, 1.0221236944198608, 1.1123180389404297, 1.2025123834609985, 1.2927067279815674, 1.3829010725021362, 1.473095417022705, 1.563289761543274, 1.6534841060638428, 1.7436784505844116, 1.8338727951049805, 1.9240671396255493, 2.014261484146118, 2.1044559478759766, 2.194650173187256, 2.284844398498535, 2.3750388622283936, 2.465233325958252, 2.5554275512695312, 2.6456217765808105, 2.735816240310669, 2.8260107040405273, 2.9162049293518066, 3.006399154663086, 3.0965936183929443, 3.1867880821228027, 3.276982307434082, 3.3671765327453613, 3.4573709964752197]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 10.0, 10.0, 2.0, 16.0, 15.0, 17.0, 22.0, 36.0, 26.0, 31.0, 27.0, 41.0, 41.0, 46.0, 63.0, 47.0, 44.0, 34.0, 53.0, 36.0, 32.0, 45.0, 38.0, 47.0, 36.0, 29.0, 29.0, 12.0, 21.0, 23.0, 22.0, 12.0, 10.0, 5.0, 3.0, 6.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7765657901763916, -1.7177287340164185, -1.6588915586471558, -1.6000545024871826, -1.5412174463272095, -1.4823803901672363, -1.4235432147979736, -1.3647061586380005, -1.3058691024780273, -1.2470320463180542, -1.1881948709487915, -1.1293578147888184, -1.0705207586288452, -1.011683702468872, -0.9528465270996094, -0.8940094709396362, -0.8351722955703735, -0.7763351798057556, -0.7174981236457825, -0.6586610078811646, -0.5998239517211914, -0.5409868359565735, -0.48214972019195557, -0.42331263422966003, -0.3644755482673645, -0.30563846230506897, -0.24680136144161224, -0.18796426057815552, -0.12912717461585999, -0.07029008865356445, -0.011452972888946533, 0.047384113073349, 0.10622119903564453, 0.16505828499794006, 0.2238953858613968, 0.2827324867248535, 0.34156957268714905, 0.4004066586494446, 0.4592437744140625, 0.5180808305740356, 0.5769179463386536, 0.6357550621032715, 0.6945921182632446, 0.7534292340278625, 0.8122663497924805, 0.8711034059524536, 0.9299405217170715, 0.9887776374816895, 1.0476146936416626, 1.1064517498016357, 1.1652889251708984, 1.2241259813308716, 1.2829630374908447, 1.3418002128601074, 1.4006372690200806, 1.4594743251800537, 1.5183115005493164, 1.5771485567092896, 1.6359857320785522, 1.6948227882385254, 1.7536598443984985, 1.8124969005584717, 1.8713340759277344, 1.9301711320877075, 1.9890081882476807]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 24.0, 20.0, 35.0, 43.0, 66.0, 80.0, 137.0, 159.0, 258.0, 349.0, 480.0, 708.0, 1029.0, 1447.0, 2184.0, 3265.0, 4768.0, 7355.0, 11619.0, 18579.0, 31298.0, 54297.0, 101123.0, 212807.0, 605897.0, 1699719.0, 868172.0, 277942.0, 124215.0, 65780.0, 37662.0, 22165.0, 13866.0, 8837.0, 5629.0, 3728.0, 2621.0, 1725.0, 1258.0, 874.0, 588.0, 421.0, 317.0, 217.0, 148.0, 96.0, 87.0, 60.0, 36.0, 27.0, 18.0, 17.0, 7.0, 8.0, 4.0, 1.0, 2.0], "bins": [-2.22265625, -2.154571533203125, -2.08648681640625, -2.018402099609375, -1.9503173828125, -1.882232666015625, -1.81414794921875, -1.746063232421875, -1.677978515625, -1.609893798828125, -1.54180908203125, -1.473724365234375, -1.4056396484375, -1.337554931640625, -1.26947021484375, -1.201385498046875, -1.13330078125, -1.065216064453125, -0.99713134765625, -0.929046630859375, -0.8609619140625, -0.792877197265625, -0.72479248046875, -0.656707763671875, -0.588623046875, -0.520538330078125, -0.45245361328125, -0.384368896484375, -0.3162841796875, -0.248199462890625, -0.18011474609375, -0.112030029296875, -0.0439453125, 0.024139404296875, 0.09222412109375, 0.160308837890625, 0.2283935546875, 0.296478271484375, 0.36456298828125, 0.432647705078125, 0.500732421875, 0.568817138671875, 0.63690185546875, 0.704986572265625, 0.7730712890625, 0.841156005859375, 0.90924072265625, 0.977325439453125, 1.04541015625, 1.113494873046875, 1.18157958984375, 1.249664306640625, 1.3177490234375, 1.385833740234375, 1.45391845703125, 1.522003173828125, 1.590087890625, 1.658172607421875, 1.72625732421875, 1.794342041015625, 1.8624267578125, 1.930511474609375, 1.99859619140625, 2.066680908203125, 2.134765625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 8.0, 9.0, 14.0, 16.0, 26.0, 25.0, 26.0, 27.0, 41.0, 40.0, 32.0, 49.0, 51.0, 48.0, 55.0, 50.0, 44.0, 55.0, 33.0, 42.0, 43.0, 38.0, 38.0, 22.0, 34.0, 21.0, 19.0, 16.0, 18.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.13671875, -1.0979766845703125, -1.059234619140625, -1.0204925537109375, -0.98175048828125, -0.9430084228515625, -0.904266357421875, -0.8655242919921875, -0.8267822265625, -0.7880401611328125, -0.749298095703125, -0.7105560302734375, -0.67181396484375, -0.6330718994140625, -0.594329833984375, -0.5555877685546875, -0.516845703125, -0.4781036376953125, -0.439361572265625, -0.4006195068359375, -0.36187744140625, -0.3231353759765625, -0.284393310546875, -0.2456512451171875, -0.2069091796875, -0.1681671142578125, -0.129425048828125, -0.0906829833984375, -0.05194091796875, -0.0131988525390625, 0.025543212890625, 0.0642852783203125, 0.10302734375, 0.1417694091796875, 0.180511474609375, 0.2192535400390625, 0.25799560546875, 0.2967376708984375, 0.335479736328125, 0.3742218017578125, 0.4129638671875, 0.4517059326171875, 0.490447998046875, 0.5291900634765625, 0.56793212890625, 0.6066741943359375, 0.645416259765625, 0.6841583251953125, 0.722900390625, 0.7616424560546875, 0.800384521484375, 0.8391265869140625, 0.87786865234375, 0.9166107177734375, 0.955352783203125, 0.9940948486328125, 1.0328369140625, 1.0715789794921875, 1.110321044921875, 1.1490631103515625, 1.18780517578125, 1.2265472412109375, 1.265289306640625, 1.3040313720703125, 1.3427734375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 12.0, 25.0, 17.0, 17.0, 46.0, 65.0, 117.0, 162.0, 251.0, 337.0, 578.0, 927.0, 1386.0, 2280.0, 3659.0, 5988.0, 9990.0, 17630.0, 31684.0, 61906.0, 129096.0, 298136.0, 848524.0, 1716353.0, 614133.0, 232143.0, 103846.0, 50775.0, 26718.0, 15022.0, 8732.0, 5195.0, 3181.0, 1829.0, 1255.0, 794.0, 495.0, 338.0, 235.0, 129.0, 75.0, 69.0, 48.0, 28.0, 27.0, 7.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.19921875, -2.131256103515625, -2.06329345703125, -1.995330810546875, -1.9273681640625, -1.859405517578125, -1.79144287109375, -1.723480224609375, -1.655517578125, -1.587554931640625, -1.51959228515625, -1.451629638671875, -1.3836669921875, -1.315704345703125, -1.24774169921875, -1.179779052734375, -1.11181640625, -1.043853759765625, -0.97589111328125, -0.907928466796875, -0.8399658203125, -0.772003173828125, -0.70404052734375, -0.636077880859375, -0.568115234375, -0.500152587890625, -0.43218994140625, -0.364227294921875, -0.2962646484375, -0.228302001953125, -0.16033935546875, -0.092376708984375, -0.0244140625, 0.043548583984375, 0.11151123046875, 0.179473876953125, 0.2474365234375, 0.315399169921875, 0.38336181640625, 0.451324462890625, 0.519287109375, 0.587249755859375, 0.65521240234375, 0.723175048828125, 0.7911376953125, 0.859100341796875, 0.92706298828125, 0.995025634765625, 1.06298828125, 1.130950927734375, 1.19891357421875, 1.266876220703125, 1.3348388671875, 1.402801513671875, 1.47076416015625, 1.538726806640625, 1.606689453125, 1.674652099609375, 1.74261474609375, 1.810577392578125, 1.8785400390625, 1.946502685546875, 2.01446533203125, 2.082427978515625, 2.150390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 10.0, 10.0, 13.0, 10.0, 12.0, 22.0, 21.0, 37.0, 37.0, 46.0, 67.0, 88.0, 79.0, 118.0, 163.0, 182.0, 179.0, 220.0, 252.0, 292.0, 292.0, 285.0, 269.0, 239.0, 198.0, 182.0, 151.0, 127.0, 119.0, 75.0, 57.0, 40.0, 39.0, 25.0, 21.0, 21.0, 8.0, 19.0, 10.0, 10.0, 4.0, 4.0, 12.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6044921875, -0.58612060546875, -0.5677490234375, -0.54937744140625, -0.531005859375, -0.51263427734375, -0.4942626953125, -0.47589111328125, -0.45751953125, -0.43914794921875, -0.4207763671875, -0.40240478515625, -0.384033203125, -0.36566162109375, -0.3472900390625, -0.32891845703125, -0.310546875, -0.29217529296875, -0.2738037109375, -0.25543212890625, -0.237060546875, -0.21868896484375, -0.2003173828125, -0.18194580078125, -0.16357421875, -0.14520263671875, -0.1268310546875, -0.10845947265625, -0.090087890625, -0.07171630859375, -0.0533447265625, -0.03497314453125, -0.0166015625, 0.00177001953125, 0.0201416015625, 0.03851318359375, 0.056884765625, 0.07525634765625, 0.0936279296875, 0.11199951171875, 0.13037109375, 0.14874267578125, 0.1671142578125, 0.18548583984375, 0.203857421875, 0.22222900390625, 0.2406005859375, 0.25897216796875, 0.27734375, 0.29571533203125, 0.3140869140625, 0.33245849609375, 0.350830078125, 0.36920166015625, 0.3875732421875, 0.40594482421875, 0.42431640625, 0.44268798828125, 0.4610595703125, 0.47943115234375, 0.497802734375, 0.51617431640625, 0.5345458984375, 0.55291748046875, 0.5712890625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 5.0, 3.0, 10.0, 9.0, 13.0, 15.0, 28.0, 31.0, 37.0, 84.0, 86.0, 127.0, 143.0, 109.0, 68.0, 56.0, 48.0, 35.0, 22.0, 15.0, 15.0, 12.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5276777744293213, -2.4601409435272217, -2.392603874206543, -2.3250670433044434, -2.2575302124023438, -2.189993143081665, -2.1224563121795654, -2.0549192428588867, -1.987382411956787, -1.919845461845398, -1.8523085117340088, -1.7847716808319092, -1.71723473072052, -1.6496977806091309, -1.5821609497070312, -1.514623999595642, -1.447087049484253, -1.3795500993728638, -1.3120131492614746, -1.244476318359375, -1.1769393682479858, -1.1094024181365967, -1.041865587234497, -0.9743286371231079, -0.9067916870117188, -0.8392547369003296, -0.7717178463935852, -0.7041809558868408, -0.6366440057754517, -0.5691070556640625, -0.5015701651573181, -0.43403324484825134, -0.36649632453918457, -0.2989594042301178, -0.23142248392105103, -0.16388556361198425, -0.09634864330291748, -0.028811722993850708, 0.038725197315216064, 0.10626211762428284, 0.1737990379333496, 0.24133595824241638, 0.30887287855148315, 0.3764097988605499, 0.4439467191696167, 0.5114836692810059, 0.5790205597877502, 0.6465574502944946, 0.7140944004058838, 0.781631350517273, 0.8491682410240173, 0.9167051315307617, 0.9842420816421509, 1.05177903175354, 1.1193158626556396, 1.1868528127670288, 1.254389762878418, 1.3219267129898071, 1.3894636631011963, 1.457000494003296, 1.524537444114685, 1.5920743942260742, 1.6596112251281738, 1.727148175239563, 1.7946851253509521]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 10.0, 4.0, 12.0, 5.0, 16.0, 18.0, 17.0, 28.0, 20.0, 37.0, 28.0, 31.0, 37.0, 37.0, 30.0, 38.0, 41.0, 39.0, 37.0, 45.0, 49.0, 41.0, 40.0, 54.0, 33.0, 35.0, 27.0, 24.0, 29.0, 22.0, 22.0, 16.0, 13.0, 11.0, 11.0, 9.0, 10.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1917500495910645, -1.1529874801635742, -1.114224910736084, -1.0754623413085938, -1.036699652671814, -0.9979370832443237, -0.9591745138168335, -0.9204119443893433, -0.881649374961853, -0.8428868055343628, -0.8041241765022278, -0.7653616070747375, -0.7265990376472473, -0.6878364086151123, -0.6490738391876221, -0.6103112697601318, -0.5715486407279968, -0.5327860713005066, -0.49402347207069397, -0.45526087284088135, -0.4164983034133911, -0.3777357041835785, -0.33897310495376587, -0.30021053552627563, -0.261447936296463, -0.22268535196781158, -0.18392276763916016, -0.14516016840934753, -0.1063975840806961, -0.06763499975204468, -0.028872400522232056, 0.009890168905258179, 0.0486527681350708, 0.08741535246372223, 0.12617793679237366, 0.16494053602218628, 0.2037031203508377, 0.24246570467948914, 0.28122830390930176, 0.319990873336792, 0.3587534725666046, 0.39751607179641724, 0.43627864122390747, 0.4750412404537201, 0.5138038396835327, 0.552566409111023, 0.5913289785385132, 0.6300915479660034, 0.6688541769981384, 0.7076167464256287, 0.7463793754577637, 0.7851419448852539, 0.8239045143127441, 0.8626670837402344, 0.9014297127723694, 0.9401922821998596, 0.9789549112319946, 1.0177174806594849, 1.056480050086975, 1.0952427387237549, 1.1340053081512451, 1.1727678775787354, 1.2115304470062256, 1.2502930164337158, 1.289055585861206]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 8.0, 13.0, 12.0, 15.0, 33.0, 33.0, 56.0, 61.0, 83.0, 137.0, 199.0, 251.0, 371.0, 521.0, 794.0, 1133.0, 1664.0, 2431.0, 3629.0, 5737.0, 9051.0, 14898.0, 26272.0, 50101.0, 106052.0, 292051.0, 303335.0, 109712.0, 51104.0, 26929.0, 15180.0, 9283.0, 5807.0, 3666.0, 2453.0, 1679.0, 1170.0, 797.0, 543.0, 357.0, 276.0, 180.0, 149.0, 104.0, 64.0, 50.0, 43.0, 19.0, 23.0, 12.0, 11.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.86083984375, -0.833953857421875, -0.80706787109375, -0.780181884765625, -0.7532958984375, -0.726409912109375, -0.69952392578125, -0.672637939453125, -0.645751953125, -0.618865966796875, -0.59197998046875, -0.565093994140625, -0.5382080078125, -0.511322021484375, -0.48443603515625, -0.457550048828125, -0.4306640625, -0.403778076171875, -0.37689208984375, -0.350006103515625, -0.3231201171875, -0.296234130859375, -0.26934814453125, -0.242462158203125, -0.215576171875, -0.188690185546875, -0.16180419921875, -0.134918212890625, -0.1080322265625, -0.081146240234375, -0.05426025390625, -0.027374267578125, -0.00048828125, 0.026397705078125, 0.05328369140625, 0.080169677734375, 0.1070556640625, 0.133941650390625, 0.16082763671875, 0.187713623046875, 0.214599609375, 0.241485595703125, 0.26837158203125, 0.295257568359375, 0.3221435546875, 0.349029541015625, 0.37591552734375, 0.402801513671875, 0.4296875, 0.456573486328125, 0.48345947265625, 0.510345458984375, 0.5372314453125, 0.564117431640625, 0.59100341796875, 0.617889404296875, 0.644775390625, 0.671661376953125, 0.69854736328125, 0.725433349609375, 0.7523193359375, 0.779205322265625, 0.80609130859375, 0.832977294921875, 0.85986328125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 9.0, 15.0, 19.0, 21.0, 32.0, 20.0, 35.0, 26.0, 35.0, 34.0, 38.0, 36.0, 36.0, 42.0, 41.0, 37.0, 32.0, 40.0, 47.0, 56.0, 54.0, 32.0, 30.0, 28.0, 20.0, 15.0, 33.0, 21.0, 9.0, 15.0, 15.0, 9.0, 9.0, 5.0, 10.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2783203125, -1.2391815185546875, -1.200042724609375, -1.1609039306640625, -1.12176513671875, -1.0826263427734375, -1.043487548828125, -1.0043487548828125, -0.9652099609375, -0.9260711669921875, -0.886932373046875, -0.8477935791015625, -0.80865478515625, -0.7695159912109375, -0.730377197265625, -0.6912384033203125, -0.652099609375, -0.6129608154296875, -0.573822021484375, -0.5346832275390625, -0.49554443359375, -0.4564056396484375, -0.417266845703125, -0.3781280517578125, -0.3389892578125, -0.2998504638671875, -0.260711669921875, -0.2215728759765625, -0.18243408203125, -0.1432952880859375, -0.104156494140625, -0.0650177001953125, -0.02587890625, 0.0132598876953125, 0.052398681640625, 0.0915374755859375, 0.13067626953125, 0.1698150634765625, 0.208953857421875, 0.2480926513671875, 0.2872314453125, 0.3263702392578125, 0.365509033203125, 0.4046478271484375, 0.44378662109375, 0.4829254150390625, 0.522064208984375, 0.5612030029296875, 0.600341796875, 0.6394805908203125, 0.678619384765625, 0.7177581787109375, 0.75689697265625, 0.7960357666015625, 0.835174560546875, 0.8743133544921875, 0.9134521484375, 0.9525909423828125, 0.991729736328125, 1.0308685302734375, 1.07000732421875, 1.1091461181640625, 1.148284912109375, 1.1874237060546875, 1.2265625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 10.0, 13.0, 9.0, 16.0, 32.0, 27.0, 46.0, 51.0, 86.0, 132.0, 138.0, 198.0, 293.0, 376.0, 504.0, 721.0, 1030.0, 1518.0, 2237.0, 3570.0, 5624.0, 9783.0, 19005.0, 49854.0, 360736.0, 486960.0, 56983.0, 20651.0, 10572.0, 6021.0, 3669.0, 2383.0, 1542.0, 1085.0, 744.0, 508.0, 365.0, 283.0, 201.0, 157.0, 122.0, 81.0, 61.0, 45.0, 31.0, 27.0, 14.0, 11.0, 10.0, 13.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.3671875, -1.3258209228515625, -1.284454345703125, -1.2430877685546875, -1.20172119140625, -1.1603546142578125, -1.118988037109375, -1.0776214599609375, -1.0362548828125, -0.9948883056640625, -0.953521728515625, -0.9121551513671875, -0.87078857421875, -0.8294219970703125, -0.788055419921875, -0.7466888427734375, -0.705322265625, -0.6639556884765625, -0.622589111328125, -0.5812225341796875, -0.53985595703125, -0.4984893798828125, -0.457122802734375, -0.4157562255859375, -0.3743896484375, -0.3330230712890625, -0.291656494140625, -0.2502899169921875, -0.20892333984375, -0.1675567626953125, -0.126190185546875, -0.0848236083984375, -0.04345703125, -0.0020904541015625, 0.039276123046875, 0.0806427001953125, 0.12200927734375, 0.1633758544921875, 0.204742431640625, 0.2461090087890625, 0.2874755859375, 0.3288421630859375, 0.370208740234375, 0.4115753173828125, 0.45294189453125, 0.4943084716796875, 0.535675048828125, 0.5770416259765625, 0.618408203125, 0.6597747802734375, 0.701141357421875, 0.7425079345703125, 0.78387451171875, 0.8252410888671875, 0.866607666015625, 0.9079742431640625, 0.9493408203125, 0.9907073974609375, 1.032073974609375, 1.0734405517578125, 1.11480712890625, 1.1561737060546875, 1.197540283203125, 1.2389068603515625, 1.2802734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 6.0, 11.0, 12.0, 11.0, 17.0, 15.0, 17.0, 17.0, 21.0, 26.0, 35.0, 25.0, 34.0, 40.0, 40.0, 34.0, 47.0, 50.0, 48.0, 52.0, 36.0, 47.0, 39.0, 44.0, 35.0, 27.0, 38.0, 26.0, 25.0, 22.0, 19.0, 11.0, 15.0, 16.0, 5.0, 9.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8162841796875, -0.789306640625, -0.7623291015625, -0.7353515625, -0.7083740234375, -0.681396484375, -0.6544189453125, -0.62744140625, -0.6004638671875, -0.573486328125, -0.5465087890625, -0.51953125, -0.4925537109375, -0.465576171875, -0.4385986328125, -0.41162109375, -0.3846435546875, -0.357666015625, -0.3306884765625, -0.3037109375, -0.2767333984375, -0.249755859375, -0.2227783203125, -0.19580078125, -0.1688232421875, -0.141845703125, -0.1148681640625, -0.087890625, -0.0609130859375, -0.033935546875, -0.0069580078125, 0.02001953125, 0.0469970703125, 0.073974609375, 0.1009521484375, 0.1279296875, 0.1549072265625, 0.181884765625, 0.2088623046875, 0.23583984375, 0.2628173828125, 0.289794921875, 0.3167724609375, 0.34375, 0.3707275390625, 0.397705078125, 0.4246826171875, 0.45166015625, 0.4786376953125, 0.505615234375, 0.5325927734375, 0.5595703125, 0.5865478515625, 0.613525390625, 0.6405029296875, 0.66748046875, 0.6944580078125, 0.721435546875, 0.7484130859375, 0.775390625, 0.8023681640625, 0.829345703125, 0.8563232421875, 0.88330078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 12.0, 9.0, 22.0, 24.0, 24.0, 25.0, 49.0, 68.0, 69.0, 105.0, 126.0, 161.0, 212.0, 265.0, 414.0, 647.0, 961.0, 1503.0, 2651.0, 4801.0, 9487.0, 23553.0, 86463.0, 696818.0, 159159.0, 33951.0, 12296.0, 5824.0, 3222.0, 1843.0, 1168.0, 754.0, 527.0, 334.0, 239.0, 173.0, 127.0, 115.0, 73.0, 72.0, 57.0, 32.0, 20.0, 25.0, 20.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34716796875, -0.335845947265625, -0.32452392578125, -0.313201904296875, -0.3018798828125, -0.290557861328125, -0.27923583984375, -0.267913818359375, -0.256591796875, -0.245269775390625, -0.23394775390625, -0.222625732421875, -0.2113037109375, -0.199981689453125, -0.18865966796875, -0.177337646484375, -0.166015625, -0.154693603515625, -0.14337158203125, -0.132049560546875, -0.1207275390625, -0.109405517578125, -0.09808349609375, -0.086761474609375, -0.075439453125, -0.064117431640625, -0.05279541015625, -0.041473388671875, -0.0301513671875, -0.018829345703125, -0.00750732421875, 0.003814697265625, 0.01513671875, 0.026458740234375, 0.03778076171875, 0.049102783203125, 0.0604248046875, 0.071746826171875, 0.08306884765625, 0.094390869140625, 0.105712890625, 0.117034912109375, 0.12835693359375, 0.139678955078125, 0.1510009765625, 0.162322998046875, 0.17364501953125, 0.184967041015625, 0.1962890625, 0.207611083984375, 0.21893310546875, 0.230255126953125, 0.2415771484375, 0.252899169921875, 0.26422119140625, 0.275543212890625, 0.286865234375, 0.298187255859375, 0.30950927734375, 0.320831298828125, 0.3321533203125, 0.343475341796875, 0.35479736328125, 0.366119384765625, 0.37744140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 5.0, 17.0, 10.0, 18.0, 35.0, 43.0, 41.0, 57.0, 97.0, 123.0, 117.0, 112.0, 79.0, 57.0, 51.0, 22.0, 23.0, 15.0, 19.0, 11.0, 8.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.792237162590027e-05, -1.7426908016204834e-05, -1.69314444065094e-05, -1.6435980796813965e-05, -1.594051718711853e-05, -1.5445053577423096e-05, -1.4949589967727661e-05, -1.4454126358032227e-05, -1.3958662748336792e-05, -1.3463199138641357e-05, -1.2967735528945923e-05, -1.2472271919250488e-05, -1.1976808309555054e-05, -1.1481344699859619e-05, -1.0985881090164185e-05, -1.049041748046875e-05, -9.994953870773315e-06, -9.499490261077881e-06, -9.004026651382446e-06, -8.508563041687012e-06, -8.013099431991577e-06, -7.517635822296143e-06, -7.022172212600708e-06, -6.5267086029052734e-06, -6.031244993209839e-06, -5.535781383514404e-06, -5.04031777381897e-06, -4.544854164123535e-06, -4.049390554428101e-06, -3.553926944732666e-06, -3.0584633350372314e-06, -2.562999725341797e-06, -2.0675361156463623e-06, -1.5720725059509277e-06, -1.0766088962554932e-06, -5.811452865600586e-07, -8.568167686462402e-08, 4.0978193283081055e-07, 9.052455425262451e-07, 1.4007091522216797e-06, 1.8961727619171143e-06, 2.391636371612549e-06, 2.8870999813079834e-06, 3.382563591003418e-06, 3.8780272006988525e-06, 4.373490810394287e-06, 4.868954420089722e-06, 5.364418029785156e-06, 5.859881639480591e-06, 6.355345249176025e-06, 6.85080885887146e-06, 7.3462724685668945e-06, 7.841736078262329e-06, 8.337199687957764e-06, 8.832663297653198e-06, 9.328126907348633e-06, 9.823590517044067e-06, 1.0319054126739502e-05, 1.0814517736434937e-05, 1.1309981346130371e-05, 1.1805444955825806e-05, 1.230090856552124e-05, 1.2796372175216675e-05, 1.329183578491211e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 6.0, 5.0, 5.0, 13.0, 11.0, 18.0, 39.0, 39.0, 62.0, 84.0, 129.0, 177.0, 298.0, 446.0, 801.0, 1568.0, 3383.0, 9346.0, 33801.0, 203319.0, 684626.0, 81059.0, 18471.0, 5707.0, 2314.0, 1115.0, 579.0, 393.0, 221.0, 144.0, 120.0, 64.0, 68.0, 41.0, 25.0, 15.0, 12.0, 10.0, 8.0, 0.0, 4.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5597915649414062, -0.5399932861328125, -0.5201950073242188, -0.500396728515625, -0.48059844970703125, -0.4608001708984375, -0.44100189208984375, -0.42120361328125, -0.40140533447265625, -0.3816070556640625, -0.36180877685546875, -0.342010498046875, -0.32221221923828125, -0.3024139404296875, -0.28261566162109375, -0.2628173828125, -0.24301910400390625, -0.2232208251953125, -0.20342254638671875, -0.183624267578125, -0.16382598876953125, -0.1440277099609375, -0.12422943115234375, -0.10443115234375, -0.08463287353515625, -0.0648345947265625, -0.04503631591796875, -0.025238037109375, -0.00543975830078125, 0.0143585205078125, 0.03415679931640625, 0.053955078125, 0.07375335693359375, 0.0935516357421875, 0.11334991455078125, 0.133148193359375, 0.15294647216796875, 0.1727447509765625, 0.19254302978515625, 0.21234130859375, 0.23213958740234375, 0.2519378662109375, 0.27173614501953125, 0.291534423828125, 0.31133270263671875, 0.3311309814453125, 0.35092926025390625, 0.3707275390625, 0.39052581787109375, 0.4103240966796875, 0.43012237548828125, 0.449920654296875, 0.46971893310546875, 0.4895172119140625, 0.5093154907226562, 0.52911376953125, 0.5489120483398438, 0.5687103271484375, 0.5885086059570312, 0.608306884765625, 0.6281051635742188, 0.6479034423828125, 0.6677017211914062, 0.6875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 6.0, 12.0, 15.0, 20.0, 22.0, 43.0, 60.0, 110.0, 134.0, 163.0, 138.0, 96.0, 62.0, 33.0, 28.0, 15.0, 10.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0941162109375, -0.09009170532226562, -0.08606719970703125, -0.08204269409179688, -0.0780181884765625, -0.07399368286132812, -0.06996917724609375, -0.06594467163085938, -0.061920166015625, -0.057895660400390625, -0.05387115478515625, -0.049846649169921875, -0.0458221435546875, -0.041797637939453125, -0.03777313232421875, -0.033748626708984375, -0.02972412109375, -0.025699615478515625, -0.02167510986328125, -0.017650604248046875, -0.0136260986328125, -0.009601593017578125, -0.00557708740234375, -0.001552581787109375, 0.002471923828125, 0.006496429443359375, 0.01052093505859375, 0.014545440673828125, 0.0185699462890625, 0.022594451904296875, 0.02661895751953125, 0.030643463134765625, 0.03466796875, 0.038692474365234375, 0.04271697998046875, 0.046741485595703125, 0.0507659912109375, 0.054790496826171875, 0.05881500244140625, 0.06283950805664062, 0.066864013671875, 0.07088851928710938, 0.07491302490234375, 0.07893753051757812, 0.0829620361328125, 0.08698654174804688, 0.09101104736328125, 0.09503555297851562, 0.09906005859375, 0.10308456420898438, 0.10710906982421875, 0.11113357543945312, 0.1151580810546875, 0.11918258666992188, 0.12320709228515625, 0.12723159790039062, 0.131256103515625, 0.13528060913085938, 0.13930511474609375, 0.14332962036132812, 0.1473541259765625, 0.15137863159179688, 0.15540313720703125, 0.15942764282226562, 0.1634521484375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 12.0, 5.0, 10.0, 17.0, 16.0, 32.0, 34.0, 61.0, 100.0, 110.0, 143.0, 111.0, 95.0, 61.0, 49.0, 39.0, 25.0, 19.0, 13.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4162213802337646, -2.348500967025757, -2.28078031539917, -2.213059902191162, -2.145339250564575, -2.0776188373565674, -2.0098981857299805, -1.9421777725219727, -1.8744572401046753, -1.806736707687378, -1.7390161752700806, -1.6712956428527832, -1.6035752296447754, -1.5358545780181885, -1.4681341648101807, -1.4004136323928833, -1.332693099975586, -1.2649725675582886, -1.1972520351409912, -1.1295315027236938, -1.0618109703063965, -0.9940904974937439, -0.9263700246810913, -0.858649492263794, -0.7909289598464966, -0.7232084274291992, -0.6554878950119019, -0.5877674221992493, -0.5200468897819519, -0.45232635736465454, -0.38460585474967957, -0.3168853521347046, -0.24916470050811768, -0.1814441829919815, -0.11372366547584534, -0.04600314795970917, 0.021717369556427002, 0.08943790197372437, 0.15715840458869934, 0.22487890720367432, 0.2925994396209717, 0.36031997203826904, 0.428040474653244, 0.495760977268219, 0.5634815096855164, 0.6312020421028137, 0.6989225149154663, 0.7666430473327637, 0.834363579750061, 0.9020841121673584, 0.9698046445846558, 1.0375251770019531, 1.105245590209961, 1.1729662418365479, 1.2406866550445557, 1.308407187461853, 1.3761277198791504, 1.4438482522964478, 1.5115687847137451, 1.5792893171310425, 1.6470098495483398, 1.7147302627563477, 1.782450795173645, 1.8501713275909424, 1.9178918600082397]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 11.0, 7.0, 6.0, 9.0, 12.0, 18.0, 16.0, 16.0, 27.0, 32.0, 32.0, 25.0, 36.0, 38.0, 34.0, 28.0, 40.0, 40.0, 43.0, 32.0, 48.0, 44.0, 42.0, 46.0, 48.0, 34.0, 26.0, 28.0, 28.0, 23.0, 25.0, 25.0, 15.0, 10.0, 12.0, 11.0, 7.0, 8.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1591284275054932, -1.121032476425171, -1.0829365253448486, -1.0448405742645264, -1.006744623184204, -0.9686486124992371, -0.93055260181427, -0.8924566507339478, -0.8543606996536255, -0.8162647485733032, -0.778168797492981, -0.7400727868080139, -0.7019768357276917, -0.6638808846473694, -0.6257848739624023, -0.5876889228820801, -0.5495929718017578, -0.5114970207214355, -0.4734010398387909, -0.43530505895614624, -0.397209107875824, -0.3591131567955017, -0.32101717591285706, -0.2829211950302124, -0.24482524394989014, -0.20672927796840668, -0.16863331198692322, -0.13053734600543976, -0.0924413800239563, -0.05434541404247284, -0.01624944806098938, 0.021846532821655273, 0.05994248390197754, 0.098038449883461, 0.13613441586494446, 0.17423038184642792, 0.21232634782791138, 0.25042229890823364, 0.2885182797908783, 0.32661426067352295, 0.3647102117538452, 0.4028061628341675, 0.44090214371681213, 0.4789981245994568, 0.517094075679779, 0.5551900267601013, 0.5932860374450684, 0.6313819885253906, 0.6694779396057129, 0.7075738906860352, 0.7456698417663574, 0.7837658524513245, 0.8218618035316467, 0.859957754611969, 0.898053765296936, 0.9361497163772583, 0.9742456674575806, 1.0123416185379028, 1.050437569618225, 1.0885335206985474, 1.1266295909881592, 1.1647255420684814, 1.2028214931488037, 1.240917444229126, 1.2790133953094482]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 15.0, 18.0, 36.0, 62.0, 58.0, 111.0, 158.0, 228.0, 345.0, 421.0, 657.0, 967.0, 1480.0, 2324.0, 3495.0, 5317.0, 8358.0, 13567.0, 22208.0, 37573.0, 66518.0, 124107.0, 233914.0, 235643.0, 125636.0, 67299.0, 37870.0, 22287.0, 13502.0, 8553.0, 5281.0, 3532.0, 2309.0, 1468.0, 1025.0, 698.0, 458.0, 329.0, 212.0, 138.0, 108.0, 69.0, 59.0, 40.0, 26.0, 16.0, 9.0, 14.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0], "bins": [-2.064453125, -2.0019073486328125, -1.939361572265625, -1.8768157958984375, -1.81427001953125, -1.7517242431640625, -1.689178466796875, -1.6266326904296875, -1.5640869140625, -1.5015411376953125, -1.438995361328125, -1.3764495849609375, -1.31390380859375, -1.2513580322265625, -1.188812255859375, -1.1262664794921875, -1.063720703125, -1.0011749267578125, -0.938629150390625, -0.8760833740234375, -0.81353759765625, -0.7509918212890625, -0.688446044921875, -0.6259002685546875, -0.5633544921875, -0.5008087158203125, -0.438262939453125, -0.3757171630859375, -0.31317138671875, -0.2506256103515625, -0.188079833984375, -0.1255340576171875, -0.06298828125, -0.0004425048828125, 0.062103271484375, 0.1246490478515625, 0.18719482421875, 0.2497406005859375, 0.312286376953125, 0.3748321533203125, 0.4373779296875, 0.4999237060546875, 0.562469482421875, 0.6250152587890625, 0.68756103515625, 0.7501068115234375, 0.812652587890625, 0.8751983642578125, 0.937744140625, 1.0002899169921875, 1.062835693359375, 1.1253814697265625, 1.18792724609375, 1.2504730224609375, 1.313018798828125, 1.3755645751953125, 1.4381103515625, 1.5006561279296875, 1.563201904296875, 1.6257476806640625, 1.68829345703125, 1.7508392333984375, 1.813385009765625, 1.8759307861328125, 1.9384765625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 10.0, 11.0, 12.0, 7.0, 11.0, 17.0, 23.0, 32.0, 20.0, 33.0, 32.0, 32.0, 37.0, 38.0, 45.0, 35.0, 46.0, 50.0, 51.0, 31.0, 44.0, 49.0, 52.0, 38.0, 38.0, 19.0, 36.0, 27.0, 29.0, 15.0, 13.0, 13.0, 15.0, 10.0, 9.0, 7.0, 7.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0394744873046875, -1.003753662109375, -0.9680328369140625, -0.93231201171875, -0.8965911865234375, -0.860870361328125, -0.8251495361328125, -0.7894287109375, -0.7537078857421875, -0.717987060546875, -0.6822662353515625, -0.64654541015625, -0.6108245849609375, -0.575103759765625, -0.5393829345703125, -0.503662109375, -0.4679412841796875, -0.432220458984375, -0.3964996337890625, -0.36077880859375, -0.3250579833984375, -0.289337158203125, -0.2536163330078125, -0.2178955078125, -0.1821746826171875, -0.146453857421875, -0.1107330322265625, -0.07501220703125, -0.0392913818359375, -0.003570556640625, 0.0321502685546875, 0.06787109375, 0.1035919189453125, 0.139312744140625, 0.1750335693359375, 0.21075439453125, 0.2464752197265625, 0.282196044921875, 0.3179168701171875, 0.3536376953125, 0.3893585205078125, 0.425079345703125, 0.4608001708984375, 0.49652099609375, 0.5322418212890625, 0.567962646484375, 0.6036834716796875, 0.639404296875, 0.6751251220703125, 0.710845947265625, 0.7465667724609375, 0.78228759765625, 0.8180084228515625, 0.853729248046875, 0.8894500732421875, 0.9251708984375, 0.9608917236328125, 0.996612548828125, 1.0323333740234375, 1.06805419921875, 1.1037750244140625, 1.139495849609375, 1.1752166748046875, 1.2109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 9.0, 5.0, 12.0, 28.0, 32.0, 47.0, 70.0, 71.0, 120.0, 182.0, 265.0, 377.0, 581.0, 894.0, 1391.0, 2054.0, 3229.0, 5229.0, 8403.0, 14660.0, 26131.0, 48092.0, 94133.0, 187710.0, 288264.0, 174097.0, 87475.0, 44805.0, 24540.0, 13844.0, 7987.0, 4895.0, 3094.0, 1919.0, 1278.0, 862.0, 582.0, 387.0, 248.0, 186.0, 111.0, 80.0, 62.0, 35.0, 23.0, 27.0, 10.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.13671875, -2.07086181640625, -2.0050048828125, -1.93914794921875, -1.873291015625, -1.80743408203125, -1.7415771484375, -1.67572021484375, -1.60986328125, -1.54400634765625, -1.4781494140625, -1.41229248046875, -1.346435546875, -1.28057861328125, -1.2147216796875, -1.14886474609375, -1.0830078125, -1.01715087890625, -0.9512939453125, -0.88543701171875, -0.819580078125, -0.75372314453125, -0.6878662109375, -0.62200927734375, -0.55615234375, -0.49029541015625, -0.4244384765625, -0.35858154296875, -0.292724609375, -0.22686767578125, -0.1610107421875, -0.09515380859375, -0.029296875, 0.03656005859375, 0.1024169921875, 0.16827392578125, 0.234130859375, 0.29998779296875, 0.3658447265625, 0.43170166015625, 0.49755859375, 0.56341552734375, 0.6292724609375, 0.69512939453125, 0.760986328125, 0.82684326171875, 0.8927001953125, 0.95855712890625, 1.0244140625, 1.09027099609375, 1.1561279296875, 1.22198486328125, 1.287841796875, 1.35369873046875, 1.4195556640625, 1.48541259765625, 1.55126953125, 1.61712646484375, 1.6829833984375, 1.74884033203125, 1.814697265625, 1.88055419921875, 1.9464111328125, 2.01226806640625, 2.078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 8.0, 13.0, 17.0, 16.0, 18.0, 18.0, 17.0, 22.0, 31.0, 37.0, 37.0, 40.0, 32.0, 49.0, 41.0, 45.0, 40.0, 29.0, 43.0, 46.0, 43.0, 28.0, 39.0, 40.0, 39.0, 18.0, 22.0, 10.0, 22.0, 16.0, 17.0, 17.0, 15.0, 6.0, 7.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67333984375, -0.6524810791015625, -0.631622314453125, -0.6107635498046875, -0.58990478515625, -0.5690460205078125, -0.548187255859375, -0.5273284912109375, -0.5064697265625, -0.4856109619140625, -0.464752197265625, -0.4438934326171875, -0.42303466796875, -0.4021759033203125, -0.381317138671875, -0.3604583740234375, -0.339599609375, -0.3187408447265625, -0.297882080078125, -0.2770233154296875, -0.25616455078125, -0.2353057861328125, -0.214447021484375, -0.1935882568359375, -0.1727294921875, -0.1518707275390625, -0.131011962890625, -0.1101531982421875, -0.08929443359375, -0.0684356689453125, -0.047576904296875, -0.0267181396484375, -0.005859375, 0.0149993896484375, 0.035858154296875, 0.0567169189453125, 0.07757568359375, 0.0984344482421875, 0.119293212890625, 0.1401519775390625, 0.1610107421875, 0.1818695068359375, 0.202728271484375, 0.2235870361328125, 0.24444580078125, 0.2653045654296875, 0.286163330078125, 0.3070220947265625, 0.327880859375, 0.3487396240234375, 0.369598388671875, 0.3904571533203125, 0.41131591796875, 0.4321746826171875, 0.453033447265625, 0.4738922119140625, 0.4947509765625, 0.5156097412109375, 0.536468505859375, 0.5573272705078125, 0.57818603515625, 0.5990447998046875, 0.619903564453125, 0.6407623291015625, 0.66162109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 12.0, 16.0, 16.0, 22.0, 41.0, 40.0, 55.0, 82.0, 120.0, 136.0, 204.0, 314.0, 476.0, 629.0, 931.0, 1464.0, 2310.0, 3865.0, 6961.0, 13487.0, 29605.0, 81226.0, 705160.0, 124056.0, 39279.0, 17107.0, 8492.0, 4572.0, 2723.0, 1669.0, 1066.0, 708.0, 470.0, 351.0, 240.0, 168.0, 151.0, 79.0, 72.0, 48.0, 26.0, 18.0, 31.0, 12.0, 14.0, 7.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.818359375, -1.7626800537109375, -1.707000732421875, -1.6513214111328125, -1.59564208984375, -1.5399627685546875, -1.484283447265625, -1.4286041259765625, -1.3729248046875, -1.3172454833984375, -1.261566162109375, -1.2058868408203125, -1.15020751953125, -1.0945281982421875, -1.038848876953125, -0.9831695556640625, -0.927490234375, -0.8718109130859375, -0.816131591796875, -0.7604522705078125, -0.70477294921875, -0.6490936279296875, -0.593414306640625, -0.5377349853515625, -0.4820556640625, -0.4263763427734375, -0.370697021484375, -0.3150177001953125, -0.25933837890625, -0.2036590576171875, -0.147979736328125, -0.0923004150390625, -0.03662109375, 0.0190582275390625, 0.074737548828125, 0.1304168701171875, 0.18609619140625, 0.2417755126953125, 0.297454833984375, 0.3531341552734375, 0.4088134765625, 0.4644927978515625, 0.520172119140625, 0.5758514404296875, 0.63153076171875, 0.6872100830078125, 0.742889404296875, 0.7985687255859375, 0.854248046875, 0.9099273681640625, 0.965606689453125, 1.0212860107421875, 1.07696533203125, 1.1326446533203125, 1.188323974609375, 1.2440032958984375, 1.2996826171875, 1.3553619384765625, 1.411041259765625, 1.4667205810546875, 1.52239990234375, 1.5780792236328125, 1.633758544921875, 1.6894378662109375, 1.7451171875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 5.0, 1.0, 8.0, 8.0, 9.0, 25.0, 27.0, 34.0, 94.0, 418.0, 164.0, 87.0, 32.0, 27.0, 25.0, 7.0, 5.0, 5.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.015466690063477e-05, -6.754230707883835e-05, -6.492994725704193e-05, -6.231758743524551e-05, -5.97052276134491e-05, -5.709286779165268e-05, -5.448050796985626e-05, -5.1868148148059845e-05, -4.925578832626343e-05, -4.664342850446701e-05, -4.403106868267059e-05, -4.1418708860874176e-05, -3.880634903907776e-05, -3.619398921728134e-05, -3.3581629395484924e-05, -3.096926957368851e-05, -2.835690975189209e-05, -2.5744549930095673e-05, -2.3132190108299255e-05, -2.0519830286502838e-05, -1.790747046470642e-05, -1.5295110642910004e-05, -1.2682750821113586e-05, -1.007039099931717e-05, -7.458031177520752e-06, -4.845671355724335e-06, -2.2333115339279175e-06, 3.7904828786849976e-07, 2.991408109664917e-06, 5.603767931461334e-06, 8.216127753257751e-06, 1.0828487575054169e-05, 1.3440847396850586e-05, 1.6053207218647003e-05, 1.866556704044342e-05, 2.1277926862239838e-05, 2.3890286684036255e-05, 2.6502646505832672e-05, 2.911500632762909e-05, 3.1727366149425507e-05, 3.4339725971221924e-05, 3.695208579301834e-05, 3.956444561481476e-05, 4.2176805436611176e-05, 4.478916525840759e-05, 4.740152508020401e-05, 5.001388490200043e-05, 5.2626244723796844e-05, 5.523860454559326e-05, 5.785096436738968e-05, 6.0463324189186096e-05, 6.307568401098251e-05, 6.568804383277893e-05, 6.830040365457535e-05, 7.091276347637177e-05, 7.352512329816818e-05, 7.61374831199646e-05, 7.874984294176102e-05, 8.136220276355743e-05, 8.397456258535385e-05, 8.658692240715027e-05, 8.919928222894669e-05, 9.18116420507431e-05, 9.442400187253952e-05, 9.703636169433594e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 3.0, 10.0, 11.0, 13.0, 21.0, 19.0, 48.0, 68.0, 79.0, 96.0, 149.0, 244.0, 346.0, 528.0, 796.0, 1308.0, 2200.0, 3684.0, 6339.0, 11874.0, 24350.0, 66587.0, 703817.0, 146837.0, 40365.0, 17009.0, 8910.0, 5062.0, 2947.0, 1788.0, 1052.0, 656.0, 448.0, 282.0, 181.0, 114.0, 93.0, 60.0, 55.0, 34.0, 20.0, 11.0, 17.0, 5.0, 3.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.671875, -1.61376953125, -1.5556640625, -1.49755859375, -1.439453125, -1.38134765625, -1.3232421875, -1.26513671875, -1.20703125, -1.14892578125, -1.0908203125, -1.03271484375, -0.974609375, -0.91650390625, -0.8583984375, -0.80029296875, -0.7421875, -0.68408203125, -0.6259765625, -0.56787109375, -0.509765625, -0.45166015625, -0.3935546875, -0.33544921875, -0.27734375, -0.21923828125, -0.1611328125, -0.10302734375, -0.044921875, 0.01318359375, 0.0712890625, 0.12939453125, 0.1875, 0.24560546875, 0.3037109375, 0.36181640625, 0.419921875, 0.47802734375, 0.5361328125, 0.59423828125, 0.65234375, 0.71044921875, 0.7685546875, 0.82666015625, 0.884765625, 0.94287109375, 1.0009765625, 1.05908203125, 1.1171875, 1.17529296875, 1.2333984375, 1.29150390625, 1.349609375, 1.40771484375, 1.4658203125, 1.52392578125, 1.58203125, 1.64013671875, 1.6982421875, 1.75634765625, 1.814453125, 1.87255859375, 1.9306640625, 1.98876953125, 2.046875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 17.0, 17.0, 4.0, 12.0, 13.0, 30.0, 42.0, 36.0, 51.0, 153.0, 323.0, 50.0, 58.0, 40.0, 20.0, 25.0, 17.0, 11.0, 8.0, 8.0, 12.0, 4.0, 7.0, 7.0, 2.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.393798828125, -0.3792381286621094, -0.36467742919921875, -0.3501167297363281, -0.3355560302734375, -0.3209953308105469, -0.30643463134765625, -0.2918739318847656, -0.277313232421875, -0.2627525329589844, -0.24819183349609375, -0.23363113403320312, -0.2190704345703125, -0.20450973510742188, -0.18994903564453125, -0.17538833618164062, -0.16082763671875, -0.14626693725585938, -0.13170623779296875, -0.11714553833007812, -0.1025848388671875, -0.08802413940429688, -0.07346343994140625, -0.058902740478515625, -0.044342041015625, -0.029781341552734375, -0.01522064208984375, -0.000659942626953125, 0.0139007568359375, 0.028461456298828125, 0.04302215576171875, 0.057582855224609375, 0.0721435546875, 0.08670425415039062, 0.10126495361328125, 0.11582565307617188, 0.1303863525390625, 0.14494705200195312, 0.15950775146484375, 0.17406845092773438, 0.188629150390625, 0.20318984985351562, 0.21775054931640625, 0.23231124877929688, 0.2468719482421875, 0.2614326477050781, 0.27599334716796875, 0.2905540466308594, 0.30511474609375, 0.3196754455566406, 0.33423614501953125, 0.3487968444824219, 0.3633575439453125, 0.3779182434082031, 0.39247894287109375, 0.4070396423339844, 0.421600341796875, 0.4361610412597656, 0.45072174072265625, 0.4652824401855469, 0.4798431396484375, 0.4944038391113281, 0.5089645385742188, 0.5235252380371094, 0.5380859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 10.0, 9.0, 10.0, 9.0, 23.0, 31.0, 39.0, 57.0, 79.0, 88.0, 135.0, 99.0, 93.0, 58.0, 51.0, 53.0, 33.0, 21.0, 23.0, 12.0, 11.0, 6.0, 7.0, 4.0, 3.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5896393060684204, -1.5361613035202026, -1.4826831817626953, -1.4292051792144775, -1.3757271766662598, -1.3222490549087524, -1.2687710523605347, -1.2152929306030273, -1.1618149280548096, -1.1083369255065918, -1.0548588037490845, -1.0013808012008667, -0.9479027390480042, -0.8944246768951416, -0.8409466743469238, -0.7874686121940613, -0.7339905500411987, -0.6805124878883362, -0.6270344257354736, -0.5735564231872559, -0.5200783610343933, -0.46660029888153076, -0.4131222665309906, -0.35964423418045044, -0.3061661720275879, -0.25268810987472534, -0.19921007752418518, -0.14573203027248383, -0.09225398302078247, -0.03877592086791992, 0.01470211148262024, 0.0681801438331604, 0.1216580867767334, 0.17513613402843475, 0.2286141812801361, 0.28209221363067627, 0.3355702757835388, 0.38904833793640137, 0.44252637028694153, 0.4960044026374817, 0.5494824647903442, 0.6029605269432068, 0.6564385890960693, 0.7099165916442871, 0.7633946537971497, 0.8168727159500122, 0.87035071849823, 0.9238287806510925, 0.9773068428039551, 1.0307848453521729, 1.0842629671096802, 1.137740969657898, 1.1912190914154053, 1.244697093963623, 1.2981750965118408, 1.3516530990600586, 1.405131220817566, 1.4586092233657837, 1.512087345123291, 1.5655653476715088, 1.6190433502197266, 1.6725214719772339, 1.7259994745254517, 1.779477596282959, 1.8329555988311768]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 9.0, 12.0, 11.0, 11.0, 20.0, 28.0, 26.0, 27.0, 20.0, 29.0, 38.0, 30.0, 40.0, 29.0, 51.0, 35.0, 29.0, 48.0, 39.0, 45.0, 40.0, 34.0, 32.0, 39.0, 26.0, 31.0, 22.0, 26.0, 35.0, 23.0, 16.0, 17.0, 17.0, 6.0, 2.0, 11.0, 8.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.099994421005249, -1.0658196210861206, -1.0316448211669922, -0.9974700808525085, -0.9632953405380249, -0.9291205406188965, -0.8949457406997681, -0.8607709407806396, -0.826596200466156, -0.7924214005470276, -0.758246660232544, -0.7240718603134155, -0.6898970603942871, -0.6557223200798035, -0.621547520160675, -0.5873727798461914, -0.553197979927063, -0.5190231800079346, -0.4848484396934509, -0.4506736397743225, -0.4164988696575165, -0.38232409954071045, -0.34814929962158203, -0.313974529504776, -0.27979975938796997, -0.24562498927116394, -0.21145020425319672, -0.1772754192352295, -0.14310064911842346, -0.10892587900161743, -0.07475109398365021, -0.04057630896568298, -0.006401419639587402, 0.027773357927799225, 0.06194813549518585, 0.09612291306257248, 0.1302976906299591, 0.16447246074676514, 0.19864724576473236, 0.23282203078269958, 0.2669968008995056, 0.30117157101631165, 0.3353463411331177, 0.3695211410522461, 0.4036959111690521, 0.43787068128585815, 0.4720454812049866, 0.5062202215194702, 0.5403950214385986, 0.574569821357727, 0.6087445616722107, 0.6429193615913391, 0.6770941019058228, 0.7112689018249512, 0.7454437017440796, 0.779618501663208, 0.8137932419776917, 0.8479680418968201, 0.8821427822113037, 0.9163175821304321, 0.9504923820495605, 0.9846671223640442, 1.0188418626785278, 1.0530166625976562, 1.0871914625167847]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 7.0, 13.0, 24.0, 25.0, 41.0, 72.0, 78.0, 135.0, 203.0, 278.0, 445.0, 583.0, 864.0, 1244.0, 1812.0, 2720.0, 4235.0, 6503.0, 9993.0, 15467.0, 24844.0, 41406.0, 71534.0, 134132.0, 305540.0, 1079556.0, 1560673.0, 514188.0, 191719.0, 94718.0, 51761.0, 30206.0, 18507.0, 11281.0, 7124.0, 4467.0, 2971.0, 1722.0, 1189.0, 718.0, 423.0, 292.0, 202.0, 117.0, 87.0, 49.0, 45.0, 22.0, 16.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4609375, -1.4155731201171875, -1.370208740234375, -1.3248443603515625, -1.27947998046875, -1.2341156005859375, -1.188751220703125, -1.1433868408203125, -1.0980224609375, -1.0526580810546875, -1.007293701171875, -0.9619293212890625, -0.91656494140625, -0.8712005615234375, -0.825836181640625, -0.7804718017578125, -0.735107421875, -0.6897430419921875, -0.644378662109375, -0.5990142822265625, -0.55364990234375, -0.5082855224609375, -0.462921142578125, -0.4175567626953125, -0.3721923828125, -0.3268280029296875, -0.281463623046875, -0.2360992431640625, -0.19073486328125, -0.1453704833984375, -0.100006103515625, -0.0546417236328125, -0.00927734375, 0.0360870361328125, 0.081451416015625, 0.1268157958984375, 0.17218017578125, 0.2175445556640625, 0.262908935546875, 0.3082733154296875, 0.3536376953125, 0.3990020751953125, 0.444366455078125, 0.4897308349609375, 0.53509521484375, 0.5804595947265625, 0.625823974609375, 0.6711883544921875, 0.716552734375, 0.7619171142578125, 0.807281494140625, 0.8526458740234375, 0.89801025390625, 0.9433746337890625, 0.988739013671875, 1.0341033935546875, 1.0794677734375, 1.1248321533203125, 1.170196533203125, 1.2155609130859375, 1.26092529296875, 1.3062896728515625, 1.351654052734375, 1.3970184326171875, 1.4423828125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 13.0, 9.0, 10.0, 17.0, 13.0, 21.0, 23.0, 23.0, 26.0, 32.0, 30.0, 37.0, 39.0, 45.0, 37.0, 42.0, 44.0, 43.0, 37.0, 42.0, 45.0, 35.0, 36.0, 31.0, 32.0, 31.0, 27.0, 32.0, 18.0, 27.0, 14.0, 19.0, 14.0, 11.0, 4.0, 8.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72021484375, -0.697967529296875, -0.67572021484375, -0.653472900390625, -0.6312255859375, -0.608978271484375, -0.58673095703125, -0.564483642578125, -0.542236328125, -0.519989013671875, -0.49774169921875, -0.475494384765625, -0.4532470703125, -0.430999755859375, -0.40875244140625, -0.386505126953125, -0.3642578125, -0.342010498046875, -0.31976318359375, -0.297515869140625, -0.2752685546875, -0.253021240234375, -0.23077392578125, -0.208526611328125, -0.186279296875, -0.164031982421875, -0.14178466796875, -0.119537353515625, -0.0972900390625, -0.075042724609375, -0.05279541015625, -0.030548095703125, -0.00830078125, 0.013946533203125, 0.03619384765625, 0.058441162109375, 0.0806884765625, 0.102935791015625, 0.12518310546875, 0.147430419921875, 0.169677734375, 0.191925048828125, 0.21417236328125, 0.236419677734375, 0.2586669921875, 0.280914306640625, 0.30316162109375, 0.325408935546875, 0.34765625, 0.369903564453125, 0.39215087890625, 0.414398193359375, 0.4366455078125, 0.458892822265625, 0.48114013671875, 0.503387451171875, 0.525634765625, 0.547882080078125, 0.57012939453125, 0.592376708984375, 0.6146240234375, 0.636871337890625, 0.65911865234375, 0.681365966796875, 0.70361328125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 2.0, 12.0, 21.0, 36.0, 47.0, 64.0, 98.0, 196.0, 276.0, 466.0, 829.0, 1273.0, 2219.0, 3697.0, 6480.0, 11495.0, 21223.0, 39934.0, 81823.0, 179184.0, 454462.0, 1512557.0, 1200104.0, 375146.0, 152547.0, 71062.0, 35686.0, 18790.0, 10407.0, 5893.0, 3320.0, 1945.0, 1200.0, 684.0, 427.0, 239.0, 176.0, 101.0, 55.0, 33.0, 35.0, 19.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.4004364013671875, -1.353607177734375, -1.3067779541015625, -1.25994873046875, -1.2131195068359375, -1.166290283203125, -1.1194610595703125, -1.0726318359375, -1.0258026123046875, -0.978973388671875, -0.9321441650390625, -0.88531494140625, -0.8384857177734375, -0.791656494140625, -0.7448272705078125, -0.697998046875, -0.6511688232421875, -0.604339599609375, -0.5575103759765625, -0.51068115234375, -0.4638519287109375, -0.417022705078125, -0.3701934814453125, -0.3233642578125, -0.2765350341796875, -0.229705810546875, -0.1828765869140625, -0.13604736328125, -0.0892181396484375, -0.042388916015625, 0.0044403076171875, 0.05126953125, 0.0980987548828125, 0.144927978515625, 0.1917572021484375, 0.23858642578125, 0.2854156494140625, 0.332244873046875, 0.3790740966796875, 0.4259033203125, 0.4727325439453125, 0.519561767578125, 0.5663909912109375, 0.61322021484375, 0.6600494384765625, 0.706878662109375, 0.7537078857421875, 0.800537109375, 0.8473663330078125, 0.894195556640625, 0.9410247802734375, 0.98785400390625, 1.0346832275390625, 1.081512451171875, 1.1283416748046875, 1.1751708984375, 1.2220001220703125, 1.268829345703125, 1.3156585693359375, 1.36248779296875, 1.4093170166015625, 1.456146240234375, 1.5029754638671875, 1.5498046875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 10.0, 22.0, 19.0, 25.0, 23.0, 33.0, 41.0, 71.0, 85.0, 92.0, 98.0, 125.0, 153.0, 203.0, 195.0, 231.0, 265.0, 286.0, 281.0, 291.0, 226.0, 231.0, 196.0, 156.0, 128.0, 117.0, 89.0, 60.0, 54.0, 60.0, 41.0, 39.0, 25.0, 13.0, 19.0, 10.0, 13.0, 10.0, 4.0, 10.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0], "bins": [-0.436767578125, -0.4246978759765625, -0.412628173828125, -0.4005584716796875, -0.38848876953125, -0.3764190673828125, -0.364349365234375, -0.3522796630859375, -0.3402099609375, -0.3281402587890625, -0.316070556640625, -0.3040008544921875, -0.29193115234375, -0.2798614501953125, -0.267791748046875, -0.2557220458984375, -0.24365234375, -0.2315826416015625, -0.219512939453125, -0.2074432373046875, -0.19537353515625, -0.1833038330078125, -0.171234130859375, -0.1591644287109375, -0.1470947265625, -0.1350250244140625, -0.122955322265625, -0.1108856201171875, -0.09881591796875, -0.0867462158203125, -0.074676513671875, -0.0626068115234375, -0.050537109375, -0.0384674072265625, -0.026397705078125, -0.0143280029296875, -0.00225830078125, 0.0098114013671875, 0.021881103515625, 0.0339508056640625, 0.0460205078125, 0.0580902099609375, 0.070159912109375, 0.0822296142578125, 0.09429931640625, 0.1063690185546875, 0.118438720703125, 0.1305084228515625, 0.142578125, 0.1546478271484375, 0.166717529296875, 0.1787872314453125, 0.19085693359375, 0.2029266357421875, 0.214996337890625, 0.2270660400390625, 0.2391357421875, 0.2512054443359375, 0.263275146484375, 0.2753448486328125, 0.28741455078125, 0.2994842529296875, 0.311553955078125, 0.3236236572265625, 0.335693359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 1.0, 8.0, 6.0, 8.0, 7.0, 13.0, 26.0, 24.0, 44.0, 45.0, 76.0, 82.0, 117.0, 109.0, 105.0, 75.0, 60.0, 56.0, 34.0, 23.0, 14.0, 18.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6699382066726685, -1.6285617351531982, -1.587185263633728, -1.5458087921142578, -1.5044323205947876, -1.4630558490753174, -1.4216793775558472, -1.380302906036377, -1.3389265537261963, -1.297550082206726, -1.2561736106872559, -1.2147971391677856, -1.1734206676483154, -1.1320441961288452, -1.090667724609375, -1.0492913722991943, -1.0079147815704346, -0.9665383100509644, -0.9251618385314941, -0.8837853670120239, -0.8424088954925537, -0.8010324239730835, -0.7596560120582581, -0.7182795405387878, -0.6769030690193176, -0.6355265974998474, -0.5941501259803772, -0.552773654460907, -0.5113972425460815, -0.47002074122428894, -0.4286442995071411, -0.3872678279876709, -0.3458913564682007, -0.30451488494873047, -0.26313841342926025, -0.22176197171211243, -0.1803855001926422, -0.139009028673172, -0.09763257205486298, -0.056256115436553955, -0.01487964391708374, 0.026496820151805878, 0.0678732842206955, 0.10924974828958511, 0.15062621235847473, 0.19200268387794495, 0.23337914049625397, 0.274755597114563, 0.3161320686340332, 0.3575085401535034, 0.39888501167297363, 0.44026145339012146, 0.4816379249095917, 0.5230144262313843, 0.5643908381462097, 0.6057673096656799, 0.6471437811851501, 0.6885202527046204, 0.7298967242240906, 0.7712731957435608, 0.8126496076583862, 0.8540260791778564, 0.8954025506973267, 0.9367790222167969, 0.9781554937362671]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 7.0, 11.0, 13.0, 14.0, 19.0, 24.0, 26.0, 27.0, 20.0, 30.0, 27.0, 23.0, 31.0, 30.0, 33.0, 28.0, 30.0, 35.0, 27.0, 42.0, 46.0, 37.0, 36.0, 38.0, 45.0, 30.0, 38.0, 28.0, 38.0, 22.0, 19.0, 27.0, 12.0, 11.0, 14.0, 14.0, 13.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7955688834190369, -0.7720916867256165, -0.7486144304275513, -0.7251372337341309, -0.7016600370407104, -0.6781827807426453, -0.6547055840492249, -0.6312283277511597, -0.6077511310577393, -0.5842739343643188, -0.5607966780662537, -0.5373194813728333, -0.5138422250747681, -0.49036502838134766, -0.46688783168792725, -0.44341060519218445, -0.41993337869644165, -0.39645615220069885, -0.37297892570495605, -0.34950172901153564, -0.32602450251579285, -0.30254727602005005, -0.27907007932662964, -0.25559285283088684, -0.23211562633514404, -0.20863839983940125, -0.18516118824481964, -0.16168397665023804, -0.13820675015449524, -0.11472953110933304, -0.09125231206417084, -0.06777510046958923, -0.044297873973846436, -0.020820654928684235, 0.0026565641164779663, 0.026133783161640167, 0.04961100220680237, 0.07308822125196457, 0.09656544029712677, 0.12004265189170837, 0.14351987838745117, 0.16699710488319397, 0.19047431647777557, 0.21395152807235718, 0.23742875456809998, 0.2609059810638428, 0.2843831777572632, 0.307860404253006, 0.3313376307487488, 0.3548148572444916, 0.3782920837402344, 0.4017692804336548, 0.4252465069293976, 0.4487237334251404, 0.4722009301185608, 0.4956781566143036, 0.5191553831100464, 0.5426325798034668, 0.566109836101532, 0.5895870327949524, 0.6130642890930176, 0.636541485786438, 0.6600186824798584, 0.6834958791732788, 0.706973135471344]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 8.0, 21.0, 22.0, 37.0, 51.0, 82.0, 111.0, 193.0, 297.0, 436.0, 604.0, 883.0, 1305.0, 1871.0, 2786.0, 4027.0, 6423.0, 10285.0, 17422.0, 30891.0, 60231.0, 132743.0, 328325.0, 239364.0, 98540.0, 46977.0, 25055.0, 14356.0, 8678.0, 5405.0, 3601.0, 2357.0, 1634.0, 1140.0, 805.0, 525.0, 334.0, 224.0, 175.0, 104.0, 80.0, 44.0, 30.0, 25.0, 14.0, 10.0, 9.0, 7.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.56640625, -0.550140380859375, -0.53387451171875, -0.517608642578125, -0.5013427734375, -0.485076904296875, -0.46881103515625, -0.452545166015625, -0.436279296875, -0.420013427734375, -0.40374755859375, -0.387481689453125, -0.3712158203125, -0.354949951171875, -0.33868408203125, -0.322418212890625, -0.30615234375, -0.289886474609375, -0.27362060546875, -0.257354736328125, -0.2410888671875, -0.224822998046875, -0.20855712890625, -0.192291259765625, -0.176025390625, -0.159759521484375, -0.14349365234375, -0.127227783203125, -0.1109619140625, -0.094696044921875, -0.07843017578125, -0.062164306640625, -0.0458984375, -0.029632568359375, -0.01336669921875, 0.002899169921875, 0.0191650390625, 0.035430908203125, 0.05169677734375, 0.067962646484375, 0.084228515625, 0.100494384765625, 0.11676025390625, 0.133026123046875, 0.1492919921875, 0.165557861328125, 0.18182373046875, 0.198089599609375, 0.21435546875, 0.230621337890625, 0.24688720703125, 0.263153076171875, 0.2794189453125, 0.295684814453125, 0.31195068359375, 0.328216552734375, 0.344482421875, 0.360748291015625, 0.37701416015625, 0.393280029296875, 0.4095458984375, 0.425811767578125, 0.44207763671875, 0.458343505859375, 0.474609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 6.0, 7.0, 5.0, 10.0, 14.0, 16.0, 14.0, 18.0, 26.0, 23.0, 34.0, 27.0, 31.0, 30.0, 29.0, 31.0, 38.0, 32.0, 30.0, 33.0, 53.0, 51.0, 46.0, 33.0, 37.0, 41.0, 37.0, 33.0, 30.0, 36.0, 32.0, 17.0, 18.0, 18.0, 11.0, 10.0, 17.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.84716796875, -0.8222732543945312, -0.7973785400390625, -0.7724838256835938, -0.747589111328125, -0.7226943969726562, -0.6977996826171875, -0.6729049682617188, -0.64801025390625, -0.6231155395507812, -0.5982208251953125, -0.5733261108398438, -0.548431396484375, -0.5235366821289062, -0.4986419677734375, -0.47374725341796875, -0.4488525390625, -0.42395782470703125, -0.3990631103515625, -0.37416839599609375, -0.349273681640625, -0.32437896728515625, -0.2994842529296875, -0.27458953857421875, -0.24969482421875, -0.22480010986328125, -0.1999053955078125, -0.17501068115234375, -0.150115966796875, -0.12522125244140625, -0.1003265380859375, -0.07543182373046875, -0.050537109375, -0.02564239501953125, -0.0007476806640625, 0.02414703369140625, 0.049041748046875, 0.07393646240234375, 0.0988311767578125, 0.12372589111328125, 0.14862060546875, 0.17351531982421875, 0.1984100341796875, 0.22330474853515625, 0.248199462890625, 0.27309417724609375, 0.2979888916015625, 0.32288360595703125, 0.3477783203125, 0.37267303466796875, 0.3975677490234375, 0.42246246337890625, 0.447357177734375, 0.47225189208984375, 0.4971466064453125, 0.5220413208007812, 0.54693603515625, 0.5718307495117188, 0.5967254638671875, 0.6216201782226562, 0.646514892578125, 0.6714096069335938, 0.6963043212890625, 0.7211990356445312, 0.74609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 17.0, 24.0, 31.0, 34.0, 59.0, 77.0, 135.0, 183.0, 249.0, 371.0, 485.0, 679.0, 1001.0, 1381.0, 2069.0, 3005.0, 4738.0, 7672.0, 13929.0, 29860.0, 103050.0, 659932.0, 144352.0, 35592.0, 15638.0, 8510.0, 5020.0, 3255.0, 2117.0, 1498.0, 986.0, 711.0, 503.0, 397.0, 265.0, 210.0, 134.0, 99.0, 74.0, 54.0, 42.0, 32.0, 19.0, 12.0, 13.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.873046875, -0.8470535278320312, -0.8210601806640625, -0.7950668334960938, -0.769073486328125, -0.7430801391601562, -0.7170867919921875, -0.6910934448242188, -0.66510009765625, -0.6391067504882812, -0.6131134033203125, -0.5871200561523438, -0.561126708984375, -0.5351333618164062, -0.5091400146484375, -0.48314666748046875, -0.4571533203125, -0.43115997314453125, -0.4051666259765625, -0.37917327880859375, -0.353179931640625, -0.32718658447265625, -0.3011932373046875, -0.27519989013671875, -0.24920654296875, -0.22321319580078125, -0.1972198486328125, -0.17122650146484375, -0.145233154296875, -0.11923980712890625, -0.0932464599609375, -0.06725311279296875, -0.041259765625, -0.01526641845703125, 0.0107269287109375, 0.03672027587890625, 0.062713623046875, 0.08870697021484375, 0.1147003173828125, 0.14069366455078125, 0.16668701171875, 0.19268035888671875, 0.2186737060546875, 0.24466705322265625, 0.270660400390625, 0.29665374755859375, 0.3226470947265625, 0.34864044189453125, 0.3746337890625, 0.40062713623046875, 0.4266204833984375, 0.45261383056640625, 0.478607177734375, 0.5046005249023438, 0.5305938720703125, 0.5565872192382812, 0.58258056640625, 0.6085739135742188, 0.6345672607421875, 0.6605606079101562, 0.686553955078125, 0.7125473022460938, 0.7385406494140625, 0.7645339965820312, 0.79052734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 4.0, 10.0, 12.0, 14.0, 20.0, 17.0, 18.0, 18.0, 20.0, 24.0, 28.0, 36.0, 32.0, 37.0, 29.0, 44.0, 44.0, 37.0, 51.0, 47.0, 33.0, 33.0, 37.0, 35.0, 41.0, 29.0, 29.0, 19.0, 23.0, 24.0, 28.0, 28.0, 11.0, 20.0, 11.0, 6.0, 7.0, 4.0, 6.0, 0.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.50732421875, -0.49143218994140625, -0.4755401611328125, -0.45964813232421875, -0.443756103515625, -0.42786407470703125, -0.4119720458984375, -0.39608001708984375, -0.38018798828125, -0.36429595947265625, -0.3484039306640625, -0.33251190185546875, -0.316619873046875, -0.30072784423828125, -0.2848358154296875, -0.26894378662109375, -0.2530517578125, -0.23715972900390625, -0.2212677001953125, -0.20537567138671875, -0.189483642578125, -0.17359161376953125, -0.1576995849609375, -0.14180755615234375, -0.12591552734375, -0.11002349853515625, -0.0941314697265625, -0.07823944091796875, -0.062347412109375, -0.04645538330078125, -0.0305633544921875, -0.01467132568359375, 0.001220703125, 0.01711273193359375, 0.0330047607421875, 0.04889678955078125, 0.064788818359375, 0.08068084716796875, 0.0965728759765625, 0.11246490478515625, 0.12835693359375, 0.14424896240234375, 0.1601409912109375, 0.17603302001953125, 0.191925048828125, 0.20781707763671875, 0.2237091064453125, 0.23960113525390625, 0.2554931640625, 0.27138519287109375, 0.2872772216796875, 0.30316925048828125, 0.319061279296875, 0.33495330810546875, 0.3508453369140625, 0.36673736572265625, 0.38262939453125, 0.39852142333984375, 0.4144134521484375, 0.43030548095703125, 0.446197509765625, 0.46208953857421875, 0.4779815673828125, 0.49387359619140625, 0.509765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 6.0, 9.0, 18.0, 30.0, 36.0, 46.0, 44.0, 73.0, 112.0, 129.0, 199.0, 302.0, 408.0, 565.0, 866.0, 1524.0, 2738.0, 5480.0, 12417.0, 37934.0, 249229.0, 647300.0, 57331.0, 16560.0, 6869.0, 3304.0, 1771.0, 1013.0, 669.0, 435.0, 320.0, 217.0, 155.0, 94.0, 80.0, 70.0, 41.0, 37.0, 25.0, 18.0, 14.0, 15.0, 10.0, 5.0, 4.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.244384765625, -0.23701095581054688, -0.22963714599609375, -0.22226333618164062, -0.2148895263671875, -0.20751571655273438, -0.20014190673828125, -0.19276809692382812, -0.185394287109375, -0.17802047729492188, -0.17064666748046875, -0.16327285766601562, -0.1558990478515625, -0.14852523803710938, -0.14115142822265625, -0.13377761840820312, -0.12640380859375, -0.11902999877929688, -0.11165618896484375, -0.10428237915039062, -0.0969085693359375, -0.08953475952148438, -0.08216094970703125, -0.07478713989257812, -0.067413330078125, -0.060039520263671875, -0.05266571044921875, -0.045291900634765625, -0.0379180908203125, -0.030544281005859375, -0.02317047119140625, -0.015796661376953125, -0.0084228515625, -0.001049041748046875, 0.00632476806640625, 0.013698577880859375, 0.0210723876953125, 0.028446197509765625, 0.03582000732421875, 0.043193817138671875, 0.050567626953125, 0.057941436767578125, 0.06531524658203125, 0.07268905639648438, 0.0800628662109375, 0.08743667602539062, 0.09481048583984375, 0.10218429565429688, 0.10955810546875, 0.11693191528320312, 0.12430572509765625, 0.13167953491210938, 0.1390533447265625, 0.14642715454101562, 0.15380096435546875, 0.16117477416992188, 0.168548583984375, 0.17592239379882812, 0.18329620361328125, 0.19067001342773438, 0.1980438232421875, 0.20541763305664062, 0.21279144287109375, 0.22016525268554688, 0.2275390625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 8.0, 11.0, 14.0, 12.0, 14.0, 24.0, 17.0, 20.0, 37.0, 47.0, 53.0, 90.0, 95.0, 93.0, 85.0, 90.0, 78.0, 44.0, 38.0, 27.0, 26.0, 16.0, 16.0, 10.0, 3.0, 6.0, 4.0, 0.0, 1.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-06, -5.142763257026672e-06, -4.9211084842681885e-06, -4.699453711509705e-06, -4.477798938751221e-06, -4.256144165992737e-06, -4.034489393234253e-06, -3.812834620475769e-06, -3.591179847717285e-06, -3.3695250749588013e-06, -3.1478703022003174e-06, -2.9262155294418335e-06, -2.7045607566833496e-06, -2.4829059839248657e-06, -2.261251211166382e-06, -2.039596438407898e-06, -1.817941665649414e-06, -1.5962868928909302e-06, -1.3746321201324463e-06, -1.1529773473739624e-06, -9.313225746154785e-07, -7.096678018569946e-07, -4.880130290985107e-07, -2.6635825634002686e-07, -4.470348358154297e-08, 1.7695128917694092e-07, 3.986060619354248e-07, 6.202608346939087e-07, 8.419156074523926e-07, 1.0635703802108765e-06, 1.2852251529693604e-06, 1.5068799257278442e-06, 1.7285346984863281e-06, 1.950189471244812e-06, 2.171844244003296e-06, 2.3934990167617798e-06, 2.6151537895202637e-06, 2.8368085622787476e-06, 3.0584633350372314e-06, 3.2801181077957153e-06, 3.5017728805541992e-06, 3.723427653312683e-06, 3.945082426071167e-06, 4.166737198829651e-06, 4.388391971588135e-06, 4.610046744346619e-06, 4.8317015171051025e-06, 5.0533562898635864e-06, 5.27501106262207e-06, 5.496665835380554e-06, 5.718320608139038e-06, 5.939975380897522e-06, 6.161630153656006e-06, 6.38328492641449e-06, 6.604939699172974e-06, 6.8265944719314575e-06, 7.048249244689941e-06, 7.269904017448425e-06, 7.491558790206909e-06, 7.713213562965393e-06, 7.934868335723877e-06, 8.15652310848236e-06, 8.378177881240845e-06, 8.599832653999329e-06, 8.821487426757812e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 17.0, 13.0, 17.0, 29.0, 32.0, 49.0, 61.0, 108.0, 141.0, 184.0, 252.0, 358.0, 517.0, 785.0, 1182.0, 1575.0, 2409.0, 3644.0, 5951.0, 10285.0, 18709.0, 38426.0, 92283.0, 347492.0, 347247.0, 91732.0, 38689.0, 18732.0, 10064.0, 5970.0, 3805.0, 2417.0, 1686.0, 1098.0, 790.0, 511.0, 389.0, 273.0, 193.0, 124.0, 106.0, 64.0, 42.0, 28.0, 23.0, 26.0, 13.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.145751953125, -0.14119720458984375, -0.1366424560546875, -0.13208770751953125, -0.127532958984375, -0.12297821044921875, -0.1184234619140625, -0.11386871337890625, -0.10931396484375, -0.10475921630859375, -0.1002044677734375, -0.09564971923828125, -0.091094970703125, -0.08654022216796875, -0.0819854736328125, -0.07743072509765625, -0.0728759765625, -0.06832122802734375, -0.0637664794921875, -0.05921173095703125, -0.054656982421875, -0.05010223388671875, -0.0455474853515625, -0.04099273681640625, -0.03643798828125, -0.03188323974609375, -0.0273284912109375, -0.02277374267578125, -0.018218994140625, -0.01366424560546875, -0.0091094970703125, -0.00455474853515625, 0.0, 0.00455474853515625, 0.0091094970703125, 0.01366424560546875, 0.018218994140625, 0.02277374267578125, 0.0273284912109375, 0.03188323974609375, 0.03643798828125, 0.04099273681640625, 0.0455474853515625, 0.05010223388671875, 0.054656982421875, 0.05921173095703125, 0.0637664794921875, 0.06832122802734375, 0.0728759765625, 0.07743072509765625, 0.0819854736328125, 0.08654022216796875, 0.091094970703125, 0.09564971923828125, 0.1002044677734375, 0.10475921630859375, 0.10931396484375, 0.11386871337890625, 0.1184234619140625, 0.12297821044921875, 0.127532958984375, 0.13208770751953125, 0.1366424560546875, 0.14119720458984375, 0.145751953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 0.0, 11.0, 2.0, 8.0, 3.0, 5.0, 12.0, 15.0, 15.0, 26.0, 22.0, 35.0, 35.0, 40.0, 61.0, 69.0, 87.0, 77.0, 88.0, 77.0, 56.0, 49.0, 37.0, 28.0, 23.0, 27.0, 21.0, 10.0, 14.0, 9.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.029510498046875, -0.028545856475830078, -0.027581214904785156, -0.026616573333740234, -0.025651931762695312, -0.02468729019165039, -0.02372264862060547, -0.022758007049560547, -0.021793365478515625, -0.020828723907470703, -0.01986408233642578, -0.01889944076538086, -0.017934799194335938, -0.016970157623291016, -0.016005516052246094, -0.015040874481201172, -0.01407623291015625, -0.013111591339111328, -0.012146949768066406, -0.011182308197021484, -0.010217666625976562, -0.00925302505493164, -0.008288383483886719, -0.007323741912841797, -0.006359100341796875, -0.005394458770751953, -0.004429817199707031, -0.0034651756286621094, -0.0025005340576171875, -0.0015358924865722656, -0.0005712509155273438, 0.0003933906555175781, 0.0013580322265625, 0.002322673797607422, 0.0032873153686523438, 0.004251956939697266, 0.0052165985107421875, 0.006181240081787109, 0.007145881652832031, 0.008110523223876953, 0.009075164794921875, 0.010039806365966797, 0.011004447937011719, 0.01196908950805664, 0.012933731079101562, 0.013898372650146484, 0.014863014221191406, 0.015827655792236328, 0.01679229736328125, 0.017756938934326172, 0.018721580505371094, 0.019686222076416016, 0.020650863647460938, 0.02161550521850586, 0.02258014678955078, 0.023544788360595703, 0.024509429931640625, 0.025474071502685547, 0.02643871307373047, 0.02740335464477539, 0.028367996215820312, 0.029332637786865234, 0.030297279357910156, 0.03126192092895508, 0.0322265625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 7.0, 5.0, 1.0, 5.0, 7.0, 5.0, 13.0, 14.0, 14.0, 23.0, 36.0, 49.0, 57.0, 90.0, 89.0, 112.0, 103.0, 91.0, 60.0, 55.0, 55.0, 27.0, 19.0, 14.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.568750262260437, -1.5293562412261963, -1.4899623394012451, -1.4505683183670044, -1.4111742973327637, -1.3717803955078125, -1.3323863744735718, -1.292992353439331, -1.2535984516143799, -1.2142044305801392, -1.174810528755188, -1.1354165077209473, -1.096022605895996, -1.0566285848617554, -1.0172345638275146, -0.9778406023979187, -0.9384466409683228, -0.8990526795387268, -0.8596587181091309, -0.8202646970748901, -0.7808707356452942, -0.7414767742156982, -0.7020827531814575, -0.6626887917518616, -0.6232948303222656, -0.5839008688926697, -0.5445069074630737, -0.505112886428833, -0.46571892499923706, -0.4263249635696411, -0.3869309723377228, -0.34753698110580444, -0.3081430196762085, -0.26874905824661255, -0.2293550670146942, -0.18996109068393707, -0.15056711435317993, -0.11117313802242279, -0.07177916169166565, -0.032385170459747314, 0.007008790969848633, 0.046402767300605774, 0.08579674363136292, 0.12519071996212006, 0.1645846962928772, 0.20397867262363434, 0.24337264895439148, 0.2827666401863098, 0.32216060161590576, 0.3615545630455017, 0.40094855427742004, 0.4403425455093384, 0.4797365069389343, 0.5191304683685303, 0.558524489402771, 0.5979184508323669, 0.6373124122619629, 0.6767063736915588, 0.7161003351211548, 0.7554943561553955, 0.7948883175849915, 0.8342822790145874, 0.8736763000488281, 0.9130702614784241, 0.95246422290802]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 7.0, 8.0, 9.0, 12.0, 15.0, 16.0, 23.0, 34.0, 23.0, 21.0, 27.0, 29.0, 26.0, 26.0, 29.0, 36.0, 28.0, 29.0, 31.0, 31.0, 43.0, 43.0, 42.0, 37.0, 39.0, 41.0, 29.0, 36.0, 29.0, 38.0, 28.0, 20.0, 23.0, 12.0, 13.0, 13.0, 14.0, 12.0, 8.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7862319946289062, -0.7630535960197449, -0.7398751974105835, -0.7166967988014221, -0.6935184001922607, -0.6703400015830994, -0.647161602973938, -0.6239831447601318, -0.6008048057556152, -0.5776264071464539, -0.5544480085372925, -0.5312696099281311, -0.5080912113189697, -0.48491281270980835, -0.4617343842983246, -0.4385559856891632, -0.41537755727767944, -0.39219915866851807, -0.3690207600593567, -0.3458423614501953, -0.32266396284103394, -0.29948556423187256, -0.2763071358203888, -0.2531287372112274, -0.22995033860206604, -0.20677193999290466, -0.1835935413837433, -0.16041512787342072, -0.13723672926425934, -0.11405833065509796, -0.09087991714477539, -0.06770151853561401, -0.04452311992645264, -0.02134471759200096, 0.0018336847424507141, 0.025012090802192688, 0.048190489411354065, 0.07136888802051544, 0.09454730153083801, 0.11772570013999939, 0.14090409874916077, 0.16408249735832214, 0.18726089596748352, 0.2104393094778061, 0.23361770808696747, 0.25679612159729004, 0.2799745202064514, 0.3031529188156128, 0.32633131742477417, 0.34950971603393555, 0.3726881146430969, 0.3958665132522583, 0.4190449118614197, 0.44222331047058105, 0.4654017388820648, 0.4885801374912262, 0.51175856590271, 0.5349369645118713, 0.5581153631210327, 0.5812937617301941, 0.6044721603393555, 0.6276505589485168, 0.6508289575576782, 0.6740074157714844, 0.697185754776001]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 12.0, 8.0, 9.0, 19.0, 43.0, 53.0, 102.0, 147.0, 210.0, 323.0, 500.0, 761.0, 1186.0, 1987.0, 3005.0, 4805.0, 7594.0, 11969.0, 19644.0, 32658.0, 58061.0, 110111.0, 211809.0, 257041.0, 145588.0, 75432.0, 41340.0, 23886.0, 14730.0, 9435.0, 5875.0, 3720.0, 2367.0, 1524.0, 935.0, 601.0, 379.0, 247.0, 177.0, 107.0, 59.0, 41.0, 30.0, 15.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.373046875, -1.3290557861328125, -1.285064697265625, -1.2410736083984375, -1.19708251953125, -1.1530914306640625, -1.109100341796875, -1.0651092529296875, -1.0211181640625, -0.9771270751953125, -0.933135986328125, -0.8891448974609375, -0.84515380859375, -0.8011627197265625, -0.757171630859375, -0.7131805419921875, -0.669189453125, -0.6251983642578125, -0.581207275390625, -0.5372161865234375, -0.49322509765625, -0.4492340087890625, -0.405242919921875, -0.3612518310546875, -0.3172607421875, -0.2732696533203125, -0.229278564453125, -0.1852874755859375, -0.14129638671875, -0.0973052978515625, -0.053314208984375, -0.0093231201171875, 0.03466796875, 0.0786590576171875, 0.122650146484375, 0.1666412353515625, 0.21063232421875, 0.2546234130859375, 0.298614501953125, 0.3426055908203125, 0.3865966796875, 0.4305877685546875, 0.474578857421875, 0.5185699462890625, 0.56256103515625, 0.6065521240234375, 0.650543212890625, 0.6945343017578125, 0.738525390625, 0.7825164794921875, 0.826507568359375, 0.8704986572265625, 0.91448974609375, 0.9584808349609375, 1.002471923828125, 1.0464630126953125, 1.0904541015625, 1.1344451904296875, 1.178436279296875, 1.2224273681640625, 1.26641845703125, 1.3104095458984375, 1.354400634765625, 1.3983917236328125, 1.4423828125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 5.0, 3.0, 10.0, 20.0, 16.0, 20.0, 28.0, 26.0, 16.0, 26.0, 21.0, 38.0, 27.0, 24.0, 17.0, 38.0, 35.0, 33.0, 31.0, 28.0, 38.0, 44.0, 32.0, 28.0, 31.0, 29.0, 31.0, 34.0, 27.0, 33.0, 29.0, 28.0, 20.0, 26.0, 10.0, 12.0, 18.0, 9.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61279296875, -0.5936203002929688, -0.5744476318359375, -0.5552749633789062, -0.536102294921875, -0.5169296264648438, -0.4977569580078125, -0.47858428955078125, -0.45941162109375, -0.44023895263671875, -0.4210662841796875, -0.40189361572265625, -0.382720947265625, -0.36354827880859375, -0.3443756103515625, -0.32520294189453125, -0.3060302734375, -0.28685760498046875, -0.2676849365234375, -0.24851226806640625, -0.229339599609375, -0.21016693115234375, -0.1909942626953125, -0.17182159423828125, -0.15264892578125, -0.13347625732421875, -0.1143035888671875, -0.09513092041015625, -0.075958251953125, -0.05678558349609375, -0.0376129150390625, -0.01844024658203125, 0.000732421875, 0.01990509033203125, 0.0390777587890625, 0.05825042724609375, 0.077423095703125, 0.09659576416015625, 0.1157684326171875, 0.13494110107421875, 0.15411376953125, 0.17328643798828125, 0.1924591064453125, 0.21163177490234375, 0.230804443359375, 0.24997711181640625, 0.2691497802734375, 0.28832244873046875, 0.3074951171875, 0.32666778564453125, 0.3458404541015625, 0.36501312255859375, 0.384185791015625, 0.40335845947265625, 0.4225311279296875, 0.44170379638671875, 0.46087646484375, 0.48004913330078125, 0.4992218017578125, 0.5183944702148438, 0.537567138671875, 0.5567398071289062, 0.5759124755859375, 0.5950851440429688, 0.6142578125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 13.0, 11.0, 28.0, 42.0, 57.0, 84.0, 137.0, 169.0, 284.0, 367.0, 594.0, 870.0, 1324.0, 2077.0, 3321.0, 5222.0, 8426.0, 13939.0, 23593.0, 41650.0, 77837.0, 153947.0, 286682.0, 202817.0, 99656.0, 52073.0, 29032.0, 17017.0, 10048.0, 6134.0, 3924.0, 2449.0, 1675.0, 1009.0, 661.0, 464.0, 315.0, 180.0, 149.0, 74.0, 58.0, 48.0, 30.0, 22.0, 8.0, 11.0, 7.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.462890625, -1.4181365966796875, -1.373382568359375, -1.3286285400390625, -1.28387451171875, -1.2391204833984375, -1.194366455078125, -1.1496124267578125, -1.1048583984375, -1.0601043701171875, -1.015350341796875, -0.9705963134765625, -0.92584228515625, -0.8810882568359375, -0.836334228515625, -0.7915802001953125, -0.746826171875, -0.7020721435546875, -0.657318115234375, -0.6125640869140625, -0.56781005859375, -0.5230560302734375, -0.478302001953125, -0.4335479736328125, -0.3887939453125, -0.3440399169921875, -0.299285888671875, -0.2545318603515625, -0.20977783203125, -0.1650238037109375, -0.120269775390625, -0.0755157470703125, -0.03076171875, 0.0139923095703125, 0.058746337890625, 0.1035003662109375, 0.14825439453125, 0.1930084228515625, 0.237762451171875, 0.2825164794921875, 0.3272705078125, 0.3720245361328125, 0.416778564453125, 0.4615325927734375, 0.50628662109375, 0.5510406494140625, 0.595794677734375, 0.6405487060546875, 0.685302734375, 0.7300567626953125, 0.774810791015625, 0.8195648193359375, 0.86431884765625, 0.9090728759765625, 0.953826904296875, 0.9985809326171875, 1.0433349609375, 1.0880889892578125, 1.132843017578125, 1.1775970458984375, 1.22235107421875, 1.2671051025390625, 1.311859130859375, 1.3566131591796875, 1.4013671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 5.0, 8.0, 15.0, 10.0, 16.0, 13.0, 20.0, 35.0, 23.0, 26.0, 41.0, 34.0, 39.0, 45.0, 53.0, 45.0, 43.0, 62.0, 47.0, 50.0, 48.0, 38.0, 37.0, 35.0, 39.0, 25.0, 23.0, 25.0, 27.0, 17.0, 17.0, 8.0, 13.0, 8.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4395713806152344, -0.42284393310546875, -0.4061164855957031, -0.3893890380859375, -0.3726615905761719, -0.35593414306640625, -0.3392066955566406, -0.322479248046875, -0.3057518005371094, -0.28902435302734375, -0.2722969055175781, -0.2555694580078125, -0.23884201049804688, -0.22211456298828125, -0.20538711547851562, -0.18865966796875, -0.17193222045898438, -0.15520477294921875, -0.13847732543945312, -0.1217498779296875, -0.10502243041992188, -0.08829498291015625, -0.07156753540039062, -0.054840087890625, -0.038112640380859375, -0.02138519287109375, -0.004657745361328125, 0.0120697021484375, 0.028797149658203125, 0.04552459716796875, 0.062252044677734375, 0.0789794921875, 0.09570693969726562, 0.11243438720703125, 0.12916183471679688, 0.1458892822265625, 0.16261672973632812, 0.17934417724609375, 0.19607162475585938, 0.212799072265625, 0.22952651977539062, 0.24625396728515625, 0.2629814147949219, 0.2797088623046875, 0.2964363098144531, 0.31316375732421875, 0.3298912048339844, 0.34661865234375, 0.3633460998535156, 0.38007354736328125, 0.3968009948730469, 0.4135284423828125, 0.4302558898925781, 0.44698333740234375, 0.4637107849121094, 0.480438232421875, 0.4971656799316406, 0.5138931274414062, 0.5306205749511719, 0.5473480224609375, 0.5640754699707031, 0.5808029174804688, 0.5975303649902344, 0.6142578125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 4.0, 14.0, 28.0, 32.0, 57.0, 76.0, 89.0, 137.0, 213.0, 225.0, 356.0, 531.0, 794.0, 1053.0, 1535.0, 2259.0, 3379.0, 5353.0, 8628.0, 15140.0, 29752.0, 76101.0, 625150.0, 175249.0, 48447.0, 21576.0, 11829.0, 6843.0, 4356.0, 2948.0, 1918.0, 1323.0, 901.0, 662.0, 468.0, 341.0, 216.0, 151.0, 127.0, 98.0, 54.0, 48.0, 30.0, 23.0, 13.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.794921875, -0.7706756591796875, -0.746429443359375, -0.7221832275390625, -0.69793701171875, -0.6736907958984375, -0.649444580078125, -0.6251983642578125, -0.6009521484375, -0.5767059326171875, -0.552459716796875, -0.5282135009765625, -0.50396728515625, -0.4797210693359375, -0.455474853515625, -0.4312286376953125, -0.406982421875, -0.3827362060546875, -0.358489990234375, -0.3342437744140625, -0.30999755859375, -0.2857513427734375, -0.261505126953125, -0.2372589111328125, -0.2130126953125, -0.1887664794921875, -0.164520263671875, -0.1402740478515625, -0.11602783203125, -0.0917816162109375, -0.067535400390625, -0.0432891845703125, -0.01904296875, 0.0052032470703125, 0.029449462890625, 0.0536956787109375, 0.07794189453125, 0.1021881103515625, 0.126434326171875, 0.1506805419921875, 0.1749267578125, 0.1991729736328125, 0.223419189453125, 0.2476654052734375, 0.27191162109375, 0.2961578369140625, 0.320404052734375, 0.3446502685546875, 0.368896484375, 0.3931427001953125, 0.417388916015625, 0.4416351318359375, 0.46588134765625, 0.4901275634765625, 0.514373779296875, 0.5386199951171875, 0.5628662109375, 0.5871124267578125, 0.611358642578125, 0.6356048583984375, 0.65985107421875, 0.6840972900390625, 0.708343505859375, 0.7325897216796875, 0.7568359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 15.0, 17.0, 17.0, 32.0, 37.0, 48.0, 69.0, 152.0, 231.0, 78.0, 60.0, 43.0, 36.0, 30.0, 14.0, 16.0, 13.0, 12.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9073486328125e-05, -1.8417835235595703e-05, -1.7762184143066406e-05, -1.710653305053711e-05, -1.6450881958007812e-05, -1.5795230865478516e-05, -1.5139579772949219e-05, -1.4483928680419922e-05, -1.3828277587890625e-05, -1.3172626495361328e-05, -1.2516975402832031e-05, -1.1861324310302734e-05, -1.1205673217773438e-05, -1.055002212524414e-05, -9.894371032714844e-06, -9.238719940185547e-06, -8.58306884765625e-06, -7.927417755126953e-06, -7.271766662597656e-06, -6.616115570068359e-06, -5.9604644775390625e-06, -5.304813385009766e-06, -4.649162292480469e-06, -3.993511199951172e-06, -3.337860107421875e-06, -2.682209014892578e-06, -2.0265579223632812e-06, -1.3709068298339844e-06, -7.152557373046875e-07, -5.960464477539063e-08, 5.960464477539062e-07, 1.2516975402832031e-06, 1.9073486328125e-06, 2.562999725341797e-06, 3.2186508178710938e-06, 3.874301910400391e-06, 4.5299530029296875e-06, 5.185604095458984e-06, 5.841255187988281e-06, 6.496906280517578e-06, 7.152557373046875e-06, 7.808208465576172e-06, 8.463859558105469e-06, 9.119510650634766e-06, 9.775161743164062e-06, 1.043081283569336e-05, 1.1086463928222656e-05, 1.1742115020751953e-05, 1.239776611328125e-05, 1.3053417205810547e-05, 1.3709068298339844e-05, 1.436471939086914e-05, 1.5020370483398438e-05, 1.5676021575927734e-05, 1.633167266845703e-05, 1.6987323760986328e-05, 1.7642974853515625e-05, 1.8298625946044922e-05, 1.895427703857422e-05, 1.9609928131103516e-05, 2.0265579223632812e-05, 2.092123031616211e-05, 2.1576881408691406e-05, 2.2232532501220703e-05, 2.288818359375e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 7.0, 21.0, 27.0, 35.0, 57.0, 66.0, 92.0, 188.0, 185.0, 338.0, 536.0, 916.0, 1250.0, 2090.0, 3406.0, 5448.0, 9118.0, 16304.0, 33389.0, 97461.0, 678363.0, 118274.0, 37548.0, 18050.0, 9961.0, 5778.0, 3511.0, 2198.0, 1333.0, 866.0, 603.0, 414.0, 197.0, 148.0, 120.0, 94.0, 55.0, 25.0, 23.0, 16.0, 13.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8585433959960938, -0.8313446044921875, -0.8041458129882812, -0.776947021484375, -0.7497482299804688, -0.7225494384765625, -0.6953506469726562, -0.66815185546875, -0.6409530639648438, -0.6137542724609375, -0.5865554809570312, -0.559356689453125, -0.5321578979492188, -0.5049591064453125, -0.47776031494140625, -0.4505615234375, -0.42336273193359375, -0.3961639404296875, -0.36896514892578125, -0.341766357421875, -0.31456756591796875, -0.2873687744140625, -0.26016998291015625, -0.23297119140625, -0.20577239990234375, -0.1785736083984375, -0.15137481689453125, -0.124176025390625, -0.09697723388671875, -0.0697784423828125, -0.04257965087890625, -0.015380859375, 0.01181793212890625, 0.0390167236328125, 0.06621551513671875, 0.093414306640625, 0.12061309814453125, 0.1478118896484375, 0.17501068115234375, 0.20220947265625, 0.22940826416015625, 0.2566070556640625, 0.28380584716796875, 0.311004638671875, 0.33820343017578125, 0.3654022216796875, 0.39260101318359375, 0.4197998046875, 0.44699859619140625, 0.4741973876953125, 0.5013961791992188, 0.528594970703125, 0.5557937622070312, 0.5829925537109375, 0.6101913452148438, 0.63739013671875, 0.6645889282226562, 0.6917877197265625, 0.7189865112304688, 0.746185302734375, 0.7733840942382812, 0.8005828857421875, 0.8277816772460938, 0.85498046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 6.0, 7.0, 6.0, 9.0, 6.0, 17.0, 21.0, 20.0, 23.0, 53.0, 70.0, 75.0, 298.0, 86.0, 56.0, 48.0, 29.0, 18.0, 17.0, 17.0, 14.0, 12.0, 7.0, 15.0, 7.0, 11.0, 6.0, 1.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1964111328125, -0.1897144317626953, -0.18301773071289062, -0.17632102966308594, -0.16962432861328125, -0.16292762756347656, -0.15623092651367188, -0.1495342254638672, -0.1428375244140625, -0.1361408233642578, -0.12944412231445312, -0.12274742126464844, -0.11605072021484375, -0.10935401916503906, -0.10265731811523438, -0.09596061706542969, -0.089263916015625, -0.08256721496582031, -0.07587051391601562, -0.06917381286621094, -0.06247711181640625, -0.05578041076660156, -0.049083709716796875, -0.04238700866699219, -0.0356903076171875, -0.028993606567382812, -0.022296905517578125, -0.015600204467773438, -0.00890350341796875, -0.0022068023681640625, 0.004489898681640625, 0.011186599731445312, 0.01788330078125, 0.024580001831054688, 0.031276702880859375, 0.03797340393066406, 0.04467010498046875, 0.05136680603027344, 0.058063507080078125, 0.06476020812988281, 0.0714569091796875, 0.07815361022949219, 0.08485031127929688, 0.09154701232910156, 0.09824371337890625, 0.10494041442871094, 0.11163711547851562, 0.11833381652832031, 0.125030517578125, 0.1317272186279297, 0.13842391967773438, 0.14512062072753906, 0.15181732177734375, 0.15851402282714844, 0.16521072387695312, 0.1719074249267578, 0.1786041259765625, 0.1853008270263672, 0.19199752807617188, 0.19869422912597656, 0.20539093017578125, 0.21208763122558594, 0.21878433227539062, 0.2254810333251953, 0.232177734375]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 11.0, 11.0, 13.0, 21.0, 26.0, 44.0, 63.0, 94.0, 121.0, 141.0, 110.0, 91.0, 56.0, 40.0, 32.0, 28.0, 22.0, 14.0, 16.0, 12.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.494354248046875, -1.4522393941879272, -1.4101245403289795, -1.3680098056793213, -1.3258949518203735, -1.2837800979614258, -1.241665244102478, -1.1995503902435303, -1.157435655593872, -1.1153208017349243, -1.0732059478759766, -1.0310912132263184, -0.9889763593673706, -0.9468615055084229, -0.9047466516494751, -0.8626317977905273, -0.8205169439315796, -0.7784020900726318, -0.7362872958183289, -0.6941724419593811, -0.6520576477050781, -0.6099427938461304, -0.5678279399871826, -0.5257130861282349, -0.4835982918739319, -0.4414834678173065, -0.39936864376068115, -0.3572537899017334, -0.31513896584510803, -0.27302414178848267, -0.2309092879295349, -0.18879446387290955, -0.14667952060699463, -0.10456468909978867, -0.0624498575925827, -0.020335018634796143, 0.021779805421829224, 0.06389462947845459, 0.10600948333740234, 0.1481243073940277, 0.19023913145065308, 0.23235395550727844, 0.2744687795639038, 0.31658363342285156, 0.35869845747947693, 0.4008132815361023, 0.44292813539505005, 0.4850429594516754, 0.5271577835083008, 0.5692726373672485, 0.6113874316215515, 0.6535022854804993, 0.6956170797348022, 0.73773193359375, 0.7798467874526978, 0.8219616413116455, 0.8640764355659485, 0.9061912894248962, 0.9483060836791992, 0.990420937538147, 1.0325357913970947, 1.074650526046753, 1.1167654991149902, 1.1588802337646484, 1.2009950876235962]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 9.0, 14.0, 9.0, 17.0, 18.0, 10.0, 30.0, 23.0, 19.0, 27.0, 23.0, 31.0, 29.0, 29.0, 25.0, 20.0, 36.0, 44.0, 37.0, 41.0, 43.0, 38.0, 38.0, 28.0, 38.0, 21.0, 32.0, 26.0, 27.0, 28.0, 17.0, 23.0, 18.0, 22.0, 8.0, 10.0, 9.0, 9.0, 10.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.6485298275947571, -0.6287035942077637, -0.6088773608207703, -0.5890511274337769, -0.5692248940467834, -0.54939866065979, -0.5295724272727966, -0.5097461938858032, -0.4899199903011322, -0.4700937569141388, -0.4502675235271454, -0.430441290140152, -0.41061508655548096, -0.39078885316848755, -0.37096261978149414, -0.35113638639450073, -0.3313101530075073, -0.3114839196205139, -0.2916576862335205, -0.2718314528465271, -0.2520052194595337, -0.23217900097370148, -0.21235278248786926, -0.19252654910087585, -0.17270031571388245, -0.15287408232688904, -0.13304784893989563, -0.11322163045406342, -0.09339539706707001, -0.0735691636800766, -0.05374293774366379, -0.03391671180725098, -0.014090538024902344, 0.005735691636800766, 0.025561921298503876, 0.045388150960206985, 0.0652143806219101, 0.0850406140089035, 0.10486683994531631, 0.12469306588172913, 0.14451929926872253, 0.16434553265571594, 0.18417176604270935, 0.20399798452854156, 0.22382421791553497, 0.24365045130252838, 0.2634766697883606, 0.283302903175354, 0.3031291365623474, 0.3229553699493408, 0.34278160333633423, 0.36260783672332764, 0.38243407011032104, 0.40226030349731445, 0.4220865070819855, 0.4419127404689789, 0.4617389738559723, 0.4815652072429657, 0.5013914108276367, 0.5212176442146301, 0.5410438776016235, 0.5608701109886169, 0.5806963443756104, 0.6005225777626038, 0.6203488111495972]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 22.0, 32.0, 47.0, 56.0, 99.0, 151.0, 190.0, 254.0, 360.0, 518.0, 687.0, 1036.0, 1398.0, 2081.0, 2906.0, 4400.0, 6342.0, 9829.0, 15349.0, 24160.0, 40745.0, 70161.0, 128735.0, 265407.0, 798388.0, 1628113.0, 663968.0, 248076.0, 118941.0, 64203.0, 36573.0, 22088.0, 13625.0, 8637.0, 5594.0, 3635.0, 2485.0, 1713.0, 1101.0, 744.0, 519.0, 347.0, 182.0, 134.0, 90.0, 50.0, 33.0, 17.0, 15.0, 8.0, 10.0, 13.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.90185546875, -0.8731536865234375, -0.844451904296875, -0.8157501220703125, -0.78704833984375, -0.7583465576171875, -0.729644775390625, -0.7009429931640625, -0.6722412109375, -0.6435394287109375, -0.614837646484375, -0.5861358642578125, -0.55743408203125, -0.5287322998046875, -0.500030517578125, -0.4713287353515625, -0.442626953125, -0.4139251708984375, -0.385223388671875, -0.3565216064453125, -0.32781982421875, -0.2991180419921875, -0.270416259765625, -0.2417144775390625, -0.2130126953125, -0.1843109130859375, -0.155609130859375, -0.1269073486328125, -0.09820556640625, -0.0695037841796875, -0.040802001953125, -0.0121002197265625, 0.0166015625, 0.0453033447265625, 0.074005126953125, 0.1027069091796875, 0.13140869140625, 0.1601104736328125, 0.188812255859375, 0.2175140380859375, 0.2462158203125, 0.2749176025390625, 0.303619384765625, 0.3323211669921875, 0.36102294921875, 0.3897247314453125, 0.418426513671875, 0.4471282958984375, 0.475830078125, 0.5045318603515625, 0.533233642578125, 0.5619354248046875, 0.59063720703125, 0.6193389892578125, 0.648040771484375, 0.6767425537109375, 0.7054443359375, 0.7341461181640625, 0.762847900390625, 0.7915496826171875, 0.82025146484375, 0.8489532470703125, 0.877655029296875, 0.9063568115234375, 0.93505859375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 13.0, 8.0, 7.0, 6.0, 11.0, 8.0, 15.0, 20.0, 21.0, 24.0, 19.0, 19.0, 26.0, 33.0, 30.0, 27.0, 29.0, 32.0, 33.0, 35.0, 38.0, 39.0, 38.0, 39.0, 35.0, 30.0, 27.0, 34.0, 28.0, 34.0, 20.0, 31.0, 21.0, 19.0, 22.0, 20.0, 16.0, 10.0, 14.0, 6.0, 10.0, 7.0, 7.0, 8.0, 4.0, 1.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.41650390625, -0.40410614013671875, -0.3917083740234375, -0.37931060791015625, -0.366912841796875, -0.35451507568359375, -0.3421173095703125, -0.32971954345703125, -0.31732177734375, -0.30492401123046875, -0.2925262451171875, -0.28012847900390625, -0.267730712890625, -0.25533294677734375, -0.2429351806640625, -0.23053741455078125, -0.2181396484375, -0.20574188232421875, -0.1933441162109375, -0.18094635009765625, -0.168548583984375, -0.15615081787109375, -0.1437530517578125, -0.13135528564453125, -0.11895751953125, -0.10655975341796875, -0.0941619873046875, -0.08176422119140625, -0.069366455078125, -0.05696868896484375, -0.0445709228515625, -0.03217315673828125, -0.019775390625, -0.00737762451171875, 0.0050201416015625, 0.01741790771484375, 0.029815673828125, 0.04221343994140625, 0.0546112060546875, 0.06700897216796875, 0.07940673828125, 0.09180450439453125, 0.1042022705078125, 0.11660003662109375, 0.128997802734375, 0.14139556884765625, 0.1537933349609375, 0.16619110107421875, 0.1785888671875, 0.19098663330078125, 0.2033843994140625, 0.21578216552734375, 0.228179931640625, 0.24057769775390625, 0.2529754638671875, 0.26537322998046875, 0.27777099609375, 0.29016876220703125, 0.3025665283203125, 0.31496429443359375, 0.327362060546875, 0.33975982666015625, 0.3521575927734375, 0.36455535888671875, 0.376953125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 13.0, 18.0, 25.0, 46.0, 60.0, 97.0, 137.0, 193.0, 304.0, 438.0, 683.0, 1071.0, 1493.0, 2395.0, 3457.0, 5415.0, 8223.0, 12932.0, 20387.0, 33247.0, 54705.0, 94647.0, 173684.0, 351813.0, 827249.0, 1363628.0, 615552.0, 276198.0, 141800.0, 79676.0, 46643.0, 28201.0, 17712.0, 11090.0, 7097.0, 4769.0, 3104.0, 2023.0, 1329.0, 899.0, 620.0, 395.0, 274.0, 151.0, 125.0, 87.0, 57.0, 45.0, 24.0, 19.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.74365234375, -0.7206573486328125, -0.697662353515625, -0.6746673583984375, -0.65167236328125, -0.6286773681640625, -0.605682373046875, -0.5826873779296875, -0.5596923828125, -0.5366973876953125, -0.513702392578125, -0.4907073974609375, -0.46771240234375, -0.4447174072265625, -0.421722412109375, -0.3987274169921875, -0.375732421875, -0.3527374267578125, -0.329742431640625, -0.3067474365234375, -0.28375244140625, -0.2607574462890625, -0.237762451171875, -0.2147674560546875, -0.1917724609375, -0.1687774658203125, -0.145782470703125, -0.1227874755859375, -0.09979248046875, -0.0767974853515625, -0.053802490234375, -0.0308074951171875, -0.0078125, 0.0151824951171875, 0.038177490234375, 0.0611724853515625, 0.08416748046875, 0.1071624755859375, 0.130157470703125, 0.1531524658203125, 0.1761474609375, 0.1991424560546875, 0.222137451171875, 0.2451324462890625, 0.26812744140625, 0.2911224365234375, 0.314117431640625, 0.3371124267578125, 0.360107421875, 0.3831024169921875, 0.406097412109375, 0.4290924072265625, 0.45208740234375, 0.4750823974609375, 0.498077392578125, 0.5210723876953125, 0.5440673828125, 0.5670623779296875, 0.590057373046875, 0.6130523681640625, 0.63604736328125, 0.6590423583984375, 0.682037353515625, 0.7050323486328125, 0.72802734375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 16.0, 22.0, 18.0, 26.0, 30.0, 40.0, 53.0, 76.0, 62.0, 102.0, 106.0, 106.0, 145.0, 181.0, 201.0, 217.0, 238.0, 271.0, 252.0, 259.0, 220.0, 219.0, 206.0, 182.0, 149.0, 134.0, 107.0, 89.0, 67.0, 46.0, 55.0, 33.0, 41.0, 18.0, 18.0, 16.0, 10.0, 2.0, 11.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.249481201171875, -0.24188232421875, -0.234283447265625, -0.2266845703125, -0.219085693359375, -0.21148681640625, -0.203887939453125, -0.1962890625, -0.188690185546875, -0.18109130859375, -0.173492431640625, -0.1658935546875, -0.158294677734375, -0.15069580078125, -0.143096923828125, -0.135498046875, -0.127899169921875, -0.12030029296875, -0.112701416015625, -0.1051025390625, -0.097503662109375, -0.08990478515625, -0.082305908203125, -0.07470703125, -0.067108154296875, -0.05950927734375, -0.051910400390625, -0.0443115234375, -0.036712646484375, -0.02911376953125, -0.021514892578125, -0.013916015625, -0.006317138671875, 0.00128173828125, 0.008880615234375, 0.0164794921875, 0.024078369140625, 0.03167724609375, 0.039276123046875, 0.046875, 0.054473876953125, 0.06207275390625, 0.069671630859375, 0.0772705078125, 0.084869384765625, 0.09246826171875, 0.100067138671875, 0.107666015625, 0.115264892578125, 0.12286376953125, 0.130462646484375, 0.1380615234375, 0.145660400390625, 0.15325927734375, 0.160858154296875, 0.16845703125, 0.176055908203125, 0.18365478515625, 0.191253662109375, 0.1988525390625, 0.206451416015625, 0.21405029296875, 0.221649169921875, 0.229248046875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 8.0, 15.0, 17.0, 17.0, 15.0, 35.0, 53.0, 52.0, 94.0, 114.0, 126.0, 116.0, 88.0, 49.0, 52.0, 32.0, 21.0, 16.0, 24.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9037691950798035, -0.8759884238243103, -0.8482075929641724, -0.8204268217086792, -0.792646050453186, -0.7648652791976929, -0.7370844483375549, -0.7093036770820618, -0.6815229058265686, -0.6537421345710754, -0.6259613037109375, -0.5981805324554443, -0.5703997611999512, -0.542618989944458, -0.5148381590843201, -0.4870573878288269, -0.45927658677101135, -0.4314957857131958, -0.40371501445770264, -0.3759342133998871, -0.3481534421443939, -0.32037264108657837, -0.2925918698310852, -0.26481106877326965, -0.2370302826166153, -0.20924949645996094, -0.18146871030330658, -0.15368792414665222, -0.12590712308883667, -0.09812633693218231, -0.07034555077552795, -0.042564764618873596, -0.014783978462219238, 0.012996809557080269, 0.040777597576379776, 0.06855838745832443, 0.09633917361497879, 0.12411996722221375, 0.1519007533788681, 0.17968153953552246, 0.20746232569217682, 0.23524311184883118, 0.26302391290664673, 0.2908046841621399, 0.31858548521995544, 0.346366286277771, 0.37414705753326416, 0.4019278287887573, 0.4297086298465729, 0.4574894309043884, 0.4852702021598816, 0.5130509734153748, 0.5408318042755127, 0.5686125755310059, 0.596393346786499, 0.6241741180419922, 0.6519549489021301, 0.6797357201576233, 0.7075165510177612, 0.7352973222732544, 0.7630780935287476, 0.7908588647842407, 0.8186396956443787, 0.8464204668998718, 0.874201238155365]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 7.0, 11.0, 10.0, 7.0, 9.0, 16.0, 14.0, 18.0, 17.0, 17.0, 23.0, 24.0, 32.0, 21.0, 28.0, 43.0, 33.0, 35.0, 40.0, 45.0, 49.0, 43.0, 29.0, 32.0, 37.0, 31.0, 27.0, 26.0, 38.0, 28.0, 14.0, 26.0, 29.0, 23.0, 18.0, 19.0, 12.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5099623799324036, -0.49492689967155457, -0.4798913896083832, -0.4648559093475342, -0.4498203992843628, -0.4347849190235138, -0.4197494387626648, -0.4047139286994934, -0.389678418636322, -0.374642938375473, -0.35960742831230164, -0.34457194805145264, -0.32953643798828125, -0.31450095772743225, -0.29946547746658325, -0.28442996740341187, -0.26939448714256287, -0.25435900688171387, -0.23932349681854248, -0.22428801655769348, -0.2092525064945221, -0.1942170262336731, -0.1791815310716629, -0.1641460359096527, -0.14911054074764252, -0.13407504558563232, -0.11903955042362213, -0.10400406271219254, -0.08896856755018234, -0.07393307238817215, -0.058897584676742554, -0.04386208951473236, -0.028826594352722168, -0.013791101053357124, 0.0012443922460079193, 0.016279883682727814, 0.03131537884473801, 0.0463508740067482, 0.061386361718177795, 0.07642185688018799, 0.09145735204219818, 0.10649284720420837, 0.12152834236621857, 0.13656383752822876, 0.15159931778907776, 0.16663482785224915, 0.18167030811309814, 0.19670580327510834, 0.21174129843711853, 0.22677679359912872, 0.24181228876113892, 0.2568477690219879, 0.2718832790851593, 0.2869187593460083, 0.3019542694091797, 0.3169897496700287, 0.3320252299308777, 0.3470607101917267, 0.36209622025489807, 0.37713170051574707, 0.39216721057891846, 0.40720269083976746, 0.42223817110061646, 0.43727368116378784, 0.45230919122695923]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 16.0, 13.0, 27.0, 31.0, 45.0, 80.0, 117.0, 147.0, 220.0, 303.0, 496.0, 813.0, 1238.0, 1976.0, 3070.0, 4990.0, 8050.0, 13453.0, 23030.0, 42114.0, 83780.0, 200446.0, 362019.0, 149823.0, 67425.0, 35020.0, 19610.0, 11529.0, 6769.0, 4386.0, 2655.0, 1668.0, 1099.0, 685.0, 491.0, 299.0, 204.0, 126.0, 73.0, 56.0, 48.0, 33.0, 21.0, 16.0, 9.0, 10.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4130859375, -0.39947509765625, -0.3858642578125, -0.37225341796875, -0.358642578125, -0.34503173828125, -0.3314208984375, -0.31781005859375, -0.30419921875, -0.29058837890625, -0.2769775390625, -0.26336669921875, -0.249755859375, -0.23614501953125, -0.2225341796875, -0.20892333984375, -0.1953125, -0.18170166015625, -0.1680908203125, -0.15447998046875, -0.140869140625, -0.12725830078125, -0.1136474609375, -0.10003662109375, -0.08642578125, -0.07281494140625, -0.0592041015625, -0.04559326171875, -0.031982421875, -0.01837158203125, -0.0047607421875, 0.00885009765625, 0.0224609375, 0.03607177734375, 0.0496826171875, 0.06329345703125, 0.076904296875, 0.09051513671875, 0.1041259765625, 0.11773681640625, 0.13134765625, 0.14495849609375, 0.1585693359375, 0.17218017578125, 0.185791015625, 0.19940185546875, 0.2130126953125, 0.22662353515625, 0.240234375, 0.25384521484375, 0.2674560546875, 0.28106689453125, 0.294677734375, 0.30828857421875, 0.3218994140625, 0.33551025390625, 0.34912109375, 0.36273193359375, 0.3763427734375, 0.38995361328125, 0.403564453125, 0.41717529296875, 0.4307861328125, 0.44439697265625, 0.4580078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 5.0, 9.0, 12.0, 6.0, 6.0, 8.0, 13.0, 18.0, 15.0, 20.0, 21.0, 28.0, 29.0, 40.0, 25.0, 31.0, 36.0, 35.0, 48.0, 46.0, 48.0, 39.0, 36.0, 35.0, 38.0, 28.0, 34.0, 38.0, 27.0, 29.0, 19.0, 24.0, 25.0, 23.0, 20.0, 14.0, 14.0, 8.0, 13.0, 9.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.56591796875, -0.5498428344726562, -0.5337677001953125, -0.5176925659179688, -0.501617431640625, -0.48554229736328125, -0.4694671630859375, -0.45339202880859375, -0.43731689453125, -0.42124176025390625, -0.4051666259765625, -0.38909149169921875, -0.373016357421875, -0.35694122314453125, -0.3408660888671875, -0.32479095458984375, -0.3087158203125, -0.29264068603515625, -0.2765655517578125, -0.26049041748046875, -0.244415283203125, -0.22834014892578125, -0.2122650146484375, -0.19618988037109375, -0.18011474609375, -0.16403961181640625, -0.1479644775390625, -0.13188934326171875, -0.115814208984375, -0.09973907470703125, -0.0836639404296875, -0.06758880615234375, -0.051513671875, -0.03543853759765625, -0.0193634033203125, -0.00328826904296875, 0.012786865234375, 0.02886199951171875, 0.0449371337890625, 0.06101226806640625, 0.07708740234375, 0.09316253662109375, 0.1092376708984375, 0.12531280517578125, 0.141387939453125, 0.15746307373046875, 0.1735382080078125, 0.18961334228515625, 0.2056884765625, 0.22176361083984375, 0.2378387451171875, 0.25391387939453125, 0.269989013671875, 0.28606414794921875, 0.3021392822265625, 0.31821441650390625, 0.33428955078125, 0.35036468505859375, 0.3664398193359375, 0.38251495361328125, 0.398590087890625, 0.41466522216796875, 0.4307403564453125, 0.44681549072265625, 0.462890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 8.0, 9.0, 20.0, 25.0, 39.0, 58.0, 67.0, 104.0, 141.0, 187.0, 293.0, 398.0, 579.0, 876.0, 1195.0, 1774.0, 2697.0, 4315.0, 7242.0, 13099.0, 28314.0, 93432.0, 673731.0, 146395.0, 35380.0, 15710.0, 8262.0, 4924.0, 3043.0, 1875.0, 1304.0, 914.0, 602.0, 457.0, 331.0, 200.0, 151.0, 122.0, 87.0, 51.0, 35.0, 33.0, 20.0, 19.0, 10.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.71533203125, -0.6940536499023438, -0.6727752685546875, -0.6514968872070312, -0.630218505859375, -0.6089401245117188, -0.5876617431640625, -0.5663833618164062, -0.54510498046875, -0.5238265991210938, -0.5025482177734375, -0.48126983642578125, -0.459991455078125, -0.43871307373046875, -0.4174346923828125, -0.39615631103515625, -0.3748779296875, -0.35359954833984375, -0.3323211669921875, -0.31104278564453125, -0.289764404296875, -0.26848602294921875, -0.2472076416015625, -0.22592926025390625, -0.20465087890625, -0.18337249755859375, -0.1620941162109375, -0.14081573486328125, -0.119537353515625, -0.09825897216796875, -0.0769805908203125, -0.05570220947265625, -0.034423828125, -0.01314544677734375, 0.0081329345703125, 0.02941131591796875, 0.050689697265625, 0.07196807861328125, 0.0932464599609375, 0.11452484130859375, 0.13580322265625, 0.15708160400390625, 0.1783599853515625, 0.19963836669921875, 0.220916748046875, 0.24219512939453125, 0.2634735107421875, 0.28475189208984375, 0.3060302734375, 0.32730865478515625, 0.3485870361328125, 0.36986541748046875, 0.391143798828125, 0.41242218017578125, 0.4337005615234375, 0.45497894287109375, 0.47625732421875, 0.49753570556640625, 0.5188140869140625, 0.5400924682617188, 0.561370849609375, 0.5826492309570312, 0.6039276123046875, 0.6252059936523438, 0.646484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 8.0, 4.0, 7.0, 16.0, 18.0, 11.0, 15.0, 21.0, 22.0, 33.0, 24.0, 15.0, 30.0, 38.0, 40.0, 42.0, 34.0, 40.0, 26.0, 43.0, 31.0, 44.0, 53.0, 40.0, 40.0, 35.0, 34.0, 33.0, 27.0, 19.0, 20.0, 16.0, 23.0, 9.0, 18.0, 14.0, 11.0, 7.0, 7.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.34375, -0.3334503173828125, -0.323150634765625, -0.3128509521484375, -0.30255126953125, -0.2922515869140625, -0.281951904296875, -0.2716522216796875, -0.2613525390625, -0.2510528564453125, -0.240753173828125, -0.2304534912109375, -0.22015380859375, -0.2098541259765625, -0.199554443359375, -0.1892547607421875, -0.178955078125, -0.1686553955078125, -0.158355712890625, -0.1480560302734375, -0.13775634765625, -0.1274566650390625, -0.117156982421875, -0.1068572998046875, -0.0965576171875, -0.0862579345703125, -0.075958251953125, -0.0656585693359375, -0.05535888671875, -0.0450592041015625, -0.034759521484375, -0.0244598388671875, -0.01416015625, -0.0038604736328125, 0.006439208984375, 0.0167388916015625, 0.02703857421875, 0.0373382568359375, 0.047637939453125, 0.0579376220703125, 0.0682373046875, 0.0785369873046875, 0.088836669921875, 0.0991363525390625, 0.10943603515625, 0.1197357177734375, 0.130035400390625, 0.1403350830078125, 0.150634765625, 0.1609344482421875, 0.171234130859375, 0.1815338134765625, 0.19183349609375, 0.2021331787109375, 0.212432861328125, 0.2227325439453125, 0.2330322265625, 0.2433319091796875, 0.253631591796875, 0.2639312744140625, 0.27423095703125, 0.2845306396484375, 0.294830322265625, 0.3051300048828125, 0.3154296875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 14.0, 25.0, 28.0, 38.0, 53.0, 74.0, 119.0, 132.0, 172.0, 256.0, 367.0, 486.0, 691.0, 917.0, 1302.0, 2010.0, 3162.0, 5065.0, 9110.0, 17871.0, 40556.0, 126376.0, 635452.0, 123087.0, 39370.0, 17708.0, 9089.0, 5217.0, 3189.0, 2072.0, 1297.0, 908.0, 607.0, 470.0, 354.0, 233.0, 193.0, 125.0, 89.0, 77.0, 54.0, 35.0, 22.0, 20.0, 13.0, 7.0, 9.0, 3.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.08941650390625, -0.08648395538330078, -0.08355140686035156, -0.08061885833740234, -0.07768630981445312, -0.0747537612915039, -0.07182121276855469, -0.06888866424560547, -0.06595611572265625, -0.06302356719970703, -0.06009101867675781, -0.057158470153808594, -0.054225921630859375, -0.051293373107910156, -0.04836082458496094, -0.04542827606201172, -0.0424957275390625, -0.03956317901611328, -0.03663063049316406, -0.033698081970214844, -0.030765533447265625, -0.027832984924316406, -0.024900436401367188, -0.02196788787841797, -0.01903533935546875, -0.01610279083251953, -0.013170242309570312, -0.010237693786621094, -0.007305145263671875, -0.004372596740722656, -0.0014400482177734375, 0.0014925003051757812, 0.004425048828125, 0.007357597351074219, 0.010290145874023438, 0.013222694396972656, 0.016155242919921875, 0.019087791442871094, 0.022020339965820312, 0.02495288848876953, 0.02788543701171875, 0.03081798553466797, 0.03375053405761719, 0.036683082580566406, 0.039615631103515625, 0.042548179626464844, 0.04548072814941406, 0.04841327667236328, 0.0513458251953125, 0.05427837371826172, 0.05721092224121094, 0.060143470764160156, 0.06307601928710938, 0.0660085678100586, 0.06894111633300781, 0.07187366485595703, 0.07480621337890625, 0.07773876190185547, 0.08067131042480469, 0.0836038589477539, 0.08653640747070312, 0.08946895599365234, 0.09240150451660156, 0.09533405303955078, 0.0982666015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 9.0, 8.0, 17.0, 6.0, 16.0, 20.0, 22.0, 27.0, 22.0, 37.0, 83.0, 64.0, 68.0, 66.0, 141.0, 83.0, 51.0, 54.0, 36.0, 42.0, 19.0, 18.0, 18.0, 14.0, 11.0, 7.0, 6.0, 4.0, 6.0, 0.0, 0.0, 0.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.76837158203125e-06, -4.636123776435852e-06, -4.503875970840454e-06, -4.371628165245056e-06, -4.239380359649658e-06, -4.10713255405426e-06, -3.974884748458862e-06, -3.842636942863464e-06, -3.7103891372680664e-06, -3.5781413316726685e-06, -3.4458935260772705e-06, -3.3136457204818726e-06, -3.1813979148864746e-06, -3.0491501092910767e-06, -2.9169023036956787e-06, -2.7846544981002808e-06, -2.652406692504883e-06, -2.520158886909485e-06, -2.387911081314087e-06, -2.255663275718689e-06, -2.123415470123291e-06, -1.991167664527893e-06, -1.8589198589324951e-06, -1.7266720533370972e-06, -1.5944242477416992e-06, -1.4621764421463013e-06, -1.3299286365509033e-06, -1.1976808309555054e-06, -1.0654330253601074e-06, -9.331852197647095e-07, -8.009374141693115e-07, -6.686896085739136e-07, -5.364418029785156e-07, -4.041939973831177e-07, -2.7194619178771973e-07, -1.3969838619232178e-07, -7.450580596923828e-09, 1.2479722499847412e-07, 2.5704503059387207e-07, 3.8929283618927e-07, 5.21540641784668e-07, 6.537884473800659e-07, 7.860362529754639e-07, 9.182840585708618e-07, 1.0505318641662598e-06, 1.1827796697616577e-06, 1.3150274753570557e-06, 1.4472752809524536e-06, 1.5795230865478516e-06, 1.7117708921432495e-06, 1.8440186977386475e-06, 1.9762665033340454e-06, 2.1085143089294434e-06, 2.2407621145248413e-06, 2.3730099201202393e-06, 2.505257725715637e-06, 2.637505531311035e-06, 2.769753336906433e-06, 2.902001142501831e-06, 3.034248948097229e-06, 3.166496753692627e-06, 3.298744559288025e-06, 3.430992364883423e-06, 3.563240170478821e-06, 3.6954879760742188e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 11.0, 10.0, 22.0, 43.0, 43.0, 57.0, 86.0, 143.0, 216.0, 388.0, 597.0, 885.0, 1475.0, 2472.0, 4073.0, 7176.0, 12653.0, 23852.0, 49382.0, 119409.0, 435768.0, 233603.0, 78666.0, 35698.0, 17996.0, 9776.0, 5616.0, 3267.0, 1892.0, 1201.0, 773.0, 459.0, 303.0, 188.0, 116.0, 76.0, 37.0, 44.0, 42.0, 20.0, 9.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08151912689208984, -0.07887077331542969, -0.07622241973876953, -0.07357406616210938, -0.07092571258544922, -0.06827735900878906, -0.0656290054321289, -0.06298065185546875, -0.060332298278808594, -0.05768394470214844, -0.05503559112548828, -0.052387237548828125, -0.04973888397216797, -0.04709053039550781, -0.044442176818847656, -0.0417938232421875, -0.039145469665527344, -0.03649711608886719, -0.03384876251220703, -0.031200408935546875, -0.02855205535888672, -0.025903701782226562, -0.023255348205566406, -0.02060699462890625, -0.017958641052246094, -0.015310287475585938, -0.012661933898925781, -0.010013580322265625, -0.007365226745605469, -0.0047168731689453125, -0.0020685195922851562, 0.000579833984375, 0.0032281875610351562, 0.0058765411376953125, 0.008524894714355469, 0.011173248291015625, 0.013821601867675781, 0.016469955444335938, 0.019118309020996094, 0.02176666259765625, 0.024415016174316406, 0.027063369750976562, 0.02971172332763672, 0.032360076904296875, 0.03500843048095703, 0.03765678405761719, 0.040305137634277344, 0.0429534912109375, 0.045601844787597656, 0.04825019836425781, 0.05089855194091797, 0.053546905517578125, 0.05619525909423828, 0.05884361267089844, 0.061491966247558594, 0.06414031982421875, 0.0667886734008789, 0.06943702697753906, 0.07208538055419922, 0.07473373413085938, 0.07738208770751953, 0.08003044128417969, 0.08267879486083984, 0.0853271484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 12.0, 6.0, 19.0, 17.0, 26.0, 27.0, 30.0, 50.0, 64.0, 107.0, 168.0, 146.0, 82.0, 61.0, 34.0, 30.0, 20.0, 10.0, 15.0, 11.0, 17.0, 4.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0394287109375, -0.038153648376464844, -0.03687858581542969, -0.03560352325439453, -0.034328460693359375, -0.03305339813232422, -0.03177833557128906, -0.030503273010253906, -0.02922821044921875, -0.027953147888183594, -0.026678085327148438, -0.02540302276611328, -0.024127960205078125, -0.02285289764404297, -0.021577835083007812, -0.020302772521972656, -0.0190277099609375, -0.017752647399902344, -0.016477584838867188, -0.015202522277832031, -0.013927459716796875, -0.012652397155761719, -0.011377334594726562, -0.010102272033691406, -0.00882720947265625, -0.007552146911621094, -0.0062770843505859375, -0.005002021789550781, -0.003726959228515625, -0.0024518966674804688, -0.0011768341064453125, 9.822845458984375e-05, 0.001373291015625, 0.0026483535766601562, 0.0039234161376953125, 0.005198478698730469, 0.006473541259765625, 0.007748603820800781, 0.009023666381835938, 0.010298728942871094, 0.01157379150390625, 0.012848854064941406, 0.014123916625976562, 0.015398979187011719, 0.016674041748046875, 0.01794910430908203, 0.019224166870117188, 0.020499229431152344, 0.0217742919921875, 0.023049354553222656, 0.024324417114257812, 0.02559947967529297, 0.026874542236328125, 0.02814960479736328, 0.029424667358398438, 0.030699729919433594, 0.03197479248046875, 0.033249855041503906, 0.03452491760253906, 0.03579998016357422, 0.037075042724609375, 0.03835010528564453, 0.03962516784667969, 0.040900230407714844, 0.04217529296875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 6.0, 11.0, 12.0, 17.0, 16.0, 12.0, 30.0, 33.0, 50.0, 47.0, 101.0, 124.0, 113.0, 125.0, 77.0, 52.0, 39.0, 34.0, 18.0, 26.0, 15.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8401376008987427, -0.813301146030426, -0.7864646911621094, -0.759628176689148, -0.7327917218208313, -0.7059552669525146, -0.6791187524795532, -0.6522822976112366, -0.6254458427429199, -0.5986093878746033, -0.5717729330062866, -0.5449364185333252, -0.5180999636650085, -0.4912635087966919, -0.46442702412605286, -0.4375905394554138, -0.41075408458709717, -0.3839176297187805, -0.3570811450481415, -0.33024466037750244, -0.3034082055091858, -0.27657175064086914, -0.2497352659702301, -0.22289879620075226, -0.19606232643127441, -0.16922585666179657, -0.14238938689231873, -0.11555291712284088, -0.08871644735336304, -0.06187997758388519, -0.03504350781440735, -0.008207038044929504, 0.018629491329193115, 0.04546596109867096, 0.0723024308681488, 0.09913890063762665, 0.1259753704071045, 0.15281184017658234, 0.17964830994606018, 0.20648477971553802, 0.23332124948501587, 0.2601577043533325, 0.28699418902397156, 0.3138306736946106, 0.34066712856292725, 0.3675035834312439, 0.39434006810188293, 0.421176552772522, 0.4480130076408386, 0.4748494625091553, 0.5016859769821167, 0.5285224318504333, 0.55535888671875, 0.5821953415870667, 0.6090317964553833, 0.6358683109283447, 0.6627047657966614, 0.689541220664978, 0.7163777351379395, 0.7432141900062561, 0.7700506448745728, 0.7968870997428894, 0.823723554611206, 0.8505600690841675, 0.8773965239524841]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 3.0, 9.0, 9.0, 12.0, 8.0, 6.0, 16.0, 16.0, 17.0, 9.0, 18.0, 25.0, 25.0, 22.0, 29.0, 26.0, 34.0, 38.0, 36.0, 39.0, 41.0, 49.0, 44.0, 35.0, 34.0, 30.0, 35.0, 28.0, 28.0, 36.0, 26.0, 27.0, 19.0, 29.0, 28.0, 21.0, 16.0, 13.0, 13.0, 10.0, 13.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5082613229751587, -0.4933927655220032, -0.47852417826652527, -0.46365562081336975, -0.44878706336021423, -0.43391847610473633, -0.4190499186515808, -0.4041813611984253, -0.3893127739429474, -0.37444421648979187, -0.35957562923431396, -0.34470707178115845, -0.32983851432800293, -0.314969927072525, -0.3001013696193695, -0.2852327823638916, -0.2703642249107361, -0.25549566745758057, -0.24062709510326385, -0.22575852274894714, -0.21088995039463043, -0.19602137804031372, -0.1811528205871582, -0.1662842482328415, -0.15141570568084717, -0.13654713332653046, -0.12167856842279434, -0.10681000351905823, -0.09194143116474152, -0.0770728662610054, -0.06220430135726929, -0.047335729002952576, -0.032467156648635864, -0.01759858801960945, -0.0027300212532281876, 0.012138545513153076, 0.02700711414217949, 0.0418756827712059, 0.05674424767494202, 0.07161282002925873, 0.08648138493299484, 0.10134994983673096, 0.11621852219104767, 0.13108709454536438, 0.1459556519985199, 0.1608242243528366, 0.17569279670715332, 0.19056135416030884, 0.20542992651462555, 0.22029849886894226, 0.23516705632209778, 0.2500356435775757, 0.2649042010307312, 0.2797727584838867, 0.29464131593704224, 0.30950990319252014, 0.32437846064567566, 0.3392470180988312, 0.3541156053543091, 0.3689841628074646, 0.3838527202606201, 0.398721307516098, 0.41358986496925354, 0.42845845222473145, 0.44332700967788696]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 8.0, 11.0, 9.0, 28.0, 43.0, 74.0, 77.0, 126.0, 192.0, 279.0, 396.0, 538.0, 814.0, 1222.0, 1755.0, 2700.0, 4101.0, 6248.0, 9708.0, 15649.0, 25860.0, 42874.0, 73726.0, 132146.0, 236596.0, 211744.0, 115428.0, 65353.0, 38337.0, 22877.0, 14037.0, 8887.0, 5596.0, 3633.0, 2417.0, 1542.0, 1065.0, 789.0, 505.0, 331.0, 250.0, 188.0, 114.0, 92.0, 65.0, 36.0, 30.0, 13.0, 12.0, 12.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.82666015625, -0.799896240234375, -0.77313232421875, -0.746368408203125, -0.7196044921875, -0.692840576171875, -0.66607666015625, -0.639312744140625, -0.612548828125, -0.585784912109375, -0.55902099609375, -0.532257080078125, -0.5054931640625, -0.478729248046875, -0.45196533203125, -0.425201416015625, -0.3984375, -0.371673583984375, -0.34490966796875, -0.318145751953125, -0.2913818359375, -0.264617919921875, -0.23785400390625, -0.211090087890625, -0.184326171875, -0.157562255859375, -0.13079833984375, -0.104034423828125, -0.0772705078125, -0.050506591796875, -0.02374267578125, 0.003021240234375, 0.02978515625, 0.056549072265625, 0.08331298828125, 0.110076904296875, 0.1368408203125, 0.163604736328125, 0.19036865234375, 0.217132568359375, 0.243896484375, 0.270660400390625, 0.29742431640625, 0.324188232421875, 0.3509521484375, 0.377716064453125, 0.40447998046875, 0.431243896484375, 0.4580078125, 0.484771728515625, 0.51153564453125, 0.538299560546875, 0.5650634765625, 0.591827392578125, 0.61859130859375, 0.645355224609375, 0.672119140625, 0.698883056640625, 0.72564697265625, 0.752410888671875, 0.7791748046875, 0.805938720703125, 0.83270263671875, 0.859466552734375, 0.88623046875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 10.0, 5.0, 6.0, 4.0, 5.0, 7.0, 8.0, 11.0, 10.0, 13.0, 23.0, 18.0, 29.0, 16.0, 30.0, 30.0, 17.0, 26.0, 46.0, 39.0, 31.0, 34.0, 40.0, 42.0, 34.0, 36.0, 32.0, 39.0, 35.0, 34.0, 30.0, 28.0, 27.0, 20.0, 26.0, 21.0, 29.0, 21.0, 9.0, 13.0, 14.0, 13.0, 9.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.46435546875, -0.45098114013671875, -0.4376068115234375, -0.42423248291015625, -0.410858154296875, -0.39748382568359375, -0.3841094970703125, -0.37073516845703125, -0.35736083984375, -0.34398651123046875, -0.3306121826171875, -0.31723785400390625, -0.303863525390625, -0.29048919677734375, -0.2771148681640625, -0.26374053955078125, -0.2503662109375, -0.23699188232421875, -0.2236175537109375, -0.21024322509765625, -0.196868896484375, -0.18349456787109375, -0.1701202392578125, -0.15674591064453125, -0.14337158203125, -0.12999725341796875, -0.1166229248046875, -0.10324859619140625, -0.089874267578125, -0.07649993896484375, -0.0631256103515625, -0.04975128173828125, -0.036376953125, -0.02300262451171875, -0.0096282958984375, 0.00374603271484375, 0.017120361328125, 0.03049468994140625, 0.0438690185546875, 0.05724334716796875, 0.07061767578125, 0.08399200439453125, 0.0973663330078125, 0.11074066162109375, 0.124114990234375, 0.13748931884765625, 0.1508636474609375, 0.16423797607421875, 0.1776123046875, 0.19098663330078125, 0.2043609619140625, 0.21773529052734375, 0.231109619140625, 0.24448394775390625, 0.2578582763671875, 0.27123260498046875, 0.28460693359375, 0.29798126220703125, 0.3113555908203125, 0.32472991943359375, 0.338104248046875, 0.35147857666015625, 0.3648529052734375, 0.37822723388671875, 0.3916015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 13.0, 25.0, 33.0, 45.0, 78.0, 86.0, 108.0, 197.0, 283.0, 412.0, 617.0, 913.0, 1380.0, 2164.0, 3230.0, 5181.0, 8467.0, 13840.0, 23543.0, 41154.0, 74667.0, 145128.0, 279377.0, 210091.0, 103737.0, 55347.0, 30890.0, 18119.0, 10894.0, 6611.0, 4145.0, 2619.0, 1744.0, 1090.0, 716.0, 490.0, 338.0, 250.0, 165.0, 111.0, 85.0, 43.0, 34.0, 31.0, 20.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8564682006835938, -0.8276824951171875, -0.7988967895507812, -0.770111083984375, -0.7413253784179688, -0.7125396728515625, -0.6837539672851562, -0.65496826171875, -0.6261825561523438, -0.5973968505859375, -0.5686111450195312, -0.539825439453125, -0.5110397338867188, -0.4822540283203125, -0.45346832275390625, -0.4246826171875, -0.39589691162109375, -0.3671112060546875, -0.33832550048828125, -0.309539794921875, -0.28075408935546875, -0.2519683837890625, -0.22318267822265625, -0.19439697265625, -0.16561126708984375, -0.1368255615234375, -0.10803985595703125, -0.079254150390625, -0.05046844482421875, -0.0216827392578125, 0.00710296630859375, 0.035888671875, 0.06467437744140625, 0.0934600830078125, 0.12224578857421875, 0.151031494140625, 0.17981719970703125, 0.2086029052734375, 0.23738861083984375, 0.26617431640625, 0.29496002197265625, 0.3237457275390625, 0.35253143310546875, 0.381317138671875, 0.41010284423828125, 0.4388885498046875, 0.46767425537109375, 0.4964599609375, 0.5252456665039062, 0.5540313720703125, 0.5828170776367188, 0.611602783203125, 0.6403884887695312, 0.6691741943359375, 0.6979598999023438, 0.72674560546875, 0.7555313110351562, 0.7843170166015625, 0.8131027221679688, 0.841888427734375, 0.8706741333007812, 0.8994598388671875, 0.9282455444335938, 0.95703125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 3.0, 10.0, 12.0, 13.0, 15.0, 13.0, 12.0, 16.0, 20.0, 23.0, 25.0, 39.0, 31.0, 30.0, 34.0, 55.0, 42.0, 40.0, 42.0, 42.0, 37.0, 48.0, 39.0, 42.0, 42.0, 33.0, 37.0, 26.0, 21.0, 20.0, 23.0, 15.0, 14.0, 11.0, 10.0, 8.0, 13.0, 13.0, 7.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.335205078125, -0.3254280090332031, -0.31565093994140625, -0.3058738708496094, -0.2960968017578125, -0.2863197326660156, -0.27654266357421875, -0.2667655944824219, -0.256988525390625, -0.24721145629882812, -0.23743438720703125, -0.22765731811523438, -0.2178802490234375, -0.20810317993164062, -0.19832611083984375, -0.18854904174804688, -0.17877197265625, -0.16899490356445312, -0.15921783447265625, -0.14944076538085938, -0.1396636962890625, -0.12988662719726562, -0.12010955810546875, -0.11033248901367188, -0.100555419921875, -0.09077835083007812, -0.08100128173828125, -0.07122421264648438, -0.0614471435546875, -0.051670074462890625, -0.04189300537109375, -0.032115936279296875, -0.0223388671875, -0.012561798095703125, -0.00278472900390625, 0.006992340087890625, 0.0167694091796875, 0.026546478271484375, 0.03632354736328125, 0.046100616455078125, 0.055877685546875, 0.06565475463867188, 0.07543182373046875, 0.08520889282226562, 0.0949859619140625, 0.10476303100585938, 0.11454010009765625, 0.12431716918945312, 0.13409423828125, 0.14387130737304688, 0.15364837646484375, 0.16342544555664062, 0.1732025146484375, 0.18297958374023438, 0.19275665283203125, 0.20253372192382812, 0.212310791015625, 0.22208786010742188, 0.23186492919921875, 0.24164199829101562, 0.2514190673828125, 0.2611961364746094, 0.27097320556640625, 0.2807502746582031, 0.29052734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 9.0, 15.0, 14.0, 32.0, 34.0, 57.0, 66.0, 95.0, 142.0, 221.0, 353.0, 504.0, 801.0, 1229.0, 2055.0, 3133.0, 4967.0, 8653.0, 14732.0, 28311.0, 64162.0, 605827.0, 203233.0, 52440.0, 24312.0, 13076.0, 7552.0, 4581.0, 2816.0, 1831.0, 1062.0, 735.0, 491.0, 313.0, 218.0, 116.0, 95.0, 68.0, 52.0, 25.0, 31.0, 23.0, 16.0, 10.0, 11.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.5947265625, -0.5766448974609375, -0.558563232421875, -0.5404815673828125, -0.52239990234375, -0.5043182373046875, -0.486236572265625, -0.4681549072265625, -0.4500732421875, -0.4319915771484375, -0.413909912109375, -0.3958282470703125, -0.37774658203125, -0.3596649169921875, -0.341583251953125, -0.3235015869140625, -0.305419921875, -0.2873382568359375, -0.269256591796875, -0.2511749267578125, -0.23309326171875, -0.2150115966796875, -0.196929931640625, -0.1788482666015625, -0.1607666015625, -0.1426849365234375, -0.124603271484375, -0.1065216064453125, -0.08843994140625, -0.0703582763671875, -0.052276611328125, -0.0341949462890625, -0.01611328125, 0.0019683837890625, 0.020050048828125, 0.0381317138671875, 0.05621337890625, 0.0742950439453125, 0.092376708984375, 0.1104583740234375, 0.1285400390625, 0.1466217041015625, 0.164703369140625, 0.1827850341796875, 0.20086669921875, 0.2189483642578125, 0.237030029296875, 0.2551116943359375, 0.273193359375, 0.2912750244140625, 0.309356689453125, 0.3274383544921875, 0.34552001953125, 0.3636016845703125, 0.381683349609375, 0.3997650146484375, 0.4178466796875, 0.4359283447265625, 0.454010009765625, 0.4720916748046875, 0.49017333984375, 0.5082550048828125, 0.526336669921875, 0.5444183349609375, 0.5625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 11.0, 7.0, 11.0, 18.0, 18.0, 36.0, 46.0, 77.0, 165.0, 279.0, 109.0, 62.0, 34.0, 18.0, 18.0, 17.0, 12.0, 8.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.996755599975586e-05, -1.9385479390621185e-05, -1.880340278148651e-05, -1.8221326172351837e-05, -1.7639249563217163e-05, -1.705717295408249e-05, -1.6475096344947815e-05, -1.589301973581314e-05, -1.5310943126678467e-05, -1.4728866517543793e-05, -1.4146789908409119e-05, -1.3564713299274445e-05, -1.298263669013977e-05, -1.2400560081005096e-05, -1.1818483471870422e-05, -1.1236406862735748e-05, -1.0654330253601074e-05, -1.00722536444664e-05, -9.490177035331726e-06, -8.908100426197052e-06, -8.326023817062378e-06, -7.743947207927704e-06, -7.16187059879303e-06, -6.579793989658356e-06, -5.997717380523682e-06, -5.4156407713890076e-06, -4.8335641622543335e-06, -4.2514875531196594e-06, -3.6694109439849854e-06, -3.0873343348503113e-06, -2.505257725715637e-06, -1.923181116580963e-06, -1.341104507446289e-06, -7.59027898311615e-07, -1.7695128917694092e-07, 4.0512531995773315e-07, 9.872019290924072e-07, 1.5692785382270813e-06, 2.1513551473617554e-06, 2.7334317564964294e-06, 3.3155083656311035e-06, 3.897584974765778e-06, 4.479661583900452e-06, 5.061738193035126e-06, 5.6438148021698e-06, 6.225891411304474e-06, 6.807968020439148e-06, 7.390044629573822e-06, 7.972121238708496e-06, 8.55419784784317e-06, 9.136274456977844e-06, 9.718351066112518e-06, 1.0300427675247192e-05, 1.0882504284381866e-05, 1.146458089351654e-05, 1.2046657502651215e-05, 1.2628734111785889e-05, 1.3210810720920563e-05, 1.3792887330055237e-05, 1.4374963939189911e-05, 1.4957040548324585e-05, 1.553911715745926e-05, 1.6121193766593933e-05, 1.6703270375728607e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 14.0, 16.0, 28.0, 30.0, 49.0, 98.0, 104.0, 198.0, 253.0, 427.0, 618.0, 942.0, 1454.0, 2197.0, 3476.0, 5825.0, 10047.0, 20742.0, 49331.0, 255262.0, 592530.0, 55121.0, 22294.0, 11020.0, 6044.0, 3609.0, 2362.0, 1515.0, 1007.0, 665.0, 419.0, 292.0, 186.0, 128.0, 66.0, 64.0, 33.0, 30.0, 13.0, 11.0, 11.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.78173828125, -0.758087158203125, -0.73443603515625, -0.710784912109375, -0.6871337890625, -0.663482666015625, -0.63983154296875, -0.616180419921875, -0.592529296875, -0.568878173828125, -0.54522705078125, -0.521575927734375, -0.4979248046875, -0.474273681640625, -0.45062255859375, -0.426971435546875, -0.4033203125, -0.379669189453125, -0.35601806640625, -0.332366943359375, -0.3087158203125, -0.285064697265625, -0.26141357421875, -0.237762451171875, -0.214111328125, -0.190460205078125, -0.16680908203125, -0.143157958984375, -0.1195068359375, -0.095855712890625, -0.07220458984375, -0.048553466796875, -0.02490234375, -0.001251220703125, 0.02239990234375, 0.046051025390625, 0.0697021484375, 0.093353271484375, 0.11700439453125, 0.140655517578125, 0.164306640625, 0.187957763671875, 0.21160888671875, 0.235260009765625, 0.2589111328125, 0.282562255859375, 0.30621337890625, 0.329864501953125, 0.353515625, 0.377166748046875, 0.40081787109375, 0.424468994140625, 0.4481201171875, 0.471771240234375, 0.49542236328125, 0.519073486328125, 0.542724609375, 0.566375732421875, 0.59002685546875, 0.613677978515625, 0.6373291015625, 0.660980224609375, 0.68463134765625, 0.708282470703125, 0.73193359375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 3.0, 10.0, 8.0, 7.0, 15.0, 19.0, 26.0, 25.0, 42.0, 44.0, 85.0, 366.0, 93.0, 41.0, 43.0, 31.0, 28.0, 10.0, 23.0, 13.0, 7.0, 9.0, 7.0, 3.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22577667236328125, -0.2196197509765625, -0.21346282958984375, -0.207305908203125, -0.20114898681640625, -0.1949920654296875, -0.18883514404296875, -0.18267822265625, -0.17652130126953125, -0.1703643798828125, -0.16420745849609375, -0.158050537109375, -0.15189361572265625, -0.1457366943359375, -0.13957977294921875, -0.1334228515625, -0.12726593017578125, -0.1211090087890625, -0.11495208740234375, -0.108795166015625, -0.10263824462890625, -0.0964813232421875, -0.09032440185546875, -0.08416748046875, -0.07801055908203125, -0.0718536376953125, -0.06569671630859375, -0.059539794921875, -0.05338287353515625, -0.0472259521484375, -0.04106903076171875, -0.034912109375, -0.02875518798828125, -0.0225982666015625, -0.01644134521484375, -0.010284423828125, -0.00412750244140625, 0.0020294189453125, 0.00818634033203125, 0.01434326171875, 0.02050018310546875, 0.0266571044921875, 0.03281402587890625, 0.038970947265625, 0.04512786865234375, 0.0512847900390625, 0.05744171142578125, 0.0635986328125, 0.06975555419921875, 0.0759124755859375, 0.08206939697265625, 0.088226318359375, 0.09438323974609375, 0.1005401611328125, 0.10669708251953125, 0.11285400390625, 0.11901092529296875, 0.1251678466796875, 0.13132476806640625, 0.137481689453125, 0.14363861083984375, 0.1497955322265625, 0.15595245361328125, 0.162109375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 8.0, 14.0, 9.0, 25.0, 24.0, 36.0, 39.0, 55.0, 62.0, 103.0, 95.0, 101.0, 74.0, 67.0, 51.0, 42.0, 34.0, 25.0, 22.0, 18.0, 20.0, 6.0, 6.0, 4.0, 10.0, 4.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6671497821807861, -0.6462233662605286, -0.625296950340271, -0.6043705344200134, -0.5834441184997559, -0.5625177621841431, -0.5415913462638855, -0.5206649303436279, -0.49973851442337036, -0.4788120985031128, -0.4578856825828552, -0.43695929646492004, -0.4160328805446625, -0.3951064646244049, -0.3741800785064697, -0.35325366258621216, -0.3323272466659546, -0.311400830745697, -0.29047441482543945, -0.2695480287075043, -0.2486216127872467, -0.22769519686698914, -0.20676879584789276, -0.1858423948287964, -0.16491597890853882, -0.14398956298828125, -0.12306316196918488, -0.1021367534995079, -0.08121034502983093, -0.06028393656015396, -0.03935752809047699, -0.018431127071380615, 0.002495288848876953, 0.023421697318553925, 0.044348105788230896, 0.06527451425790787, 0.08620092272758484, 0.10712733119726181, 0.12805373966693878, 0.14898014068603516, 0.16990655660629272, 0.1908329725265503, 0.21175937354564667, 0.23268577456474304, 0.2536121904850006, 0.2745386064052582, 0.29546499252319336, 0.3163914084434509, 0.3373178243637085, 0.35824424028396606, 0.37917065620422363, 0.4000970423221588, 0.4210234582424164, 0.44194987416267395, 0.46287626028060913, 0.4838026762008667, 0.5047290921211243, 0.5256555080413818, 0.5465819239616394, 0.567508339881897, 0.5884346961975098, 0.6093611121177673, 0.6302875280380249, 0.6512139439582825, 0.67214035987854]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 11.0, 6.0, 8.0, 5.0, 7.0, 12.0, 8.0, 12.0, 10.0, 13.0, 8.0, 21.0, 29.0, 26.0, 24.0, 28.0, 32.0, 35.0, 34.0, 22.0, 28.0, 36.0, 27.0, 31.0, 40.0, 32.0, 38.0, 45.0, 20.0, 35.0, 31.0, 24.0, 34.0, 30.0, 27.0, 28.0, 22.0, 30.0, 22.0, 9.0, 6.0, 7.0, 8.0, 3.0, 6.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.4383643865585327, -0.42473548650741577, -0.41110658645629883, -0.3974776864051819, -0.38384878635406494, -0.370219886302948, -0.35659098625183105, -0.3429620862007141, -0.32933318614959717, -0.3157042860984802, -0.3020753860473633, -0.28844648599624634, -0.2748175859451294, -0.26118868589401245, -0.2475597858428955, -0.23393088579177856, -0.22030198574066162, -0.20667308568954468, -0.19304418563842773, -0.1794152855873108, -0.16578638553619385, -0.1521574854850769, -0.13852858543395996, -0.12489968538284302, -0.11127078533172607, -0.09764188528060913, -0.08401298522949219, -0.07038408517837524, -0.0567551851272583, -0.04312628507614136, -0.029497385025024414, -0.01586848497390747, -0.0022395551204681396, 0.011389344930648804, 0.025018244981765747, 0.03864714503288269, 0.052276045083999634, 0.06590494513511658, 0.07953384518623352, 0.09316274523735046, 0.10679164528846741, 0.12042054533958435, 0.1340494453907013, 0.14767834544181824, 0.16130724549293518, 0.17493614554405212, 0.18856504559516907, 0.202193945646286, 0.21582284569740295, 0.2294517457485199, 0.24308064579963684, 0.2567095458507538, 0.2703384459018707, 0.28396734595298767, 0.2975962460041046, 0.31122514605522156, 0.3248540461063385, 0.33848294615745544, 0.3521118462085724, 0.36574074625968933, 0.3793696463108063, 0.3929985463619232, 0.40662744641304016, 0.4202563464641571, 0.43388524651527405]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 18.0, 29.0, 29.0, 48.0, 73.0, 96.0, 131.0, 146.0, 250.0, 389.0, 536.0, 780.0, 1201.0, 1678.0, 2488.0, 3722.0, 5888.0, 9101.0, 14550.0, 24008.0, 40630.0, 72011.0, 135255.0, 294106.0, 909029.0, 1647415.0, 569537.0, 210251.0, 104799.0, 57923.0, 33013.0, 20225.0, 12103.0, 7871.0, 4938.0, 3313.0, 2122.0, 1453.0, 1031.0, 624.0, 471.0, 314.0, 228.0, 135.0, 97.0, 67.0, 55.0, 28.0, 22.0, 13.0, 12.0, 9.0, 4.0, 3.0, 2.0], "bins": [-0.67822265625, -0.6584625244140625, -0.638702392578125, -0.6189422607421875, -0.59918212890625, -0.5794219970703125, -0.559661865234375, -0.5399017333984375, -0.5201416015625, -0.5003814697265625, -0.480621337890625, -0.4608612060546875, -0.44110107421875, -0.4213409423828125, -0.401580810546875, -0.3818206787109375, -0.362060546875, -0.3423004150390625, -0.322540283203125, -0.3027801513671875, -0.28302001953125, -0.2632598876953125, -0.243499755859375, -0.2237396240234375, -0.2039794921875, -0.1842193603515625, -0.164459228515625, -0.1446990966796875, -0.12493896484375, -0.1051788330078125, -0.085418701171875, -0.0656585693359375, -0.0458984375, -0.0261383056640625, -0.006378173828125, 0.0133819580078125, 0.03314208984375, 0.0529022216796875, 0.072662353515625, 0.0924224853515625, 0.1121826171875, 0.1319427490234375, 0.151702880859375, 0.1714630126953125, 0.19122314453125, 0.2109832763671875, 0.230743408203125, 0.2505035400390625, 0.270263671875, 0.2900238037109375, 0.309783935546875, 0.3295440673828125, 0.34930419921875, 0.3690643310546875, 0.388824462890625, 0.4085845947265625, 0.4283447265625, 0.4481048583984375, 0.467864990234375, 0.4876251220703125, 0.50738525390625, 0.5271453857421875, 0.546905517578125, 0.5666656494140625, 0.58642578125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 3.0, 6.0, 5.0, 10.0, 8.0, 7.0, 13.0, 13.0, 10.0, 12.0, 13.0, 9.0, 18.0, 22.0, 27.0, 30.0, 20.0, 25.0, 38.0, 23.0, 33.0, 32.0, 21.0, 34.0, 47.0, 41.0, 36.0, 39.0, 35.0, 31.0, 24.0, 35.0, 25.0, 24.0, 27.0, 27.0, 27.0, 22.0, 23.0, 17.0, 14.0, 10.0, 9.0, 11.0, 8.0, 5.0, 6.0, 2.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.255859375, -0.24770736694335938, -0.23955535888671875, -0.23140335083007812, -0.2232513427734375, -0.21509933471679688, -0.20694732666015625, -0.19879531860351562, -0.190643310546875, -0.18249130249023438, -0.17433929443359375, -0.16618728637695312, -0.1580352783203125, -0.14988327026367188, -0.14173126220703125, -0.13357925415039062, -0.12542724609375, -0.11727523803710938, -0.10912322998046875, -0.10097122192382812, -0.0928192138671875, -0.08466720581054688, -0.07651519775390625, -0.06836318969726562, -0.060211181640625, -0.052059173583984375, -0.04390716552734375, -0.035755157470703125, -0.0276031494140625, -0.019451141357421875, -0.01129913330078125, -0.003147125244140625, 0.0050048828125, 0.013156890869140625, 0.02130889892578125, 0.029460906982421875, 0.0376129150390625, 0.045764923095703125, 0.05391693115234375, 0.062068939208984375, 0.070220947265625, 0.07837295532226562, 0.08652496337890625, 0.09467697143554688, 0.1028289794921875, 0.11098098754882812, 0.11913299560546875, 0.12728500366210938, 0.13543701171875, 0.14358901977539062, 0.15174102783203125, 0.15989303588867188, 0.1680450439453125, 0.17619705200195312, 0.18434906005859375, 0.19250106811523438, 0.200653076171875, 0.20880508422851562, 0.21695709228515625, 0.22510910034179688, 0.2332611083984375, 0.24141311645507812, 0.24956512451171875, 0.2577171325683594, 0.265869140625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 12.0, 32.0, 30.0, 53.0, 82.0, 133.0, 229.0, 319.0, 477.0, 790.0, 1206.0, 1920.0, 3177.0, 5110.0, 8531.0, 14446.0, 24476.0, 43595.0, 80998.0, 162526.0, 360165.0, 1021028.0, 1501234.0, 515460.0, 214380.0, 104194.0, 54910.0, 30402.0, 17498.0, 10446.0, 6166.0, 3944.0, 2384.0, 1390.0, 883.0, 598.0, 379.0, 223.0, 157.0, 104.0, 61.0, 51.0, 28.0, 18.0, 13.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5881729125976562, -0.5699005126953125, -0.5516281127929688, -0.533355712890625, -0.5150833129882812, -0.4968109130859375, -0.47853851318359375, -0.46026611328125, -0.44199371337890625, -0.4237213134765625, -0.40544891357421875, -0.387176513671875, -0.36890411376953125, -0.3506317138671875, -0.33235931396484375, -0.3140869140625, -0.29581451416015625, -0.2775421142578125, -0.25926971435546875, -0.240997314453125, -0.22272491455078125, -0.2044525146484375, -0.18618011474609375, -0.16790771484375, -0.14963531494140625, -0.1313629150390625, -0.11309051513671875, -0.094818115234375, -0.07654571533203125, -0.0582733154296875, -0.04000091552734375, -0.021728515625, -0.00345611572265625, 0.0148162841796875, 0.03308868408203125, 0.051361083984375, 0.06963348388671875, 0.0879058837890625, 0.10617828369140625, 0.12445068359375, 0.14272308349609375, 0.1609954833984375, 0.17926788330078125, 0.197540283203125, 0.21581268310546875, 0.2340850830078125, 0.25235748291015625, 0.2706298828125, 0.28890228271484375, 0.3071746826171875, 0.32544708251953125, 0.343719482421875, 0.36199188232421875, 0.3802642822265625, 0.39853668212890625, 0.41680908203125, 0.43508148193359375, 0.4533538818359375, 0.47162628173828125, 0.489898681640625, 0.5081710815429688, 0.5264434814453125, 0.5447158813476562, 0.56298828125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 9.0, 10.0, 21.0, 18.0, 16.0, 40.0, 33.0, 45.0, 50.0, 61.0, 101.0, 89.0, 102.0, 126.0, 163.0, 197.0, 204.0, 216.0, 262.0, 281.0, 280.0, 267.0, 241.0, 202.0, 164.0, 136.0, 136.0, 97.0, 89.0, 80.0, 66.0, 42.0, 46.0, 31.0, 27.0, 22.0, 15.0, 23.0, 10.0, 7.0, 7.0, 15.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.15771484375, -0.1527729034423828, -0.14783096313476562, -0.14288902282714844, -0.13794708251953125, -0.13300514221191406, -0.12806320190429688, -0.12312126159667969, -0.1181793212890625, -0.11323738098144531, -0.10829544067382812, -0.10335350036621094, -0.09841156005859375, -0.09346961975097656, -0.08852767944335938, -0.08358573913574219, -0.078643798828125, -0.07370185852050781, -0.06875991821289062, -0.06381797790527344, -0.05887603759765625, -0.05393409729003906, -0.048992156982421875, -0.04405021667480469, -0.0391082763671875, -0.03416633605957031, -0.029224395751953125, -0.024282455444335938, -0.01934051513671875, -0.014398574829101562, -0.009456634521484375, -0.0045146942138671875, 0.00042724609375, 0.0053691864013671875, 0.010311126708984375, 0.015253067016601562, 0.02019500732421875, 0.025136947631835938, 0.030078887939453125, 0.03502082824707031, 0.0399627685546875, 0.04490470886230469, 0.049846649169921875, 0.05478858947753906, 0.05973052978515625, 0.06467247009277344, 0.06961441040039062, 0.07455635070800781, 0.079498291015625, 0.08444023132324219, 0.08938217163085938, 0.09432411193847656, 0.09926605224609375, 0.10420799255371094, 0.10914993286132812, 0.11409187316894531, 0.1190338134765625, 0.12397575378417969, 0.12891769409179688, 0.13385963439941406, 0.13880157470703125, 0.14374351501464844, 0.14868545532226562, 0.1536273956298828, 0.1585693359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 10.0, 7.0, 5.0, 9.0, 12.0, 14.0, 21.0, 18.0, 35.0, 43.0, 47.0, 56.0, 72.0, 86.0, 111.0, 80.0, 88.0, 43.0, 42.0, 41.0, 24.0, 25.0, 17.0, 20.0, 6.0, 18.0, 6.0, 5.0, 8.0, 6.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4045407772064209, -0.3903734087944031, -0.37620604038238525, -0.36203867197036743, -0.3478713035583496, -0.3337039351463318, -0.31953656673431396, -0.30536919832229614, -0.2912018299102783, -0.2770344614982605, -0.2628670930862427, -0.24869972467422485, -0.23453235626220703, -0.2203649878501892, -0.2061976194381714, -0.19203025102615356, -0.17786286771297455, -0.16369549930095673, -0.1495281308889389, -0.13536076247692108, -0.12119339406490326, -0.10702601820230484, -0.09285864979028702, -0.0786912813782692, -0.06452391296625137, -0.05035654455423355, -0.03618917614221573, -0.022021804004907608, -0.007854435592889786, 0.006312936544418335, 0.020480304956436157, 0.03464767336845398, 0.0488150417804718, 0.06298241019248962, 0.07714977860450745, 0.09131714701652527, 0.10548451542854309, 0.11965189129114151, 0.13381925225257874, 0.14798662066459656, 0.16215398907661438, 0.1763213574886322, 0.19048872590065002, 0.20465609431266785, 0.21882346272468567, 0.2329908311367035, 0.2471581995487213, 0.26132556796073914, 0.27549296617507935, 0.28966033458709717, 0.303827702999115, 0.3179950714111328, 0.33216243982315063, 0.34632980823516846, 0.3604971766471863, 0.3746645450592041, 0.3888319134712219, 0.40299928188323975, 0.41716665029525757, 0.4313340187072754, 0.4455013871192932, 0.45966875553131104, 0.47383612394332886, 0.4880034923553467, 0.5021708607673645]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 8.0, 10.0, 9.0, 11.0, 15.0, 21.0, 17.0, 20.0, 22.0, 26.0, 30.0, 28.0, 25.0, 27.0, 32.0, 34.0, 36.0, 45.0, 39.0, 30.0, 29.0, 36.0, 33.0, 39.0, 38.0, 30.0, 37.0, 39.0, 42.0, 21.0, 31.0, 25.0, 22.0, 12.0, 11.0, 11.0, 14.0, 12.0, 6.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34295332431793213, -0.332820862531662, -0.32268840074539185, -0.3125559687614441, -0.30242350697517395, -0.2922910451889038, -0.28215858340263367, -0.2720261216163635, -0.2618936598300934, -0.25176119804382324, -0.2416287511587143, -0.23149628937244415, -0.221363827586174, -0.21123138070106506, -0.20109891891479492, -0.19096645712852478, -0.18083401024341583, -0.1707015484571457, -0.16056910157203674, -0.1504366397857666, -0.14030417799949646, -0.13017171621322632, -0.12003926932811737, -0.10990680754184723, -0.09977435320615768, -0.08964189887046814, -0.079509437084198, -0.06937698274850845, -0.05924452468752861, -0.04911206662654877, -0.03897961229085922, -0.02884715050458908, -0.018714696168899536, -0.008582239039242268, 0.001550218090415001, 0.011682674288749695, 0.021815132349729538, 0.03194759041070938, 0.042080044746398926, 0.05221250653266907, 0.06234496086835861, 0.07247741520404816, 0.0826098769903183, 0.09274233132600784, 0.10287478566169739, 0.11300724744796753, 0.12313970178365707, 0.1332721710205078, 0.14340461790561676, 0.1535370796918869, 0.16366952657699585, 0.173801988363266, 0.18393445014953613, 0.19406691193580627, 0.20419935882091522, 0.21433182060718536, 0.2244642674922943, 0.23459672927856445, 0.2447291761636734, 0.25486165285110474, 0.2649940848350525, 0.27512654662132263, 0.2852590084075928, 0.2953914701938629, 0.30552393198013306]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 13.0, 11.0, 12.0, 16.0, 34.0, 43.0, 61.0, 87.0, 119.0, 197.0, 270.0, 388.0, 530.0, 863.0, 1254.0, 1950.0, 3077.0, 4732.0, 7404.0, 11642.0, 18952.0, 31720.0, 56523.0, 112819.0, 280803.0, 269237.0, 109335.0, 54857.0, 31084.0, 18592.0, 11310.0, 7208.0, 4645.0, 2994.0, 1888.0, 1302.0, 805.0, 571.0, 370.0, 259.0, 188.0, 121.0, 94.0, 58.0, 41.0, 28.0, 23.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2841796875, -0.2755622863769531, -0.26694488525390625, -0.2583274841308594, -0.2497100830078125, -0.24109268188476562, -0.23247528076171875, -0.22385787963867188, -0.215240478515625, -0.20662307739257812, -0.19800567626953125, -0.18938827514648438, -0.1807708740234375, -0.17215347290039062, -0.16353607177734375, -0.15491867065429688, -0.14630126953125, -0.13768386840820312, -0.12906646728515625, -0.12044906616210938, -0.1118316650390625, -0.10321426391601562, -0.09459686279296875, -0.08597946166992188, -0.077362060546875, -0.06874465942382812, -0.06012725830078125, -0.051509857177734375, -0.0428924560546875, -0.034275054931640625, -0.02565765380859375, -0.017040252685546875, -0.0084228515625, 0.000194549560546875, 0.00881195068359375, 0.017429351806640625, 0.0260467529296875, 0.034664154052734375, 0.04328155517578125, 0.051898956298828125, 0.060516357421875, 0.06913375854492188, 0.07775115966796875, 0.08636856079101562, 0.0949859619140625, 0.10360336303710938, 0.11222076416015625, 0.12083816528320312, 0.12945556640625, 0.13807296752929688, 0.14669036865234375, 0.15530776977539062, 0.1639251708984375, 0.17254257202148438, 0.18115997314453125, 0.18977737426757812, 0.198394775390625, 0.20701217651367188, 0.21562957763671875, 0.22424697875976562, 0.2328643798828125, 0.24148178100585938, 0.25009918212890625, 0.2587165832519531, 0.267333984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 13.0, 15.0, 18.0, 9.0, 16.0, 28.0, 28.0, 28.0, 16.0, 26.0, 26.0, 29.0, 25.0, 32.0, 45.0, 30.0, 38.0, 29.0, 32.0, 41.0, 35.0, 34.0, 38.0, 29.0, 37.0, 35.0, 28.0, 26.0, 31.0, 31.0, 18.0, 17.0, 11.0, 3.0, 14.0, 13.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.3203125, -0.31081390380859375, -0.3013153076171875, -0.29181671142578125, -0.282318115234375, -0.27281951904296875, -0.2633209228515625, -0.25382232666015625, -0.24432373046875, -0.23482513427734375, -0.2253265380859375, -0.21582794189453125, -0.206329345703125, -0.19683074951171875, -0.1873321533203125, -0.17783355712890625, -0.1683349609375, -0.15883636474609375, -0.1493377685546875, -0.13983917236328125, -0.130340576171875, -0.12084197998046875, -0.1113433837890625, -0.10184478759765625, -0.09234619140625, -0.08284759521484375, -0.0733489990234375, -0.06385040283203125, -0.054351806640625, -0.04485321044921875, -0.0353546142578125, -0.02585601806640625, -0.016357421875, -0.00685882568359375, 0.0026397705078125, 0.01213836669921875, 0.021636962890625, 0.03113555908203125, 0.0406341552734375, 0.05013275146484375, 0.05963134765625, 0.06912994384765625, 0.0786285400390625, 0.08812713623046875, 0.097625732421875, 0.10712432861328125, 0.1166229248046875, 0.12612152099609375, 0.1356201171875, 0.14511871337890625, 0.1546173095703125, 0.16411590576171875, 0.173614501953125, 0.18311309814453125, 0.1926116943359375, 0.20211029052734375, 0.21160888671875, 0.22110748291015625, 0.2306060791015625, 0.24010467529296875, 0.249603271484375, 0.25910186767578125, 0.2686004638671875, 0.27809906005859375, 0.28759765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 5.0, 10.0, 9.0, 13.0, 10.0, 22.0, 26.0, 40.0, 51.0, 55.0, 93.0, 125.0, 184.0, 224.0, 330.0, 460.0, 657.0, 939.0, 1298.0, 1912.0, 2744.0, 4335.0, 6970.0, 12102.0, 24455.0, 65429.0, 561610.0, 268413.0, 47678.0, 20074.0, 10230.0, 6100.0, 3740.0, 2458.0, 1642.0, 1171.0, 809.0, 589.0, 425.0, 287.0, 229.0, 174.0, 125.0, 97.0, 63.0, 43.0, 40.0, 20.0, 12.0, 8.0, 13.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.45458984375, -0.4398612976074219, -0.42513275146484375, -0.4104042053222656, -0.3956756591796875, -0.3809471130371094, -0.36621856689453125, -0.3514900207519531, -0.336761474609375, -0.3220329284667969, -0.30730438232421875, -0.2925758361816406, -0.2778472900390625, -0.2631187438964844, -0.24839019775390625, -0.23366165161132812, -0.21893310546875, -0.20420455932617188, -0.18947601318359375, -0.17474746704101562, -0.1600189208984375, -0.14529037475585938, -0.13056182861328125, -0.11583328247070312, -0.101104736328125, -0.08637619018554688, -0.07164764404296875, -0.056919097900390625, -0.0421905517578125, -0.027462005615234375, -0.01273345947265625, 0.001995086669921875, 0.0167236328125, 0.031452178955078125, 0.04618072509765625, 0.060909271240234375, 0.0756378173828125, 0.09036636352539062, 0.10509490966796875, 0.11982345581054688, 0.134552001953125, 0.14928054809570312, 0.16400909423828125, 0.17873764038085938, 0.1934661865234375, 0.20819473266601562, 0.22292327880859375, 0.23765182495117188, 0.25238037109375, 0.2671089172363281, 0.28183746337890625, 0.2965660095214844, 0.3112945556640625, 0.3260231018066406, 0.34075164794921875, 0.3554801940917969, 0.370208740234375, 0.3849372863769531, 0.39966583251953125, 0.4143943786621094, 0.4291229248046875, 0.4438514709472656, 0.45858001708984375, 0.4733085632324219, 0.488037109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 5.0, 7.0, 9.0, 18.0, 11.0, 10.0, 20.0, 23.0, 23.0, 19.0, 32.0, 20.0, 35.0, 35.0, 21.0, 33.0, 40.0, 42.0, 55.0, 38.0, 52.0, 31.0, 25.0, 29.0, 32.0, 35.0, 25.0, 32.0, 30.0, 11.0, 22.0, 32.0, 13.0, 16.0, 14.0, 14.0, 21.0, 13.0, 7.0, 9.0, 3.0, 7.0, 12.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.19677734375, -0.19060897827148438, -0.18444061279296875, -0.17827224731445312, -0.1721038818359375, -0.16593551635742188, -0.15976715087890625, -0.15359878540039062, -0.147430419921875, -0.14126205444335938, -0.13509368896484375, -0.12892532348632812, -0.1227569580078125, -0.11658859252929688, -0.11042022705078125, -0.10425186157226562, -0.09808349609375, -0.09191513061523438, -0.08574676513671875, -0.07957839965820312, -0.0734100341796875, -0.06724166870117188, -0.06107330322265625, -0.054904937744140625, -0.048736572265625, -0.042568206787109375, -0.03639984130859375, -0.030231475830078125, -0.0240631103515625, -0.017894744873046875, -0.01172637939453125, -0.005558013916015625, 0.0006103515625, 0.006778717041015625, 0.01294708251953125, 0.019115447998046875, 0.0252838134765625, 0.031452178955078125, 0.03762054443359375, 0.043788909912109375, 0.049957275390625, 0.056125640869140625, 0.06229400634765625, 0.06846237182617188, 0.0746307373046875, 0.08079910278320312, 0.08696746826171875, 0.09313583374023438, 0.09930419921875, 0.10547256469726562, 0.11164093017578125, 0.11780929565429688, 0.1239776611328125, 0.13014602661132812, 0.13631439208984375, 0.14248275756835938, 0.148651123046875, 0.15481948852539062, 0.16098785400390625, 0.16715621948242188, 0.1733245849609375, 0.17949295043945312, 0.18566131591796875, 0.19182968139648438, 0.197998046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 12.0, 12.0, 8.0, 15.0, 20.0, 25.0, 36.0, 45.0, 54.0, 53.0, 78.0, 123.0, 130.0, 192.0, 247.0, 323.0, 475.0, 712.0, 1136.0, 1808.0, 3080.0, 5899.0, 14006.0, 50561.0, 779155.0, 147121.0, 23801.0, 8568.0, 4257.0, 2326.0, 1294.0, 848.0, 553.0, 356.0, 287.0, 215.0, 147.0, 120.0, 106.0, 78.0, 61.0, 44.0, 43.0, 25.0, 23.0, 23.0, 20.0, 6.0, 8.0, 4.0, 2.0, 10.0, 2.0, 0.0, 3.0, 3.0], "bins": [-0.11767578125, -0.11408138275146484, -0.11048698425292969, -0.10689258575439453, -0.10329818725585938, -0.09970378875732422, -0.09610939025878906, -0.0925149917602539, -0.08892059326171875, -0.0853261947631836, -0.08173179626464844, -0.07813739776611328, -0.07454299926757812, -0.07094860076904297, -0.06735420227050781, -0.06375980377197266, -0.0601654052734375, -0.056571006774902344, -0.05297660827636719, -0.04938220977783203, -0.045787811279296875, -0.04219341278076172, -0.03859901428222656, -0.035004615783691406, -0.03141021728515625, -0.027815818786621094, -0.024221420288085938, -0.02062702178955078, -0.017032623291015625, -0.013438224792480469, -0.009843826293945312, -0.006249427795410156, -0.002655029296875, 0.0009393692016601562, 0.0045337677001953125, 0.008128166198730469, 0.011722564697265625, 0.015316963195800781, 0.018911361694335938, 0.022505760192871094, 0.02610015869140625, 0.029694557189941406, 0.03328895568847656, 0.03688335418701172, 0.040477752685546875, 0.04407215118408203, 0.04766654968261719, 0.051260948181152344, 0.0548553466796875, 0.058449745178222656, 0.06204414367675781, 0.06563854217529297, 0.06923294067382812, 0.07282733917236328, 0.07642173767089844, 0.0800161361694336, 0.08361053466796875, 0.0872049331665039, 0.09079933166503906, 0.09439373016357422, 0.09798812866210938, 0.10158252716064453, 0.10517692565917969, 0.10877132415771484, 0.11236572265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 3.0, 10.0, 15.0, 16.0, 30.0, 28.0, 20.0, 57.0, 71.0, 33.0, 85.0, 74.0, 33.0, 101.0, 77.0, 29.0, 75.0, 37.0, 21.0, 19.0, 29.0, 15.0, 13.0, 23.0, 7.0, 11.0, 11.0, 2.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.337860107421875e-06, -3.238208591938019e-06, -3.1385570764541626e-06, -3.0389055609703064e-06, -2.93925404548645e-06, -2.839602530002594e-06, -2.739951014518738e-06, -2.6402994990348816e-06, -2.5406479835510254e-06, -2.440996468067169e-06, -2.341344952583313e-06, -2.2416934370994568e-06, -2.1420419216156006e-06, -2.0423904061317444e-06, -1.942738890647888e-06, -1.843087375164032e-06, -1.7434358596801758e-06, -1.6437843441963196e-06, -1.5441328287124634e-06, -1.4444813132286072e-06, -1.344829797744751e-06, -1.2451782822608948e-06, -1.1455267667770386e-06, -1.0458752512931824e-06, -9.462237358093262e-07, -8.4657222032547e-07, -7.469207048416138e-07, -6.472691893577576e-07, -5.476176738739014e-07, -4.4796615839004517e-07, -3.4831464290618896e-07, -2.4866312742233276e-07, -1.4901161193847656e-07, -4.936009645462036e-08, 5.029141902923584e-08, 1.4994293451309204e-07, 2.4959444999694824e-07, 3.4924596548080444e-07, 4.4889748096466064e-07, 5.485489964485168e-07, 6.48200511932373e-07, 7.478520274162292e-07, 8.475035429000854e-07, 9.471550583839417e-07, 1.0468065738677979e-06, 1.146458089351654e-06, 1.2461096048355103e-06, 1.3457611203193665e-06, 1.4454126358032227e-06, 1.5450641512870789e-06, 1.644715666770935e-06, 1.7443671822547913e-06, 1.8440186977386475e-06, 1.9436702132225037e-06, 2.04332172870636e-06, 2.142973244190216e-06, 2.2426247596740723e-06, 2.3422762751579285e-06, 2.4419277906417847e-06, 2.541579306125641e-06, 2.641230821609497e-06, 2.7408823370933533e-06, 2.8405338525772095e-06, 2.9401853680610657e-06, 3.039836883544922e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 10.0, 6.0, 18.0, 13.0, 28.0, 32.0, 56.0, 69.0, 113.0, 155.0, 212.0, 284.0, 414.0, 585.0, 857.0, 1192.0, 1939.0, 3117.0, 4910.0, 8706.0, 16125.0, 34633.0, 96432.0, 515809.0, 243459.0, 62671.0, 25379.0, 12542.0, 6909.0, 4104.0, 2546.0, 1691.0, 1070.0, 744.0, 537.0, 317.0, 237.0, 189.0, 146.0, 93.0, 62.0, 48.0, 36.0, 26.0, 11.0, 5.0, 12.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0841064453125, -0.08154296875, -0.0789794921875, -0.076416015625, -0.0738525390625, -0.0712890625, -0.0687255859375, -0.066162109375, -0.0635986328125, -0.06103515625, -0.0584716796875, -0.055908203125, -0.0533447265625, -0.05078125, -0.0482177734375, -0.045654296875, -0.0430908203125, -0.04052734375, -0.0379638671875, -0.035400390625, -0.0328369140625, -0.0302734375, -0.0277099609375, -0.025146484375, -0.0225830078125, -0.02001953125, -0.0174560546875, -0.014892578125, -0.0123291015625, -0.009765625, -0.0072021484375, -0.004638671875, -0.0020751953125, 0.00048828125, 0.0030517578125, 0.005615234375, 0.0081787109375, 0.0107421875, 0.0133056640625, 0.015869140625, 0.0184326171875, 0.02099609375, 0.0235595703125, 0.026123046875, 0.0286865234375, 0.03125, 0.0338134765625, 0.036376953125, 0.0389404296875, 0.04150390625, 0.0440673828125, 0.046630859375, 0.0491943359375, 0.0517578125, 0.0543212890625, 0.056884765625, 0.0594482421875, 0.06201171875, 0.0645751953125, 0.067138671875, 0.0697021484375, 0.072265625, 0.0748291015625, 0.077392578125, 0.0799560546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 7.0, 8.0, 14.0, 11.0, 14.0, 17.0, 14.0, 18.0, 25.0, 33.0, 40.0, 63.0, 84.0, 125.0, 141.0, 78.0, 56.0, 60.0, 41.0, 26.0, 19.0, 15.0, 21.0, 15.0, 5.0, 11.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.015106201171875, -0.014635562896728516, -0.014164924621582031, -0.013694286346435547, -0.013223648071289062, -0.012753009796142578, -0.012282371520996094, -0.01181173324584961, -0.011341094970703125, -0.01087045669555664, -0.010399818420410156, -0.009929180145263672, -0.009458541870117188, -0.008987903594970703, -0.008517265319824219, -0.008046627044677734, -0.00757598876953125, -0.007105350494384766, -0.006634712219238281, -0.006164073944091797, -0.0056934356689453125, -0.005222797393798828, -0.004752159118652344, -0.004281520843505859, -0.003810882568359375, -0.0033402442932128906, -0.0028696060180664062, -0.002398967742919922, -0.0019283294677734375, -0.0014576911926269531, -0.0009870529174804688, -0.0005164146423339844, -4.57763671875e-05, 0.0004248619079589844, 0.0008955001831054688, 0.0013661384582519531, 0.0018367767333984375, 0.002307415008544922, 0.0027780532836914062, 0.0032486915588378906, 0.003719329833984375, 0.004189968109130859, 0.004660606384277344, 0.005131244659423828, 0.0056018829345703125, 0.006072521209716797, 0.006543159484863281, 0.007013797760009766, 0.00748443603515625, 0.007955074310302734, 0.008425712585449219, 0.008896350860595703, 0.009366989135742188, 0.009837627410888672, 0.010308265686035156, 0.01077890396118164, 0.011249542236328125, 0.01172018051147461, 0.012190818786621094, 0.012661457061767578, 0.013132095336914062, 0.013602733612060547, 0.014073371887207031, 0.014544010162353516, 0.0150146484375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 11.0, 9.0, 9.0, 6.0, 11.0, 19.0, 16.0, 27.0, 33.0, 47.0, 58.0, 49.0, 74.0, 98.0, 96.0, 90.0, 72.0, 47.0, 34.0, 34.0, 37.0, 19.0, 11.0, 16.0, 13.0, 12.0, 6.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38890865445137024, -0.37509986758232117, -0.3612910509109497, -0.34748226404190063, -0.3336734473705292, -0.3198646605014801, -0.30605584383010864, -0.29224705696105957, -0.2784382402896881, -0.26462945342063904, -0.2508206367492676, -0.2370118349790573, -0.22320303320884705, -0.20939424633979797, -0.1955854296684265, -0.18177664279937744, -0.16796784102916718, -0.1541590392589569, -0.14035023748874664, -0.12654143571853638, -0.11273263394832611, -0.09892383962869644, -0.08511503785848618, -0.07130623608827591, -0.05749743431806564, -0.04368863254785538, -0.02987983264029026, -0.016071032732725143, -0.0022622309625148773, 0.01154656708240509, 0.025355368852615356, 0.03916417062282562, 0.05297297239303589, 0.06678177416324615, 0.08059057593345642, 0.09439937770366669, 0.10820817947387695, 0.12201697379350662, 0.13582578301429749, 0.14963456988334656, 0.16344338655471802, 0.17725218832492828, 0.19106099009513855, 0.20486979186534882, 0.21867859363555908, 0.23248738050460815, 0.24629619717597961, 0.2601049840450287, 0.27391380071640015, 0.2877225875854492, 0.3015314042568207, 0.31534019112586975, 0.3291490077972412, 0.3429577946662903, 0.35676661133766174, 0.3705753982067108, 0.3843841850757599, 0.39819297194480896, 0.4120017886161804, 0.4258105754852295, 0.43961939215660095, 0.45342817902565, 0.4672369956970215, 0.48104578256607056, 0.494854599237442]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 3.0, 5.0, 9.0, 6.0, 12.0, 11.0, 15.0, 21.0, 16.0, 20.0, 22.0, 24.0, 27.0, 28.0, 28.0, 29.0, 21.0, 42.0, 33.0, 47.0, 34.0, 35.0, 31.0, 34.0, 30.0, 37.0, 43.0, 28.0, 40.0, 34.0, 39.0, 27.0, 34.0, 19.0, 24.0, 14.0, 13.0, 8.0, 15.0, 12.0, 10.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3349111080169678, -0.3250650465488434, -0.315218985080719, -0.3053729236125946, -0.2955268621444702, -0.2856808006763458, -0.27583473920822144, -0.26598864793777466, -0.25614261627197266, -0.24629655480384827, -0.23645049333572388, -0.2266044318675995, -0.2167583703994751, -0.2069123089313507, -0.19706623256206512, -0.18722017109394073, -0.17737409472465515, -0.16752803325653076, -0.15768197178840637, -0.14783591032028198, -0.1379898488521576, -0.1281437873840332, -0.11829771101474762, -0.10845164954662323, -0.09860558807849884, -0.08875952661037445, -0.07891346514225006, -0.06906739622354507, -0.059221334755420685, -0.049375273287296295, -0.03952920809388161, -0.02968314290046692, -0.01983705163002014, -0.009990988299250603, -0.00014492496848106384, 0.009701138362288475, 0.019547201693058014, 0.029393263161182404, 0.03923932835459709, 0.04908539354801178, 0.05893145501613617, 0.06877751648426056, 0.07862357795238495, 0.08846964687108994, 0.09831570833921432, 0.10816176980733871, 0.1180078387260437, 0.1278539001941681, 0.13769996166229248, 0.14754602313041687, 0.15739208459854126, 0.16723814606666565, 0.17708420753479004, 0.18693026900291443, 0.1967763453722, 0.2066224068403244, 0.2164684683084488, 0.22631452977657318, 0.23616059124469757, 0.24600665271282196, 0.25585272908210754, 0.26569879055023193, 0.2755448520183563, 0.2853909134864807, 0.2952369749546051]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 12.0, 12.0, 20.0, 29.0, 46.0, 81.0, 98.0, 151.0, 295.0, 437.0, 708.0, 1147.0, 1895.0, 3095.0, 5290.0, 8812.0, 15128.0, 26636.0, 49716.0, 97333.0, 204638.0, 296789.0, 162885.0, 78781.0, 40686.0, 22257.0, 12653.0, 7453.0, 4535.0, 2666.0, 1642.0, 998.0, 595.0, 378.0, 238.0, 163.0, 96.0, 48.0, 44.0, 23.0, 15.0, 20.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59814453125, -0.5762710571289062, -0.5543975830078125, -0.5325241088867188, -0.510650634765625, -0.48877716064453125, -0.4669036865234375, -0.44503021240234375, -0.42315673828125, -0.40128326416015625, -0.3794097900390625, -0.35753631591796875, -0.335662841796875, -0.31378936767578125, -0.2919158935546875, -0.27004241943359375, -0.2481689453125, -0.22629547119140625, -0.2044219970703125, -0.18254852294921875, -0.160675048828125, -0.13880157470703125, -0.1169281005859375, -0.09505462646484375, -0.07318115234375, -0.05130767822265625, -0.0294342041015625, -0.00756072998046875, 0.014312744140625, 0.03618621826171875, 0.0580596923828125, 0.07993316650390625, 0.101806640625, 0.12368011474609375, 0.1455535888671875, 0.16742706298828125, 0.189300537109375, 0.21117401123046875, 0.2330474853515625, 0.25492095947265625, 0.27679443359375, 0.29866790771484375, 0.3205413818359375, 0.34241485595703125, 0.364288330078125, 0.38616180419921875, 0.4080352783203125, 0.42990875244140625, 0.4517822265625, 0.47365570068359375, 0.4955291748046875, 0.5174026489257812, 0.539276123046875, 0.5611495971679688, 0.5830230712890625, 0.6048965454101562, 0.62677001953125, 0.6486434936523438, 0.6705169677734375, 0.6923904418945312, 0.714263916015625, 0.7361373901367188, 0.7580108642578125, 0.7798843383789062, 0.8017578125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 4.0, 9.0, 10.0, 11.0, 12.0, 8.0, 18.0, 21.0, 20.0, 12.0, 31.0, 32.0, 22.0, 29.0, 30.0, 40.0, 34.0, 37.0, 47.0, 37.0, 39.0, 30.0, 43.0, 34.0, 39.0, 32.0, 43.0, 41.0, 37.0, 23.0, 21.0, 20.0, 27.0, 21.0, 12.0, 18.0, 10.0, 12.0, 8.0, 8.0, 3.0, 8.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.317138671875, -0.3077545166015625, -0.298370361328125, -0.2889862060546875, -0.27960205078125, -0.2702178955078125, -0.260833740234375, -0.2514495849609375, -0.2420654296875, -0.2326812744140625, -0.223297119140625, -0.2139129638671875, -0.20452880859375, -0.1951446533203125, -0.185760498046875, -0.1763763427734375, -0.1669921875, -0.1576080322265625, -0.148223876953125, -0.1388397216796875, -0.12945556640625, -0.1200714111328125, -0.110687255859375, -0.1013031005859375, -0.0919189453125, -0.0825347900390625, -0.073150634765625, -0.0637664794921875, -0.05438232421875, -0.0449981689453125, -0.035614013671875, -0.0262298583984375, -0.016845703125, -0.0074615478515625, 0.001922607421875, 0.0113067626953125, 0.02069091796875, 0.0300750732421875, 0.039459228515625, 0.0488433837890625, 0.0582275390625, 0.0676116943359375, 0.076995849609375, 0.0863800048828125, 0.09576416015625, 0.1051483154296875, 0.114532470703125, 0.1239166259765625, 0.13330078125, 0.1426849365234375, 0.152069091796875, 0.1614532470703125, 0.17083740234375, 0.1802215576171875, 0.189605712890625, 0.1989898681640625, 0.2083740234375, 0.2177581787109375, 0.227142333984375, 0.2365264892578125, 0.24591064453125, 0.2552947998046875, 0.264678955078125, 0.2740631103515625, 0.283447265625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 11.0, 21.0, 22.0, 35.0, 54.0, 67.0, 96.0, 150.0, 241.0, 336.0, 567.0, 846.0, 1358.0, 2155.0, 3537.0, 6375.0, 10802.0, 19876.0, 38313.0, 77756.0, 166300.0, 331421.0, 200099.0, 90729.0, 44316.0, 22977.0, 12392.0, 6918.0, 4123.0, 2492.0, 1440.0, 969.0, 610.0, 370.0, 254.0, 208.0, 86.0, 68.0, 52.0, 40.0, 21.0, 15.0, 13.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7473526000976562, -0.7237091064453125, -0.7000656127929688, -0.676422119140625, -0.6527786254882812, -0.6291351318359375, -0.6054916381835938, -0.58184814453125, -0.5582046508789062, -0.5345611572265625, -0.5109176635742188, -0.487274169921875, -0.46363067626953125, -0.4399871826171875, -0.41634368896484375, -0.3927001953125, -0.36905670166015625, -0.3454132080078125, -0.32176971435546875, -0.298126220703125, -0.27448272705078125, -0.2508392333984375, -0.22719573974609375, -0.20355224609375, -0.17990875244140625, -0.1562652587890625, -0.13262176513671875, -0.108978271484375, -0.08533477783203125, -0.0616912841796875, -0.03804779052734375, -0.014404296875, 0.00923919677734375, 0.0328826904296875, 0.05652618408203125, 0.080169677734375, 0.10381317138671875, 0.1274566650390625, 0.15110015869140625, 0.17474365234375, 0.19838714599609375, 0.2220306396484375, 0.24567413330078125, 0.269317626953125, 0.29296112060546875, 0.3166046142578125, 0.34024810791015625, 0.3638916015625, 0.38753509521484375, 0.4111785888671875, 0.43482208251953125, 0.458465576171875, 0.48210906982421875, 0.5057525634765625, 0.5293960571289062, 0.55303955078125, 0.5766830444335938, 0.6003265380859375, 0.6239700317382812, 0.647613525390625, 0.6712570190429688, 0.6949005126953125, 0.7185440063476562, 0.7421875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 10.0, 10.0, 9.0, 10.0, 19.0, 17.0, 28.0, 27.0, 17.0, 34.0, 33.0, 43.0, 42.0, 42.0, 47.0, 48.0, 34.0, 52.0, 48.0, 35.0, 44.0, 38.0, 41.0, 45.0, 33.0, 25.0, 32.0, 18.0, 26.0, 12.0, 11.0, 17.0, 14.0, 8.0, 6.0, 6.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2335205078125, -0.22669410705566406, -0.21986770629882812, -0.2130413055419922, -0.20621490478515625, -0.1993885040283203, -0.19256210327148438, -0.18573570251464844, -0.1789093017578125, -0.17208290100097656, -0.16525650024414062, -0.1584300994873047, -0.15160369873046875, -0.1447772979736328, -0.13795089721679688, -0.13112449645996094, -0.124298095703125, -0.11747169494628906, -0.11064529418945312, -0.10381889343261719, -0.09699249267578125, -0.09016609191894531, -0.08333969116210938, -0.07651329040527344, -0.0696868896484375, -0.06286048889160156, -0.056034088134765625, -0.04920768737792969, -0.04238128662109375, -0.03555488586425781, -0.028728485107421875, -0.021902084350585938, -0.01507568359375, -0.008249282836914062, -0.001422882080078125, 0.0054035186767578125, 0.01222991943359375, 0.019056320190429688, 0.025882720947265625, 0.03270912170410156, 0.0395355224609375, 0.04636192321777344, 0.053188323974609375, 0.06001472473144531, 0.06684112548828125, 0.07366752624511719, 0.08049392700195312, 0.08732032775878906, 0.094146728515625, 0.10097312927246094, 0.10779953002929688, 0.11462593078613281, 0.12145233154296875, 0.1282787322998047, 0.13510513305664062, 0.14193153381347656, 0.1487579345703125, 0.15558433532714844, 0.16241073608398438, 0.1692371368408203, 0.17606353759765625, 0.1828899383544922, 0.18971633911132812, 0.19654273986816406, 0.203369140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 7.0, 9.0, 12.0, 11.0, 22.0, 23.0, 33.0, 48.0, 65.0, 92.0, 153.0, 168.0, 261.0, 298.0, 447.0, 620.0, 803.0, 1115.0, 1532.0, 2050.0, 2751.0, 3952.0, 5518.0, 8024.0, 12207.0, 19044.0, 31720.0, 60678.0, 699964.0, 89388.0, 38846.0, 22788.0, 13959.0, 9370.0, 6331.0, 4483.0, 3132.0, 2291.0, 1657.0, 1218.0, 941.0, 678.0, 510.0, 356.0, 253.0, 214.0, 132.0, 101.0, 86.0, 62.0, 43.0, 28.0, 29.0, 17.0, 10.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.162841796875, -0.1577014923095703, -0.15256118774414062, -0.14742088317871094, -0.14228057861328125, -0.13714027404785156, -0.13199996948242188, -0.1268596649169922, -0.1217193603515625, -0.11657905578613281, -0.11143875122070312, -0.10629844665527344, -0.10115814208984375, -0.09601783752441406, -0.09087753295898438, -0.08573722839355469, -0.080596923828125, -0.07545661926269531, -0.07031631469726562, -0.06517601013183594, -0.06003570556640625, -0.05489540100097656, -0.049755096435546875, -0.04461479187011719, -0.0394744873046875, -0.03433418273925781, -0.029193878173828125, -0.024053573608398438, -0.01891326904296875, -0.013772964477539062, -0.008632659912109375, -0.0034923553466796875, 0.00164794921875, 0.0067882537841796875, 0.011928558349609375, 0.017068862915039062, 0.02220916748046875, 0.027349472045898438, 0.032489776611328125, 0.03763008117675781, 0.0427703857421875, 0.04791069030761719, 0.053050994873046875, 0.05819129943847656, 0.06333160400390625, 0.06847190856933594, 0.07361221313476562, 0.07875251770019531, 0.083892822265625, 0.08903312683105469, 0.09417343139648438, 0.09931373596191406, 0.10445404052734375, 0.10959434509277344, 0.11473464965820312, 0.11987495422363281, 0.1250152587890625, 0.1301555633544922, 0.13529586791992188, 0.14043617248535156, 0.14557647705078125, 0.15071678161621094, 0.15585708618164062, 0.1609973907470703, 0.1661376953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 15.0, 15.0, 20.0, 27.0, 41.0, 89.0, 340.0, 235.0, 80.0, 31.0, 29.0, 20.0, 10.0, 11.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5407800674438477e-05, -1.5020370483398438e-05, -1.4632940292358398e-05, -1.424551010131836e-05, -1.385807991027832e-05, -1.3470649719238281e-05, -1.3083219528198242e-05, -1.2695789337158203e-05, -1.2308359146118164e-05, -1.1920928955078125e-05, -1.1533498764038086e-05, -1.1146068572998047e-05, -1.0758638381958008e-05, -1.0371208190917969e-05, -9.98377799987793e-06, -9.59634780883789e-06, -9.208917617797852e-06, -8.821487426757812e-06, -8.434057235717773e-06, -8.046627044677734e-06, -7.659196853637695e-06, -7.271766662597656e-06, -6.884336471557617e-06, -6.496906280517578e-06, -6.109476089477539e-06, -5.7220458984375e-06, -5.334615707397461e-06, -4.947185516357422e-06, -4.559755325317383e-06, -4.172325134277344e-06, -3.7848949432373047e-06, -3.3974647521972656e-06, -3.0100345611572266e-06, -2.6226043701171875e-06, -2.2351741790771484e-06, -1.8477439880371094e-06, -1.4603137969970703e-06, -1.0728836059570312e-06, -6.854534149169922e-07, -2.980232238769531e-07, 8.940696716308594e-08, 4.76837158203125e-07, 8.642673492431641e-07, 1.2516975402832031e-06, 1.6391277313232422e-06, 2.0265579223632812e-06, 2.4139881134033203e-06, 2.8014183044433594e-06, 3.1888484954833984e-06, 3.5762786865234375e-06, 3.9637088775634766e-06, 4.351139068603516e-06, 4.738569259643555e-06, 5.125999450683594e-06, 5.513429641723633e-06, 5.900859832763672e-06, 6.288290023803711e-06, 6.67572021484375e-06, 7.063150405883789e-06, 7.450580596923828e-06, 7.838010787963867e-06, 8.225440979003906e-06, 8.612871170043945e-06, 9.000301361083984e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 13.0, 17.0, 32.0, 27.0, 43.0, 69.0, 82.0, 116.0, 161.0, 188.0, 264.0, 402.0, 488.0, 712.0, 960.0, 1352.0, 1955.0, 2822.0, 4243.0, 6563.0, 10490.0, 18110.0, 34109.0, 77087.0, 750941.0, 62990.0, 29867.0, 16063.0, 9408.0, 5888.0, 3911.0, 2687.0, 1797.0, 1305.0, 883.0, 724.0, 448.0, 366.0, 244.0, 193.0, 137.0, 102.0, 78.0, 64.0, 34.0, 27.0, 27.0, 16.0, 13.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.2462158203125, -0.2383747100830078, -0.23053359985351562, -0.22269248962402344, -0.21485137939453125, -0.20701026916503906, -0.19916915893554688, -0.1913280487060547, -0.1834869384765625, -0.1756458282470703, -0.16780471801757812, -0.15996360778808594, -0.15212249755859375, -0.14428138732910156, -0.13644027709960938, -0.1285991668701172, -0.120758056640625, -0.11291694641113281, -0.10507583618164062, -0.09723472595214844, -0.08939361572265625, -0.08155250549316406, -0.07371139526367188, -0.06587028503417969, -0.0580291748046875, -0.05018806457519531, -0.042346954345703125, -0.03450584411621094, -0.02666473388671875, -0.018823623657226562, -0.010982513427734375, -0.0031414031982421875, 0.00469970703125, 0.012540817260742188, 0.020381927490234375, 0.028223037719726562, 0.03606414794921875, 0.04390525817871094, 0.051746368408203125, 0.05958747863769531, 0.0674285888671875, 0.07526969909667969, 0.08311080932617188, 0.09095191955566406, 0.09879302978515625, 0.10663414001464844, 0.11447525024414062, 0.12231636047363281, 0.130157470703125, 0.1379985809326172, 0.14583969116210938, 0.15368080139160156, 0.16152191162109375, 0.16936302185058594, 0.17720413208007812, 0.1850452423095703, 0.1928863525390625, 0.2007274627685547, 0.20856857299804688, 0.21640968322753906, 0.22425079345703125, 0.23209190368652344, 0.23993301391601562, 0.2477741241455078, 0.255615234375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 6.0, 12.0, 16.0, 13.0, 16.0, 25.0, 37.0, 21.0, 43.0, 556.0, 48.0, 22.0, 15.0, 22.0, 20.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0823974609375, -0.07986640930175781, -0.07733535766601562, -0.07480430603027344, -0.07227325439453125, -0.06974220275878906, -0.06721115112304688, -0.06468009948730469, -0.0621490478515625, -0.05961799621582031, -0.057086944580078125, -0.05455589294433594, -0.05202484130859375, -0.04949378967285156, -0.046962738037109375, -0.04443168640136719, -0.041900634765625, -0.03936958312988281, -0.036838531494140625, -0.03430747985839844, -0.03177642822265625, -0.029245376586914062, -0.026714324951171875, -0.024183273315429688, -0.0216522216796875, -0.019121170043945312, -0.016590118408203125, -0.014059066772460938, -0.01152801513671875, -0.008996963500976562, -0.006465911865234375, -0.0039348602294921875, -0.00140380859375, 0.0011272430419921875, 0.003658294677734375, 0.0061893463134765625, 0.00872039794921875, 0.011251449584960938, 0.013782501220703125, 0.016313552856445312, 0.0188446044921875, 0.021375656127929688, 0.023906707763671875, 0.026437759399414062, 0.02896881103515625, 0.03149986267089844, 0.034030914306640625, 0.03656196594238281, 0.039093017578125, 0.04162406921386719, 0.044155120849609375, 0.04668617248535156, 0.04921722412109375, 0.05174827575683594, 0.054279327392578125, 0.05681037902832031, 0.0593414306640625, 0.06187248229980469, 0.06440353393554688, 0.06693458557128906, 0.06946563720703125, 0.07199668884277344, 0.07452774047851562, 0.07705879211425781, 0.07958984375]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 3.0, 6.0, 6.0, 11.0, 13.0, 16.0, 19.0, 21.0, 34.0, 38.0, 46.0, 76.0, 105.0, 102.0, 110.0, 82.0, 58.0, 47.0, 41.0, 18.0, 30.0, 23.0, 17.0, 12.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4173910915851593, -0.40293681621551514, -0.38848257064819336, -0.3740282952785492, -0.35957401990890503, -0.34511977434158325, -0.3306654989719391, -0.3162112236022949, -0.30175697803497314, -0.287302702665329, -0.2728484570980072, -0.25839418172836304, -0.24393990635871887, -0.2294856458902359, -0.21503138542175293, -0.20057711005210876, -0.1861228346824646, -0.17166857421398163, -0.15721429884433746, -0.1427600383758545, -0.12830576300621033, -0.11385150253772736, -0.09939724206924438, -0.08494297415018082, -0.07048870623111725, -0.05603443831205368, -0.04158017411828041, -0.02712590992450714, -0.012671642005443573, 0.0017826259136199951, 0.016236886382102966, 0.030691154301166534, 0.04514545202255249, 0.05959971994161606, 0.07405398786067963, 0.0885082483291626, 0.10296251624822617, 0.11741678416728973, 0.1318710446357727, 0.14632532000541687, 0.16077958047389984, 0.1752338409423828, 0.18968811631202698, 0.20414237678050995, 0.21859663724899292, 0.23305091261863708, 0.24750517308712006, 0.261959433555603, 0.2764137089252472, 0.29086798429489136, 0.30532222986221313, 0.3197765052318573, 0.33423078060150146, 0.34868502616882324, 0.3631393015384674, 0.3775935769081116, 0.39204782247543335, 0.4065020978450775, 0.4209563434123993, 0.43541061878204346, 0.4498648941516876, 0.4643191695213318, 0.47877341508865356, 0.49322769045829773, 0.5076819658279419]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 8.0, 3.0, 5.0, 11.0, 16.0, 14.0, 17.0, 20.0, 15.0, 24.0, 19.0, 29.0, 33.0, 30.0, 33.0, 44.0, 40.0, 25.0, 35.0, 40.0, 26.0, 39.0, 43.0, 33.0, 43.0, 38.0, 26.0, 33.0, 28.0, 41.0, 24.0, 27.0, 19.0, 23.0, 15.0, 13.0, 13.0, 8.0, 12.0, 9.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.30924877524375916, -0.29950910806655884, -0.2897694408893585, -0.2800297737121582, -0.2702901065349579, -0.26055043935775757, -0.25081077218055725, -0.24107110500335693, -0.23133143782615662, -0.2215917706489563, -0.21185210347175598, -0.20211243629455566, -0.19237276911735535, -0.18263310194015503, -0.1728934347629547, -0.1631537675857544, -0.15341410040855408, -0.14367443323135376, -0.13393476605415344, -0.12419509887695312, -0.11445543169975281, -0.10471576452255249, -0.09497609734535217, -0.08523643016815186, -0.07549676299095154, -0.06575709581375122, -0.0560174286365509, -0.046277761459350586, -0.03653809428215027, -0.02679842710494995, -0.017058759927749634, -0.007319092750549316, 0.0024205446243286133, 0.01216021180152893, 0.021899878978729248, 0.031639546155929565, 0.04137921333312988, 0.0511188805103302, 0.06085854768753052, 0.07059821486473083, 0.08033788204193115, 0.09007754921913147, 0.09981721639633179, 0.1095568835735321, 0.11929655075073242, 0.12903621792793274, 0.13877588510513306, 0.14851555228233337, 0.1582552194595337, 0.167994886636734, 0.17773455381393433, 0.18747422099113464, 0.19721388816833496, 0.20695355534553528, 0.2166932225227356, 0.2264328896999359, 0.23617255687713623, 0.24591222405433655, 0.25565189123153687, 0.2653915584087372, 0.2751312255859375, 0.2848708927631378, 0.29461055994033813, 0.30435022711753845, 0.31408989429473877]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 14.0, 13.0, 18.0, 30.0, 71.0, 94.0, 133.0, 232.0, 393.0, 648.0, 1087.0, 1774.0, 2974.0, 4988.0, 8500.0, 14579.0, 25476.0, 46905.0, 91702.0, 195657.0, 556398.0, 1880694.0, 874088.0, 253392.0, 109996.0, 54293.0, 29479.0, 16508.0, 9685.0, 5939.0, 3550.0, 2033.0, 1248.0, 726.0, 401.0, 223.0, 118.0, 71.0, 51.0, 36.0, 21.0, 22.0, 11.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.4167366027832031, -0.40110015869140625, -0.3854637145996094, -0.3698272705078125, -0.3541908264160156, -0.33855438232421875, -0.3229179382324219, -0.307281494140625, -0.2916450500488281, -0.27600860595703125, -0.2603721618652344, -0.2447357177734375, -0.22909927368164062, -0.21346282958984375, -0.19782638549804688, -0.18218994140625, -0.16655349731445312, -0.15091705322265625, -0.13528060913085938, -0.1196441650390625, -0.10400772094726562, -0.08837127685546875, -0.07273483276367188, -0.057098388671875, -0.041461944580078125, -0.02582550048828125, -0.010189056396484375, 0.0054473876953125, 0.021083831787109375, 0.03672027587890625, 0.052356719970703125, 0.0679931640625, 0.08362960815429688, 0.09926605224609375, 0.11490249633789062, 0.1305389404296875, 0.14617538452148438, 0.16181182861328125, 0.17744827270507812, 0.193084716796875, 0.20872116088867188, 0.22435760498046875, 0.23999404907226562, 0.2556304931640625, 0.2712669372558594, 0.28690338134765625, 0.3025398254394531, 0.31817626953125, 0.3338127136230469, 0.34944915771484375, 0.3650856018066406, 0.3807220458984375, 0.3963584899902344, 0.41199493408203125, 0.4276313781738281, 0.443267822265625, 0.4589042663574219, 0.47454071044921875, 0.4901771545410156, 0.5058135986328125, 0.5214500427246094, 0.5370864868164062, 0.5527229309082031, 0.568359375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 11.0, 8.0, 20.0, 16.0, 11.0, 19.0, 20.0, 19.0, 26.0, 39.0, 33.0, 34.0, 34.0, 48.0, 41.0, 46.0, 38.0, 36.0, 56.0, 38.0, 35.0, 49.0, 34.0, 35.0, 31.0, 35.0, 29.0, 19.0, 22.0, 21.0, 10.0, 16.0, 12.0, 11.0, 4.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.18994712829589844, -0.18348312377929688, -0.1770191192626953, -0.17055511474609375, -0.1640911102294922, -0.15762710571289062, -0.15116310119628906, -0.1446990966796875, -0.13823509216308594, -0.13177108764648438, -0.1253070831298828, -0.11884307861328125, -0.11237907409667969, -0.10591506958007812, -0.09945106506347656, -0.092987060546875, -0.08652305603027344, -0.08005905151367188, -0.07359504699707031, -0.06713104248046875, -0.06066703796386719, -0.054203033447265625, -0.04773902893066406, -0.0412750244140625, -0.03481101989746094, -0.028347015380859375, -0.021883010864257812, -0.01541900634765625, -0.008955001831054688, -0.002490997314453125, 0.0039730072021484375, 0.01043701171875, 0.016901016235351562, 0.023365020751953125, 0.029829025268554688, 0.03629302978515625, 0.04275703430175781, 0.049221038818359375, 0.05568504333496094, 0.0621490478515625, 0.06861305236816406, 0.07507705688476562, 0.08154106140136719, 0.08800506591796875, 0.09446907043457031, 0.10093307495117188, 0.10739707946777344, 0.113861083984375, 0.12032508850097656, 0.12678909301757812, 0.1332530975341797, 0.13971710205078125, 0.1461811065673828, 0.15264511108398438, 0.15910911560058594, 0.1655731201171875, 0.17203712463378906, 0.17850112915039062, 0.1849651336669922, 0.19142913818359375, 0.1978931427001953, 0.20435714721679688, 0.21082115173339844, 0.21728515625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 13.0, 13.0, 20.0, 40.0, 41.0, 69.0, 118.0, 179.0, 314.0, 500.0, 834.0, 1504.0, 2576.0, 4406.0, 7492.0, 13016.0, 22825.0, 40263.0, 75189.0, 148170.0, 320659.0, 854228.0, 1593315.0, 603994.0, 246066.0, 118600.0, 61511.0, 33146.0, 18927.0, 10830.0, 6350.0, 3725.0, 2090.0, 1238.0, 783.0, 445.0, 262.0, 176.0, 105.0, 67.0, 48.0, 26.0, 28.0, 15.0, 16.0, 5.0, 12.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.401123046875, -0.38909149169921875, -0.3770599365234375, -0.36502838134765625, -0.352996826171875, -0.34096527099609375, -0.3289337158203125, -0.31690216064453125, -0.30487060546875, -0.29283905029296875, -0.2808074951171875, -0.26877593994140625, -0.256744384765625, -0.24471282958984375, -0.2326812744140625, -0.22064971923828125, -0.2086181640625, -0.19658660888671875, -0.1845550537109375, -0.17252349853515625, -0.160491943359375, -0.14846038818359375, -0.1364288330078125, -0.12439727783203125, -0.11236572265625, -0.10033416748046875, -0.0883026123046875, -0.07627105712890625, -0.064239501953125, -0.05220794677734375, -0.0401763916015625, -0.02814483642578125, -0.01611328125, -0.00408172607421875, 0.0079498291015625, 0.01998138427734375, 0.032012939453125, 0.04404449462890625, 0.0560760498046875, 0.06810760498046875, 0.08013916015625, 0.09217071533203125, 0.1042022705078125, 0.11623382568359375, 0.128265380859375, 0.14029693603515625, 0.1523284912109375, 0.16436004638671875, 0.1763916015625, 0.18842315673828125, 0.2004547119140625, 0.21248626708984375, 0.224517822265625, 0.23654937744140625, 0.2485809326171875, 0.26061248779296875, 0.27264404296875, 0.28467559814453125, 0.2967071533203125, 0.30873870849609375, 0.320770263671875, 0.33280181884765625, 0.3448333740234375, 0.35686492919921875, 0.368896484375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 12.0, 17.0, 25.0, 18.0, 38.0, 32.0, 53.0, 69.0, 61.0, 86.0, 114.0, 144.0, 175.0, 218.0, 238.0, 245.0, 324.0, 347.0, 294.0, 277.0, 236.0, 229.0, 175.0, 133.0, 119.0, 98.0, 71.0, 60.0, 35.0, 38.0, 27.0, 17.0, 15.0, 7.0, 10.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10736083984375, -0.10346317291259766, -0.09956550598144531, -0.09566783905029297, -0.09177017211914062, -0.08787250518798828, -0.08397483825683594, -0.0800771713256836, -0.07617950439453125, -0.0722818374633789, -0.06838417053222656, -0.06448650360107422, -0.060588836669921875, -0.05669116973876953, -0.05279350280761719, -0.048895835876464844, -0.0449981689453125, -0.041100502014160156, -0.03720283508300781, -0.03330516815185547, -0.029407501220703125, -0.02550983428955078, -0.021612167358398438, -0.017714500427246094, -0.01381683349609375, -0.009919166564941406, -0.0060214996337890625, -0.0021238327026367188, 0.001773834228515625, 0.005671501159667969, 0.009569168090820312, 0.013466835021972656, 0.017364501953125, 0.021262168884277344, 0.025159835815429688, 0.02905750274658203, 0.032955169677734375, 0.03685283660888672, 0.04075050354003906, 0.044648170471191406, 0.04854583740234375, 0.052443504333496094, 0.05634117126464844, 0.06023883819580078, 0.06413650512695312, 0.06803417205810547, 0.07193183898925781, 0.07582950592041016, 0.0797271728515625, 0.08362483978271484, 0.08752250671386719, 0.09142017364501953, 0.09531784057617188, 0.09921550750732422, 0.10311317443847656, 0.1070108413696289, 0.11090850830078125, 0.1148061752319336, 0.11870384216308594, 0.12260150909423828, 0.12649917602539062, 0.13039684295654297, 0.1342945098876953, 0.13819217681884766, 0.14208984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 11.0, 9.0, 8.0, 9.0, 9.0, 22.0, 21.0, 27.0, 39.0, 43.0, 58.0, 62.0, 98.0, 104.0, 103.0, 84.0, 60.0, 50.0, 43.0, 31.0, 28.0, 20.0, 12.0, 10.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.4097573757171631, -0.3989008069038391, -0.38804423809051514, -0.37718766927719116, -0.3663311004638672, -0.3554745614528656, -0.3446179926395416, -0.33376142382621765, -0.3229048550128937, -0.3120482861995697, -0.3011917173862457, -0.29033514857292175, -0.27947860956192017, -0.2686220407485962, -0.2577654719352722, -0.24690890312194824, -0.23605233430862427, -0.2251957654953003, -0.21433919668197632, -0.20348264276981354, -0.19262607395648956, -0.1817695051431656, -0.1709129512310028, -0.16005638241767883, -0.14919981360435486, -0.13834324479103088, -0.1274866759777069, -0.11663012206554413, -0.10577355325222015, -0.09491698443889618, -0.0840604230761528, -0.07320386171340942, -0.06234732270240784, -0.05149075761437416, -0.040634192526340485, -0.02977762743830681, -0.018921062350273132, -0.008064497262239456, 0.00279206782579422, 0.013648629188537598, 0.024505198001861572, 0.03536176308989525, 0.046218328177928925, 0.0570748932659626, 0.06793145835399628, 0.07878802716732025, 0.08964458853006363, 0.100501149892807, 0.11135771870613098, 0.12221428751945496, 0.13307085633277893, 0.1439274102449417, 0.15478397905826569, 0.16564054787158966, 0.17649710178375244, 0.18735367059707642, 0.1982102394104004, 0.20906680822372437, 0.21992337703704834, 0.23077993094921112, 0.2416364997625351, 0.2524930536746979, 0.26334962248802185, 0.2742061913013458, 0.2850627601146698]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 1.0, 2.0, 5.0, 2.0, 12.0, 13.0, 9.0, 17.0, 18.0, 20.0, 19.0, 22.0, 31.0, 27.0, 28.0, 33.0, 28.0, 34.0, 35.0, 34.0, 41.0, 35.0, 39.0, 36.0, 33.0, 36.0, 45.0, 35.0, 40.0, 23.0, 24.0, 30.0, 36.0, 15.0, 25.0, 21.0, 14.0, 12.0, 9.0, 10.0, 9.0, 10.0, 10.0, 5.0, 2.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20034931600093842, -0.19382792711257935, -0.18730653822422028, -0.1807851493358612, -0.17426376044750214, -0.16774237155914307, -0.1612209975719452, -0.15469959378242493, -0.14817821979522705, -0.14165683090686798, -0.1351354420185089, -0.12861405313014984, -0.12209266424179077, -0.1155712753534317, -0.10904989391565323, -0.10252850502729416, -0.09600710868835449, -0.08948571979999542, -0.08296433091163635, -0.07644294202327728, -0.06992155313491821, -0.06340016424655914, -0.05687878280878067, -0.0503573939204216, -0.04383600503206253, -0.03731461614370346, -0.03079322911798954, -0.02427184209227562, -0.01775045320391655, -0.01122906431555748, -0.0047076791524887085, 0.0018137097358703613, 0.008335113525390625, 0.01485650148242712, 0.021377889439463615, 0.027899276465177536, 0.034420665353536606, 0.040942054241895676, 0.04746343940496445, 0.05398482829332352, 0.06050621718168259, 0.06702760607004166, 0.07354899495840073, 0.0800703763961792, 0.08659176528453827, 0.09311315417289734, 0.09963454306125641, 0.10615593194961548, 0.11267732083797455, 0.11919870972633362, 0.1257200986146927, 0.13224148750305176, 0.13876287639141083, 0.1452842652797699, 0.15180563926696777, 0.15832704305648804, 0.1648484170436859, 0.17136980593204498, 0.17789119482040405, 0.18441258370876312, 0.1909339725971222, 0.19745536148548126, 0.20397675037384033, 0.2104981243610382, 0.21701952815055847]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 4.0, 15.0, 13.0, 19.0, 25.0, 51.0, 64.0, 107.0, 155.0, 269.0, 484.0, 690.0, 1195.0, 1856.0, 3166.0, 5264.0, 9227.0, 16368.0, 30339.0, 62674.0, 170256.0, 452341.0, 164648.0, 61053.0, 29824.0, 16119.0, 8973.0, 5290.0, 3080.0, 1945.0, 1152.0, 703.0, 416.0, 285.0, 179.0, 94.0, 62.0, 45.0, 38.0, 19.0, 8.0, 6.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2327880859375, -0.22562217712402344, -0.21845626831054688, -0.2112903594970703, -0.20412445068359375, -0.1969585418701172, -0.18979263305664062, -0.18262672424316406, -0.1754608154296875, -0.16829490661621094, -0.16112899780273438, -0.1539630889892578, -0.14679718017578125, -0.1396312713623047, -0.13246536254882812, -0.12529945373535156, -0.118133544921875, -0.11096763610839844, -0.10380172729492188, -0.09663581848144531, -0.08946990966796875, -0.08230400085449219, -0.07513809204101562, -0.06797218322753906, -0.0608062744140625, -0.05364036560058594, -0.046474456787109375, -0.03930854797363281, -0.03214263916015625, -0.024976730346679688, -0.017810821533203125, -0.010644912719726562, -0.00347900390625, 0.0036869049072265625, 0.010852813720703125, 0.018018722534179688, 0.02518463134765625, 0.03235054016113281, 0.039516448974609375, 0.04668235778808594, 0.0538482666015625, 0.06101417541503906, 0.06818008422851562, 0.07534599304199219, 0.08251190185546875, 0.08967781066894531, 0.09684371948242188, 0.10400962829589844, 0.111175537109375, 0.11834144592285156, 0.12550735473632812, 0.1326732635498047, 0.13983917236328125, 0.1470050811767578, 0.15417098999023438, 0.16133689880371094, 0.1685028076171875, 0.17566871643066406, 0.18283462524414062, 0.1900005340576172, 0.19716644287109375, 0.2043323516845703, 0.21149826049804688, 0.21866416931152344, 0.225830078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 12.0, 6.0, 13.0, 7.0, 16.0, 17.0, 17.0, 23.0, 20.0, 26.0, 28.0, 26.0, 44.0, 34.0, 36.0, 29.0, 34.0, 40.0, 30.0, 39.0, 35.0, 37.0, 40.0, 33.0, 38.0, 42.0, 32.0, 30.0, 39.0, 28.0, 22.0, 18.0, 16.0, 13.0, 14.0, 8.0, 10.0, 11.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2086181640625, -0.2018299102783203, -0.19504165649414062, -0.18825340270996094, -0.18146514892578125, -0.17467689514160156, -0.16788864135742188, -0.1611003875732422, -0.1543121337890625, -0.1475238800048828, -0.14073562622070312, -0.13394737243652344, -0.12715911865234375, -0.12037086486816406, -0.11358261108398438, -0.10679435729980469, -0.100006103515625, -0.09321784973144531, -0.08642959594726562, -0.07964134216308594, -0.07285308837890625, -0.06606483459472656, -0.059276580810546875, -0.05248832702636719, -0.0457000732421875, -0.03891181945800781, -0.032123565673828125, -0.025335311889648438, -0.01854705810546875, -0.011758804321289062, -0.004970550537109375, 0.0018177032470703125, 0.00860595703125, 0.015394210815429688, 0.022182464599609375, 0.028970718383789062, 0.03575897216796875, 0.04254722595214844, 0.049335479736328125, 0.05612373352050781, 0.0629119873046875, 0.06970024108886719, 0.07648849487304688, 0.08327674865722656, 0.09006500244140625, 0.09685325622558594, 0.10364151000976562, 0.11042976379394531, 0.117218017578125, 0.12400627136230469, 0.13079452514648438, 0.13758277893066406, 0.14437103271484375, 0.15115928649902344, 0.15794754028320312, 0.1647357940673828, 0.1715240478515625, 0.1783123016357422, 0.18510055541992188, 0.19188880920410156, 0.19867706298828125, 0.20546531677246094, 0.21225357055664062, 0.2190418243408203, 0.225830078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 8.0, 6.0, 7.0, 22.0, 20.0, 36.0, 31.0, 66.0, 84.0, 131.0, 159.0, 233.0, 350.0, 524.0, 751.0, 1137.0, 1646.0, 2659.0, 4377.0, 7484.0, 14900.0, 37470.0, 234837.0, 642954.0, 56074.0, 19148.0, 9344.0, 5169.0, 3046.0, 1868.0, 1223.0, 843.0, 609.0, 378.0, 257.0, 204.0, 128.0, 98.0, 86.0, 42.0, 43.0, 29.0, 18.0, 18.0, 6.0, 9.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.370849609375, -0.35894775390625, -0.3470458984375, -0.33514404296875, -0.3232421875, -0.31134033203125, -0.2994384765625, -0.28753662109375, -0.275634765625, -0.26373291015625, -0.2518310546875, -0.23992919921875, -0.22802734375, -0.21612548828125, -0.2042236328125, -0.19232177734375, -0.180419921875, -0.16851806640625, -0.1566162109375, -0.14471435546875, -0.1328125, -0.12091064453125, -0.1090087890625, -0.09710693359375, -0.085205078125, -0.07330322265625, -0.0614013671875, -0.04949951171875, -0.03759765625, -0.02569580078125, -0.0137939453125, -0.00189208984375, 0.010009765625, 0.02191162109375, 0.0338134765625, 0.04571533203125, 0.0576171875, 0.06951904296875, 0.0814208984375, 0.09332275390625, 0.105224609375, 0.11712646484375, 0.1290283203125, 0.14093017578125, 0.15283203125, 0.16473388671875, 0.1766357421875, 0.18853759765625, 0.200439453125, 0.21234130859375, 0.2242431640625, 0.23614501953125, 0.248046875, 0.25994873046875, 0.2718505859375, 0.28375244140625, 0.295654296875, 0.30755615234375, 0.3194580078125, 0.33135986328125, 0.34326171875, 0.35516357421875, 0.3670654296875, 0.37896728515625, 0.390869140625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 3.0, 7.0, 16.0, 19.0, 12.0, 24.0, 20.0, 22.0, 31.0, 24.0, 22.0, 42.0, 46.0, 42.0, 41.0, 47.0, 44.0, 46.0, 40.0, 46.0, 55.0, 45.0, 36.0, 30.0, 33.0, 29.0, 26.0, 23.0, 21.0, 15.0, 13.0, 15.0, 12.0, 17.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1680736541748047, -0.16305160522460938, -0.15802955627441406, -0.15300750732421875, -0.14798545837402344, -0.14296340942382812, -0.1379413604736328, -0.1329193115234375, -0.1278972625732422, -0.12287521362304688, -0.11785316467285156, -0.11283111572265625, -0.10780906677246094, -0.10278701782226562, -0.09776496887207031, -0.092742919921875, -0.08772087097167969, -0.08269882202148438, -0.07767677307128906, -0.07265472412109375, -0.06763267517089844, -0.06261062622070312, -0.05758857727050781, -0.0525665283203125, -0.04754447937011719, -0.042522430419921875, -0.03750038146972656, -0.03247833251953125, -0.027456283569335938, -0.022434234619140625, -0.017412185668945312, -0.01239013671875, -0.0073680877685546875, -0.002346038818359375, 0.0026760101318359375, 0.00769805908203125, 0.012720108032226562, 0.017742156982421875, 0.022764205932617188, 0.0277862548828125, 0.03280830383300781, 0.037830352783203125, 0.04285240173339844, 0.04787445068359375, 0.05289649963378906, 0.057918548583984375, 0.06294059753417969, 0.067962646484375, 0.07298469543457031, 0.07800674438476562, 0.08302879333496094, 0.08805084228515625, 0.09307289123535156, 0.09809494018554688, 0.10311698913574219, 0.1081390380859375, 0.11316108703613281, 0.11818313598632812, 0.12320518493652344, 0.12822723388671875, 0.13324928283691406, 0.13827133178710938, 0.1432933807373047, 0.1483154296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 10.0, 6.0, 13.0, 13.0, 16.0, 22.0, 41.0, 53.0, 68.0, 65.0, 103.0, 133.0, 141.0, 220.0, 322.0, 376.0, 553.0, 768.0, 1121.0, 1712.0, 2643.0, 4193.0, 7551.0, 15571.0, 45142.0, 438701.0, 448323.0, 44697.0, 15725.0, 7576.0, 4258.0, 2601.0, 1701.0, 1156.0, 746.0, 560.0, 408.0, 302.0, 231.0, 170.0, 127.0, 108.0, 71.0, 65.0, 47.0, 32.0, 26.0, 20.0, 13.0, 10.0, 8.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0], "bins": [-0.047760009765625, -0.046312808990478516, -0.04486560821533203, -0.04341840744018555, -0.04197120666503906, -0.04052400588989258, -0.039076805114746094, -0.03762960433959961, -0.036182403564453125, -0.03473520278930664, -0.033288002014160156, -0.03184080123901367, -0.030393600463867188, -0.028946399688720703, -0.02749919891357422, -0.026051998138427734, -0.02460479736328125, -0.023157596588134766, -0.02171039581298828, -0.020263195037841797, -0.018815994262695312, -0.017368793487548828, -0.015921592712402344, -0.01447439193725586, -0.013027191162109375, -0.01157999038696289, -0.010132789611816406, -0.008685588836669922, -0.0072383880615234375, -0.005791187286376953, -0.004343986511230469, -0.0028967857360839844, -0.0014495849609375, -2.384185791015625e-06, 0.0014448165893554688, 0.002892017364501953, 0.0043392181396484375, 0.005786418914794922, 0.007233619689941406, 0.00868082046508789, 0.010128021240234375, 0.01157522201538086, 0.013022422790527344, 0.014469623565673828, 0.015916824340820312, 0.017364025115966797, 0.01881122589111328, 0.020258426666259766, 0.02170562744140625, 0.023152828216552734, 0.02460002899169922, 0.026047229766845703, 0.027494430541992188, 0.028941631317138672, 0.030388832092285156, 0.03183603286743164, 0.033283233642578125, 0.03473043441772461, 0.036177635192871094, 0.03762483596801758, 0.03907203674316406, 0.04051923751831055, 0.04196643829345703, 0.043413639068603516, 0.04486083984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 11.0, 7.0, 8.0, 6.0, 18.0, 11.0, 21.0, 20.0, 24.0, 67.0, 41.0, 39.0, 68.0, 54.0, 138.0, 67.0, 66.0, 56.0, 92.0, 30.0, 17.0, 19.0, 12.0, 26.0, 7.0, 9.0, 12.0, 15.0, 10.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.3115426301956177e-06, -2.2388994693756104e-06, -2.166256308555603e-06, -2.0936131477355957e-06, -2.0209699869155884e-06, -1.948326826095581e-06, -1.8756836652755737e-06, -1.8030405044555664e-06, -1.730397343635559e-06, -1.6577541828155518e-06, -1.5851110219955444e-06, -1.5124678611755371e-06, -1.4398247003555298e-06, -1.3671815395355225e-06, -1.2945383787155151e-06, -1.2218952178955078e-06, -1.1492520570755005e-06, -1.0766088962554932e-06, -1.0039657354354858e-06, -9.313225746154785e-07, -8.586794137954712e-07, -7.860362529754639e-07, -7.133930921554565e-07, -6.407499313354492e-07, -5.681067705154419e-07, -4.954636096954346e-07, -4.2282044887542725e-07, -3.501772880554199e-07, -2.775341272354126e-07, -2.0489096641540527e-07, -1.3224780559539795e-07, -5.960464477539063e-08, 1.30385160446167e-08, 8.568167686462402e-08, 1.5832483768463135e-07, 2.3096799850463867e-07, 3.03611159324646e-07, 3.762543201446533e-07, 4.4889748096466064e-07, 5.21540641784668e-07, 5.941838026046753e-07, 6.668269634246826e-07, 7.394701242446899e-07, 8.121132850646973e-07, 8.847564458847046e-07, 9.57399606704712e-07, 1.0300427675247192e-06, 1.1026859283447266e-06, 1.1753290891647339e-06, 1.2479722499847412e-06, 1.3206154108047485e-06, 1.3932585716247559e-06, 1.4659017324447632e-06, 1.5385448932647705e-06, 1.6111880540847778e-06, 1.6838312149047852e-06, 1.7564743757247925e-06, 1.8291175365447998e-06, 1.9017606973648071e-06, 1.9744038581848145e-06, 2.0470470190048218e-06, 2.119690179824829e-06, 2.1923333406448364e-06, 2.2649765014648438e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 6.0, 15.0, 7.0, 21.0, 28.0, 37.0, 36.0, 50.0, 70.0, 122.0, 142.0, 181.0, 284.0, 381.0, 536.0, 739.0, 936.0, 1275.0, 1737.0, 2509.0, 3422.0, 5068.0, 7616.0, 11575.0, 19850.0, 34829.0, 75192.0, 296157.0, 400982.0, 86285.0, 38169.0, 21082.0, 12696.0, 8088.0, 5219.0, 3705.0, 2523.0, 1853.0, 1351.0, 997.0, 753.0, 516.0, 423.0, 289.0, 246.0, 132.0, 146.0, 81.0, 66.0, 46.0, 27.0, 23.0, 17.0, 9.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.03460693359375, -0.03352785110473633, -0.032448768615722656, -0.031369686126708984, -0.030290603637695312, -0.02921152114868164, -0.02813243865966797, -0.027053356170654297, -0.025974273681640625, -0.024895191192626953, -0.02381610870361328, -0.02273702621459961, -0.021657943725585938, -0.020578861236572266, -0.019499778747558594, -0.018420696258544922, -0.01734161376953125, -0.016262531280517578, -0.015183448791503906, -0.014104366302490234, -0.013025283813476562, -0.01194620132446289, -0.010867118835449219, -0.009788036346435547, -0.008708953857421875, -0.007629871368408203, -0.006550788879394531, -0.005471706390380859, -0.0043926239013671875, -0.0033135414123535156, -0.0022344589233398438, -0.0011553764343261719, -7.62939453125e-05, 0.0010027885437011719, 0.0020818710327148438, 0.0031609535217285156, 0.0042400360107421875, 0.005319118499755859, 0.006398200988769531, 0.007477283477783203, 0.008556365966796875, 0.009635448455810547, 0.010714530944824219, 0.01179361343383789, 0.012872695922851562, 0.013951778411865234, 0.015030860900878906, 0.016109943389892578, 0.01718902587890625, 0.018268108367919922, 0.019347190856933594, 0.020426273345947266, 0.021505355834960938, 0.02258443832397461, 0.02366352081298828, 0.024742603302001953, 0.025821685791015625, 0.026900768280029297, 0.02797985076904297, 0.02905893325805664, 0.030138015747070312, 0.031217098236083984, 0.032296180725097656, 0.03337526321411133, 0.034454345703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 5.0, 4.0, 11.0, 10.0, 4.0, 21.0, 15.0, 19.0, 27.0, 34.0, 44.0, 76.0, 93.0, 169.0, 144.0, 77.0, 38.0, 52.0, 28.0, 25.0, 21.0, 16.0, 19.0, 15.0, 7.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0114593505859375, -0.01109933853149414, -0.010739326477050781, -0.010379314422607422, -0.010019302368164062, -0.009659290313720703, -0.009299278259277344, -0.008939266204833984, -0.008579254150390625, -0.008219242095947266, -0.007859230041503906, -0.007499217987060547, -0.0071392059326171875, -0.006779193878173828, -0.006419181823730469, -0.006059169769287109, -0.00569915771484375, -0.005339145660400391, -0.004979133605957031, -0.004619121551513672, -0.0042591094970703125, -0.003899097442626953, -0.0035390853881835938, -0.0031790733337402344, -0.002819061279296875, -0.0024590492248535156, -0.0020990371704101562, -0.0017390251159667969, -0.0013790130615234375, -0.0010190010070800781, -0.0006589889526367188, -0.0002989768981933594, 6.103515625e-05, 0.0004210472106933594, 0.0007810592651367188, 0.0011410713195800781, 0.0015010833740234375, 0.0018610954284667969, 0.0022211074829101562, 0.0025811195373535156, 0.002941131591796875, 0.0033011436462402344, 0.0036611557006835938, 0.004021167755126953, 0.0043811798095703125, 0.004741191864013672, 0.005101203918457031, 0.005461215972900391, 0.00582122802734375, 0.006181240081787109, 0.006541252136230469, 0.006901264190673828, 0.0072612762451171875, 0.007621288299560547, 0.007981300354003906, 0.008341312408447266, 0.008701324462890625, 0.009061336517333984, 0.009421348571777344, 0.009781360626220703, 0.010141372680664062, 0.010501384735107422, 0.010861396789550781, 0.01122140884399414, 0.0115814208984375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 12.0, 12.0, 12.0, 14.0, 27.0, 29.0, 38.0, 53.0, 61.0, 79.0, 113.0, 96.0, 99.0, 73.0, 56.0, 43.0, 40.0, 28.0, 19.0, 20.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.40748143196105957, -0.39656150341033936, -0.38564157485961914, -0.3747216761112213, -0.3638017475605011, -0.3528818190097809, -0.34196192026138306, -0.33104199171066284, -0.3201220631599426, -0.3092021346092224, -0.2982822060585022, -0.28736230731010437, -0.27644237875938416, -0.26552245020866394, -0.2546025514602661, -0.2436826229095459, -0.23276269435882568, -0.22184276580810547, -0.21092285215854645, -0.20000293850898743, -0.1890830099582672, -0.178163081407547, -0.16724316775798798, -0.15632325410842896, -0.14540332555770874, -0.13448339700698853, -0.1235634833574295, -0.11264356225728989, -0.10172364115715027, -0.09080372005701065, -0.07988379895687103, -0.06896387785673141, -0.058043986558914185, -0.04712406545877457, -0.03620414435863495, -0.02528422325849533, -0.014364302158355713, -0.003444381058216095, 0.007475540041923523, 0.01839546114206314, 0.02931538224220276, 0.04023530334234238, 0.051155224442481995, 0.06207514554262161, 0.07299506664276123, 0.08391498774290085, 0.09483490884304047, 0.10575482994318008, 0.1166747510433197, 0.12759467959403992, 0.13851459324359894, 0.14943450689315796, 0.16035443544387817, 0.1712743639945984, 0.1821942776441574, 0.19311419129371643, 0.20403411984443665, 0.21495404839515686, 0.22587396204471588, 0.2367938756942749, 0.24771380424499512, 0.25863373279571533, 0.26955366134643555, 0.2804735600948334, 0.2913934886455536]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 5.0, 1.0, 5.0, 10.0, 13.0, 7.0, 16.0, 18.0, 21.0, 22.0, 20.0, 29.0, 32.0, 20.0, 38.0, 25.0, 34.0, 36.0, 36.0, 37.0, 38.0, 35.0, 39.0, 33.0, 39.0, 36.0, 45.0, 38.0, 23.0, 23.0, 31.0, 30.0, 22.0, 20.0, 26.0, 13.0, 13.0, 8.0, 10.0, 10.0, 9.0, 11.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1973443478345871, -0.19091796875, -0.1844916045665741, -0.178065225481987, -0.1716388463973999, -0.1652124673128128, -0.1587860882282257, -0.1523597240447998, -0.1459333449602127, -0.1395069658756256, -0.1330806016921997, -0.1266542226076126, -0.12022784352302551, -0.11380146443843842, -0.10737509280443192, -0.10094872117042542, -0.09452234208583832, -0.08809596300125122, -0.08166959136724472, -0.07524321973323822, -0.06881684064865112, -0.062390465289354324, -0.055964089930057526, -0.04953771457076073, -0.04311133921146393, -0.03668496385216713, -0.03025858849287033, -0.023832213133573532, -0.017405837774276733, -0.010979462414979935, -0.004553087055683136, 0.0018732883036136627, 0.008299678564071655, 0.014726053923368454, 0.021152429282665253, 0.02757880464196205, 0.03400518000125885, 0.04043155536055565, 0.04685793071985245, 0.053284306079149246, 0.059710681438446045, 0.06613706052303314, 0.07256343215703964, 0.07898980379104614, 0.08541618287563324, 0.09184256196022034, 0.09826893359422684, 0.10469530522823334, 0.11112168431282043, 0.11754806339740753, 0.12397443503141403, 0.13040080666542053, 0.13682718575000763, 0.14325356483459473, 0.14967992901802063, 0.15610630810260773, 0.16253268718719482, 0.16895906627178192, 0.17538544535636902, 0.18181180953979492, 0.18823818862438202, 0.19466456770896912, 0.20109093189239502, 0.20751731097698212, 0.2139436900615692]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 6.0, 9.0, 12.0, 19.0, 20.0, 32.0, 49.0, 75.0, 110.0, 141.0, 196.0, 289.0, 387.0, 678.0, 880.0, 1312.0, 2022.0, 3046.0, 4763.0, 7119.0, 11000.0, 17654.0, 27817.0, 44829.0, 76776.0, 140441.0, 244609.0, 199076.0, 106098.0, 59695.0, 36057.0, 22462.0, 14215.0, 9056.0, 5911.0, 3867.0, 2564.0, 1663.0, 1140.0, 779.0, 555.0, 359.0, 228.0, 159.0, 120.0, 93.0, 50.0, 46.0, 23.0, 13.0, 14.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.376953125, -0.3647041320800781, -0.35245513916015625, -0.3402061462402344, -0.3279571533203125, -0.3157081604003906, -0.30345916748046875, -0.2912101745605469, -0.278961181640625, -0.2667121887207031, -0.25446319580078125, -0.24221420288085938, -0.2299652099609375, -0.21771621704101562, -0.20546722412109375, -0.19321823120117188, -0.18096923828125, -0.16872024536132812, -0.15647125244140625, -0.14422225952148438, -0.1319732666015625, -0.11972427368164062, -0.10747528076171875, -0.09522628784179688, -0.082977294921875, -0.07072830200195312, -0.05847930908203125, -0.046230316162109375, -0.0339813232421875, -0.021732330322265625, -0.00948333740234375, 0.002765655517578125, 0.0150146484375, 0.027263641357421875, 0.03951263427734375, 0.051761627197265625, 0.0640106201171875, 0.07625961303710938, 0.08850860595703125, 0.10075759887695312, 0.113006591796875, 0.12525558471679688, 0.13750457763671875, 0.14975357055664062, 0.1620025634765625, 0.17425155639648438, 0.18650054931640625, 0.19874954223632812, 0.21099853515625, 0.22324752807617188, 0.23549652099609375, 0.24774551391601562, 0.2599945068359375, 0.2722434997558594, 0.28449249267578125, 0.2967414855957031, 0.308990478515625, 0.3212394714355469, 0.33348846435546875, 0.3457374572753906, 0.3579864501953125, 0.3702354431152344, 0.38248443603515625, 0.3947334289550781, 0.406982421875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 2.0, 17.0, 15.0, 17.0, 25.0, 12.0, 32.0, 30.0, 28.0, 34.0, 37.0, 39.0, 24.0, 42.0, 37.0, 39.0, 35.0, 45.0, 50.0, 37.0, 49.0, 38.0, 37.0, 27.0, 23.0, 26.0, 30.0, 22.0, 25.0, 15.0, 14.0, 22.0, 17.0, 5.0, 9.0, 6.0, 4.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20458984375, -0.19836807250976562, -0.19214630126953125, -0.18592453002929688, -0.1797027587890625, -0.17348098754882812, -0.16725921630859375, -0.16103744506835938, -0.154815673828125, -0.14859390258789062, -0.14237213134765625, -0.13615036010742188, -0.1299285888671875, -0.12370681762695312, -0.11748504638671875, -0.11126327514648438, -0.10504150390625, -0.09881973266601562, -0.09259796142578125, -0.08637619018554688, -0.0801544189453125, -0.07393264770507812, -0.06771087646484375, -0.061489105224609375, -0.055267333984375, -0.049045562744140625, -0.04282379150390625, -0.036602020263671875, -0.0303802490234375, -0.024158477783203125, -0.01793670654296875, -0.011714935302734375, -0.0054931640625, 0.000728607177734375, 0.00695037841796875, 0.013172149658203125, 0.0193939208984375, 0.025615692138671875, 0.03183746337890625, 0.038059234619140625, 0.044281005859375, 0.050502777099609375, 0.05672454833984375, 0.06294631958007812, 0.0691680908203125, 0.07538986206054688, 0.08161163330078125, 0.08783340454101562, 0.09405517578125, 0.10027694702148438, 0.10649871826171875, 0.11272048950195312, 0.1189422607421875, 0.12516403198242188, 0.13138580322265625, 0.13760757446289062, 0.143829345703125, 0.15005111694335938, 0.15627288818359375, 0.16249465942382812, 0.1687164306640625, 0.17493820190429688, 0.18115997314453125, 0.18738174438476562, 0.193603515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 11.0, 17.0, 23.0, 31.0, 55.0, 86.0, 124.0, 182.0, 255.0, 399.0, 620.0, 946.0, 1495.0, 2294.0, 3725.0, 5830.0, 9652.0, 16596.0, 28929.0, 52298.0, 98119.0, 202300.0, 300450.0, 149071.0, 76058.0, 40976.0, 23014.0, 13598.0, 8025.0, 4774.0, 3017.0, 1984.0, 1232.0, 814.0, 510.0, 334.0, 259.0, 153.0, 104.0, 68.0, 35.0, 28.0, 22.0, 13.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.47119140625, -0.45660400390625, -0.4420166015625, -0.42742919921875, -0.412841796875, -0.39825439453125, -0.3836669921875, -0.36907958984375, -0.3544921875, -0.33990478515625, -0.3253173828125, -0.31072998046875, -0.296142578125, -0.28155517578125, -0.2669677734375, -0.25238037109375, -0.23779296875, -0.22320556640625, -0.2086181640625, -0.19403076171875, -0.179443359375, -0.16485595703125, -0.1502685546875, -0.13568115234375, -0.12109375, -0.10650634765625, -0.0919189453125, -0.07733154296875, -0.062744140625, -0.04815673828125, -0.0335693359375, -0.01898193359375, -0.00439453125, 0.01019287109375, 0.0247802734375, 0.03936767578125, 0.053955078125, 0.06854248046875, 0.0831298828125, 0.09771728515625, 0.1123046875, 0.12689208984375, 0.1414794921875, 0.15606689453125, 0.170654296875, 0.18524169921875, 0.1998291015625, 0.21441650390625, 0.22900390625, 0.24359130859375, 0.2581787109375, 0.27276611328125, 0.287353515625, 0.30194091796875, 0.3165283203125, 0.33111572265625, 0.345703125, 0.36029052734375, 0.3748779296875, 0.38946533203125, 0.404052734375, 0.41864013671875, 0.4332275390625, 0.44781494140625, 0.46240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 8.0, 12.0, 10.0, 11.0, 24.0, 23.0, 22.0, 21.0, 30.0, 26.0, 31.0, 37.0, 44.0, 40.0, 29.0, 51.0, 47.0, 43.0, 33.0, 45.0, 30.0, 31.0, 41.0, 33.0, 31.0, 36.0, 26.0, 26.0, 28.0, 15.0, 16.0, 12.0, 11.0, 12.0, 16.0, 10.0, 6.0, 8.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.141357421875, -0.13730430603027344, -0.13325119018554688, -0.1291980743408203, -0.12514495849609375, -0.12109184265136719, -0.11703872680664062, -0.11298561096191406, -0.1089324951171875, -0.10487937927246094, -0.10082626342773438, -0.09677314758300781, -0.09272003173828125, -0.08866691589355469, -0.08461380004882812, -0.08056068420410156, -0.076507568359375, -0.07245445251464844, -0.06840133666992188, -0.06434822082519531, -0.06029510498046875, -0.05624198913574219, -0.052188873291015625, -0.04813575744628906, -0.0440826416015625, -0.04002952575683594, -0.035976409912109375, -0.03192329406738281, -0.02787017822265625, -0.023817062377929688, -0.019763946533203125, -0.015710830688476562, -0.01165771484375, -0.0076045989990234375, -0.003551483154296875, 0.0005016326904296875, 0.00455474853515625, 0.008607864379882812, 0.012660980224609375, 0.016714096069335938, 0.0207672119140625, 0.024820327758789062, 0.028873443603515625, 0.03292655944824219, 0.03697967529296875, 0.04103279113769531, 0.045085906982421875, 0.04913902282714844, 0.053192138671875, 0.05724525451660156, 0.061298370361328125, 0.06535148620605469, 0.06940460205078125, 0.07345771789550781, 0.07751083374023438, 0.08156394958496094, 0.0856170654296875, 0.08967018127441406, 0.09372329711914062, 0.09777641296386719, 0.10182952880859375, 0.10588264465332031, 0.10993576049804688, 0.11398887634277344, 0.1180419921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 10.0, 11.0, 19.0, 19.0, 30.0, 43.0, 50.0, 68.0, 84.0, 130.0, 125.0, 177.0, 229.0, 300.0, 399.0, 483.0, 591.0, 767.0, 1030.0, 1289.0, 1946.0, 3047.0, 5493.0, 13517.0, 89203.0, 883030.0, 25379.0, 8133.0, 3862.0, 2363.0, 1543.0, 1163.0, 911.0, 644.0, 556.0, 414.0, 342.0, 266.0, 216.0, 149.0, 124.0, 105.0, 71.0, 56.0, 46.0, 35.0, 15.0, 15.0, 16.0, 9.0, 9.0, 11.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.1900634765625, -0.18416786193847656, -0.17827224731445312, -0.1723766326904297, -0.16648101806640625, -0.1605854034423828, -0.15468978881835938, -0.14879417419433594, -0.1428985595703125, -0.13700294494628906, -0.13110733032226562, -0.1252117156982422, -0.11931610107421875, -0.11342048645019531, -0.10752487182617188, -0.10162925720214844, -0.095733642578125, -0.08983802795410156, -0.08394241333007812, -0.07804679870605469, -0.07215118408203125, -0.06625556945800781, -0.060359954833984375, -0.05446434020996094, -0.0485687255859375, -0.04267311096191406, -0.036777496337890625, -0.030881881713867188, -0.02498626708984375, -0.019090652465820312, -0.013195037841796875, -0.0072994232177734375, -0.00140380859375, 0.0044918060302734375, 0.010387420654296875, 0.016283035278320312, 0.02217864990234375, 0.028074264526367188, 0.033969879150390625, 0.03986549377441406, 0.0457611083984375, 0.05165672302246094, 0.057552337646484375, 0.06344795227050781, 0.06934356689453125, 0.07523918151855469, 0.08113479614257812, 0.08703041076660156, 0.092926025390625, 0.09882164001464844, 0.10471725463867188, 0.11061286926269531, 0.11650848388671875, 0.12240409851074219, 0.12829971313476562, 0.13419532775878906, 0.1400909423828125, 0.14598655700683594, 0.15188217163085938, 0.1577777862548828, 0.16367340087890625, 0.1695690155029297, 0.17546463012695312, 0.18136024475097656, 0.187255859375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 6.0, 9.0, 20.0, 22.0, 48.0, 106.0, 220.0, 263.0, 134.0, 38.0, 54.0, 27.0, 10.0, 12.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.268732249736786e-06, -6.100162863731384e-06, -5.931593477725983e-06, -5.763024091720581e-06, -5.5944547057151794e-06, -5.425885319709778e-06, -5.257315933704376e-06, -5.088746547698975e-06, -4.920177161693573e-06, -4.751607775688171e-06, -4.58303838968277e-06, -4.414469003677368e-06, -4.2458996176719666e-06, -4.077330231666565e-06, -3.908760845661163e-06, -3.7401914596557617e-06, -3.57162207365036e-06, -3.4030526876449585e-06, -3.234483301639557e-06, -3.0659139156341553e-06, -2.8973445296287537e-06, -2.728775143623352e-06, -2.5602057576179504e-06, -2.391636371612549e-06, -2.2230669856071472e-06, -2.0544975996017456e-06, -1.885928213596344e-06, -1.7173588275909424e-06, -1.5487894415855408e-06, -1.3802200555801392e-06, -1.2116506695747375e-06, -1.043081283569336e-06, -8.745118975639343e-07, -7.059425115585327e-07, -5.373731255531311e-07, -3.688037395477295e-07, -2.0023435354232788e-07, -3.166496753692627e-08, 1.3690441846847534e-07, 3.0547380447387695e-07, 4.7404319047927856e-07, 6.426125764846802e-07, 8.111819624900818e-07, 9.797513484954834e-07, 1.148320734500885e-06, 1.3168901205062866e-06, 1.4854595065116882e-06, 1.6540288925170898e-06, 1.8225982785224915e-06, 1.991167664527893e-06, 2.1597370505332947e-06, 2.3283064365386963e-06, 2.496875822544098e-06, 2.6654452085494995e-06, 2.834014594554901e-06, 3.0025839805603027e-06, 3.1711533665657043e-06, 3.339722752571106e-06, 3.5082921385765076e-06, 3.676861524581909e-06, 3.845430910587311e-06, 4.014000296592712e-06, 4.182569682598114e-06, 4.351139068603516e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 3.0, 2.0, 4.0, 18.0, 11.0, 22.0, 34.0, 47.0, 70.0, 91.0, 140.0, 168.0, 271.0, 390.0, 496.0, 742.0, 1100.0, 1577.0, 2488.0, 4606.0, 11267.0, 58059.0, 913224.0, 34190.0, 8717.0, 3801.0, 2276.0, 1416.0, 996.0, 661.0, 488.0, 337.0, 246.0, 178.0, 116.0, 84.0, 58.0, 50.0, 27.0, 24.0, 15.0, 6.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.229248046875, -0.22276878356933594, -0.21628952026367188, -0.2098102569580078, -0.20333099365234375, -0.1968517303466797, -0.19037246704101562, -0.18389320373535156, -0.1774139404296875, -0.17093467712402344, -0.16445541381835938, -0.1579761505126953, -0.15149688720703125, -0.1450176239013672, -0.13853836059570312, -0.13205909729003906, -0.125579833984375, -0.11910057067871094, -0.11262130737304688, -0.10614204406738281, -0.09966278076171875, -0.09318351745605469, -0.08670425415039062, -0.08022499084472656, -0.0737457275390625, -0.06726646423339844, -0.060787200927734375, -0.05430793762207031, -0.04782867431640625, -0.04134941101074219, -0.034870147705078125, -0.028390884399414062, -0.02191162109375, -0.015432357788085938, -0.008953094482421875, -0.0024738311767578125, 0.00400543212890625, 0.010484695434570312, 0.016963958740234375, 0.023443222045898438, 0.0299224853515625, 0.03640174865722656, 0.042881011962890625, 0.04936027526855469, 0.05583953857421875, 0.06231880187988281, 0.06879806518554688, 0.07527732849121094, 0.081756591796875, 0.08823585510253906, 0.09471511840820312, 0.10119438171386719, 0.10767364501953125, 0.11415290832519531, 0.12063217163085938, 0.12711143493652344, 0.1335906982421875, 0.14006996154785156, 0.14654922485351562, 0.1530284881591797, 0.15950775146484375, 0.1659870147705078, 0.17246627807617188, 0.17894554138183594, 0.1854248046875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 11.0, 15.0, 33.0, 165.0, 568.0, 97.0, 29.0, 27.0, 13.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044830322265625, -0.043062686920166016, -0.04129505157470703, -0.03952741622924805, -0.03775978088378906, -0.03599214553833008, -0.034224510192871094, -0.03245687484741211, -0.030689239501953125, -0.02892160415649414, -0.027153968811035156, -0.025386333465576172, -0.023618698120117188, -0.021851062774658203, -0.02008342742919922, -0.018315792083740234, -0.01654815673828125, -0.014780521392822266, -0.013012886047363281, -0.011245250701904297, -0.009477615356445312, -0.007709980010986328, -0.005942344665527344, -0.004174709320068359, -0.002407073974609375, -0.0006394386291503906, 0.0011281967163085938, 0.002895832061767578, 0.0046634674072265625, 0.006431102752685547, 0.008198738098144531, 0.009966373443603516, 0.0117340087890625, 0.013501644134521484, 0.015269279479980469, 0.017036914825439453, 0.018804550170898438, 0.020572185516357422, 0.022339820861816406, 0.02410745620727539, 0.025875091552734375, 0.02764272689819336, 0.029410362243652344, 0.031177997589111328, 0.03294563293457031, 0.0347132682800293, 0.03648090362548828, 0.038248538970947266, 0.04001617431640625, 0.041783809661865234, 0.04355144500732422, 0.0453190803527832, 0.04708671569824219, 0.04885435104370117, 0.050621986389160156, 0.05238962173461914, 0.054157257080078125, 0.05592489242553711, 0.057692527770996094, 0.05946016311645508, 0.06122779846191406, 0.06299543380737305, 0.06476306915283203, 0.06653070449829102, 0.06829833984375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 9.0, 13.0, 16.0, 19.0, 26.0, 33.0, 46.0, 57.0, 96.0, 122.0, 137.0, 96.0, 90.0, 68.0, 39.0, 31.0, 27.0, 12.0, 15.0, 8.0, 12.0, 9.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.47175055742263794, -0.4594736099243164, -0.44719669222831726, -0.4349197447299957, -0.4226428270339966, -0.41036587953567505, -0.3980889320373535, -0.38581201434135437, -0.3735350966453552, -0.3612581491470337, -0.34898123145103455, -0.336704283952713, -0.32442736625671387, -0.31215041875839233, -0.2998734712600708, -0.28759655356407166, -0.2753196060657501, -0.2630426585674286, -0.25076574087142944, -0.2384887933731079, -0.22621187567710876, -0.21393492817878723, -0.2016579955816269, -0.18938106298446655, -0.1771041303873062, -0.16482719779014587, -0.15255026519298553, -0.1402733325958252, -0.12799638509750366, -0.11571945995092392, -0.10344251990318298, -0.09116558730602264, -0.07888862490653992, -0.06661169230937958, -0.05433475598692894, -0.0420578196644783, -0.029780887067317963, -0.017503954470157623, -0.005227014422416687, 0.007049918174743652, 0.01932685077190399, 0.03160378336906433, 0.04388071969151497, 0.05615765601396561, 0.06843458861112595, 0.08071152120828629, 0.09298846125602722, 0.10526539385318756, 0.1175423264503479, 0.12981925904750824, 0.14209619164466858, 0.1543731391429901, 0.16665005683898926, 0.1789270043373108, 0.19120393693447113, 0.20348086953163147, 0.2157578021287918, 0.22803473472595215, 0.2403116673231125, 0.2525885999202728, 0.26486554741859436, 0.2771424651145935, 0.28941941261291504, 0.3016963601112366, 0.3139732778072357]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 13.0, 12.0, 9.0, 16.0, 11.0, 17.0, 22.0, 19.0, 24.0, 30.0, 19.0, 40.0, 23.0, 29.0, 39.0, 29.0, 34.0, 34.0, 43.0, 43.0, 37.0, 40.0, 29.0, 34.0, 38.0, 29.0, 24.0, 26.0, 35.0, 28.0, 18.0, 20.0, 18.0, 16.0, 16.0, 8.0, 9.0, 16.0, 7.0, 6.0, 8.0, 6.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.18892674148082733, -0.18307974934577942, -0.1772327721118927, -0.1713857799768448, -0.16553878784179688, -0.15969179570674896, -0.15384481847286224, -0.14799782633781433, -0.14215083420276642, -0.1363038420677185, -0.1304568648338318, -0.12460987269878387, -0.11876288056373596, -0.11291589587926865, -0.10706891119480133, -0.10122191905975342, -0.0953749343752861, -0.08952794969081879, -0.08368095755577087, -0.07783397287130356, -0.07198698073625565, -0.06613999605178833, -0.060293007642030716, -0.0544460192322731, -0.04859903082251549, -0.042752042412757874, -0.03690505400300026, -0.031058067455887794, -0.02521107904613018, -0.019364090636372566, -0.013517104089260101, -0.007670115679502487, -0.001823127269744873, 0.004023860674351454, 0.00987084861844778, 0.01571783609688282, 0.021564824506640434, 0.02741181291639805, 0.03325879946351051, 0.03910578787326813, 0.04495277628302574, 0.050799764692783356, 0.05664675310254097, 0.062493741512298584, 0.0683407261967659, 0.07418771833181381, 0.08003470301628113, 0.08588169515132904, 0.09172867983579636, 0.09757566452026367, 0.10342265665531158, 0.1092696413397789, 0.11511663347482681, 0.12096361815929413, 0.12681061029434204, 0.13265758752822876, 0.13850457966327667, 0.14435157179832458, 0.1501985490322113, 0.15604554116725922, 0.16189253330230713, 0.16773952543735504, 0.17358650267124176, 0.17943349480628967, 0.18528048694133759]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 9.0, 21.0, 14.0, 24.0, 42.0, 84.0, 112.0, 182.0, 341.0, 580.0, 895.0, 1502.0, 2774.0, 4832.0, 8701.0, 15818.0, 28548.0, 54795.0, 111608.0, 258886.0, 1063407.0, 1906032.0, 428425.0, 152746.0, 72556.0, 37045.0, 19593.0, 10696.0, 5990.0, 3329.0, 1860.0, 1112.0, 655.0, 400.0, 252.0, 153.0, 98.0, 57.0, 30.0, 31.0, 19.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.348876953125, -0.33769989013671875, -0.3265228271484375, -0.31534576416015625, -0.304168701171875, -0.29299163818359375, -0.2818145751953125, -0.27063751220703125, -0.25946044921875, -0.24828338623046875, -0.2371063232421875, -0.22592926025390625, -0.214752197265625, -0.20357513427734375, -0.1923980712890625, -0.18122100830078125, -0.1700439453125, -0.15886688232421875, -0.1476898193359375, -0.13651275634765625, -0.125335693359375, -0.11415863037109375, -0.1029815673828125, -0.09180450439453125, -0.08062744140625, -0.06945037841796875, -0.0582733154296875, -0.04709625244140625, -0.035919189453125, -0.02474212646484375, -0.0135650634765625, -0.00238800048828125, 0.0087890625, 0.01996612548828125, 0.0311431884765625, 0.04232025146484375, 0.053497314453125, 0.06467437744140625, 0.0758514404296875, 0.08702850341796875, 0.09820556640625, 0.10938262939453125, 0.1205596923828125, 0.13173675537109375, 0.142913818359375, 0.15409088134765625, 0.1652679443359375, 0.17644500732421875, 0.1876220703125, 0.19879913330078125, 0.2099761962890625, 0.22115325927734375, 0.232330322265625, 0.24350738525390625, 0.2546844482421875, 0.26586151123046875, 0.27703857421875, 0.28821563720703125, 0.2993927001953125, 0.31056976318359375, 0.321746826171875, 0.33292388916015625, 0.3441009521484375, 0.35527801513671875, 0.366455078125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 9.0, 9.0, 10.0, 16.0, 17.0, 18.0, 28.0, 21.0, 28.0, 27.0, 27.0, 35.0, 29.0, 48.0, 41.0, 36.0, 37.0, 52.0, 52.0, 48.0, 30.0, 27.0, 40.0, 28.0, 39.0, 32.0, 30.0, 28.0, 24.0, 16.0, 15.0, 12.0, 9.0, 12.0, 6.0, 8.0, 9.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11969661712646484, -0.11579704284667969, -0.11189746856689453, -0.10799789428710938, -0.10409832000732422, -0.10019874572753906, -0.0962991714477539, -0.09239959716796875, -0.0885000228881836, -0.08460044860839844, -0.08070087432861328, -0.07680130004882812, -0.07290172576904297, -0.06900215148925781, -0.06510257720947266, -0.0612030029296875, -0.057303428649902344, -0.05340385437011719, -0.04950428009033203, -0.045604705810546875, -0.04170513153076172, -0.03780555725097656, -0.033905982971191406, -0.03000640869140625, -0.026106834411621094, -0.022207260131835938, -0.01830768585205078, -0.014408111572265625, -0.010508537292480469, -0.0066089630126953125, -0.0027093887329101562, 0.001190185546875, 0.005089759826660156, 0.008989334106445312, 0.012888908386230469, 0.016788482666015625, 0.02068805694580078, 0.024587631225585938, 0.028487205505371094, 0.03238677978515625, 0.036286354064941406, 0.04018592834472656, 0.04408550262451172, 0.047985076904296875, 0.05188465118408203, 0.05578422546386719, 0.059683799743652344, 0.0635833740234375, 0.06748294830322266, 0.07138252258300781, 0.07528209686279297, 0.07918167114257812, 0.08308124542236328, 0.08698081970214844, 0.0908803939819336, 0.09477996826171875, 0.0986795425415039, 0.10257911682128906, 0.10647869110107422, 0.11037826538085938, 0.11427783966064453, 0.11817741394042969, 0.12207698822021484, 0.1259765625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 8.0, 25.0, 38.0, 51.0, 70.0, 120.0, 189.0, 265.0, 428.0, 680.0, 1062.0, 1629.0, 2607.0, 4390.0, 6937.0, 11243.0, 18688.0, 30546.0, 51923.0, 89001.0, 161611.0, 324367.0, 775059.0, 1478991.0, 623213.0, 274372.0, 141483.0, 78714.0, 45372.0, 27523.0, 16643.0, 10335.0, 6258.0, 3871.0, 2515.0, 1489.0, 907.0, 607.0, 408.0, 229.0, 136.0, 100.0, 58.0, 44.0, 20.0, 13.0, 14.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0], "bins": [-0.230224609375, -0.22352981567382812, -0.21683502197265625, -0.21014022827148438, -0.2034454345703125, -0.19675064086914062, -0.19005584716796875, -0.18336105346679688, -0.176666259765625, -0.16997146606445312, -0.16327667236328125, -0.15658187866210938, -0.1498870849609375, -0.14319229125976562, -0.13649749755859375, -0.12980270385742188, -0.12310791015625, -0.11641311645507812, -0.10971832275390625, -0.10302352905273438, -0.0963287353515625, -0.08963394165039062, -0.08293914794921875, -0.07624435424804688, -0.069549560546875, -0.06285476684570312, -0.05615997314453125, -0.049465179443359375, -0.0427703857421875, -0.036075592041015625, -0.02938079833984375, -0.022686004638671875, -0.0159912109375, -0.009296417236328125, -0.00260162353515625, 0.004093170166015625, 0.0107879638671875, 0.017482757568359375, 0.02417755126953125, 0.030872344970703125, 0.037567138671875, 0.044261932373046875, 0.05095672607421875, 0.057651519775390625, 0.0643463134765625, 0.07104110717773438, 0.07773590087890625, 0.08443069458007812, 0.09112548828125, 0.09782028198242188, 0.10451507568359375, 0.11120986938476562, 0.1179046630859375, 0.12459945678710938, 0.13129425048828125, 0.13798904418945312, 0.144683837890625, 0.15137863159179688, 0.15807342529296875, 0.16476821899414062, 0.1714630126953125, 0.17815780639648438, 0.18485260009765625, 0.19154739379882812, 0.1982421875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 8.0, 13.0, 23.0, 23.0, 34.0, 42.0, 41.0, 53.0, 74.0, 90.0, 94.0, 110.0, 125.0, 159.0, 181.0, 244.0, 243.0, 309.0, 336.0, 313.0, 278.0, 218.0, 191.0, 170.0, 138.0, 83.0, 72.0, 85.0, 67.0, 66.0, 50.0, 41.0, 28.0, 20.0, 14.0, 11.0, 4.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0704345703125, -0.0681314468383789, -0.06582832336425781, -0.06352519989013672, -0.061222076416015625, -0.05891895294189453, -0.05661582946777344, -0.054312705993652344, -0.05200958251953125, -0.049706459045410156, -0.04740333557128906, -0.04510021209716797, -0.042797088623046875, -0.04049396514892578, -0.03819084167480469, -0.035887718200683594, -0.0335845947265625, -0.031281471252441406, -0.028978347778320312, -0.02667522430419922, -0.024372100830078125, -0.02206897735595703, -0.019765853881835938, -0.017462730407714844, -0.01515960693359375, -0.012856483459472656, -0.010553359985351562, -0.008250236511230469, -0.005947113037109375, -0.0036439895629882812, -0.0013408660888671875, 0.0009622573852539062, 0.003265380859375, 0.005568504333496094, 0.007871627807617188, 0.010174751281738281, 0.012477874755859375, 0.014780998229980469, 0.017084121704101562, 0.019387245178222656, 0.02169036865234375, 0.023993492126464844, 0.026296615600585938, 0.02859973907470703, 0.030902862548828125, 0.03320598602294922, 0.03550910949707031, 0.037812232971191406, 0.0401153564453125, 0.042418479919433594, 0.04472160339355469, 0.04702472686767578, 0.049327850341796875, 0.05163097381591797, 0.05393409729003906, 0.056237220764160156, 0.05854034423828125, 0.060843467712402344, 0.06314659118652344, 0.06544971466064453, 0.06775283813476562, 0.07005596160888672, 0.07235908508300781, 0.0746622085571289, 0.07696533203125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 15.0, 9.0, 17.0, 20.0, 27.0, 30.0, 37.0, 66.0, 82.0, 79.0, 130.0, 103.0, 78.0, 66.0, 55.0, 39.0, 23.0, 21.0, 18.0, 18.0, 11.0, 7.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19987991452217102, -0.19294939935207367, -0.18601888418197632, -0.17908836901187897, -0.17215785384178162, -0.16522735357284546, -0.1582968384027481, -0.15136632323265076, -0.1444358080625534, -0.13750529289245605, -0.1305747777223587, -0.12364427000284195, -0.1167137548327446, -0.10978323966264725, -0.1028527319431305, -0.09592221677303314, -0.08899170160293579, -0.08206118643283844, -0.07513067126274109, -0.06820016354322433, -0.061269648373126984, -0.05433913320302963, -0.04740862175822258, -0.04047811031341553, -0.033547595143318176, -0.026617081835865974, -0.019686568528413773, -0.01275605522096157, -0.005825541913509369, 0.0011049732565879822, 0.008035484701395035, 0.014965996146202087, 0.02189651131629944, 0.02882702462375164, 0.03575753793120384, 0.042688049376010895, 0.049618564546108246, 0.0565490797162056, 0.06347958743572235, 0.0704101026058197, 0.07734061777591705, 0.0842711329460144, 0.09120164811611176, 0.09813215583562851, 0.10506267100572586, 0.11199318617582321, 0.11892369389533997, 0.12585420906543732, 0.13278472423553467, 0.13971523940563202, 0.14664575457572937, 0.15357626974582672, 0.16050678491592407, 0.16743728518486023, 0.17436780035495758, 0.18129831552505493, 0.18822883069515228, 0.19515934586524963, 0.20208986103534698, 0.20902037620544434, 0.2159508764743805, 0.22288140654563904, 0.2298119068145752, 0.23674242198467255, 0.2436729371547699]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 6.0, 9.0, 10.0, 8.0, 20.0, 11.0, 17.0, 26.0, 19.0, 28.0, 18.0, 26.0, 36.0, 38.0, 41.0, 38.0, 37.0, 34.0, 38.0, 37.0, 37.0, 37.0, 43.0, 33.0, 34.0, 31.0, 33.0, 30.0, 27.0, 31.0, 25.0, 17.0, 22.0, 14.0, 10.0, 17.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 8.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.13533739745616913, -0.1312183290719986, -0.12709924578666687, -0.12298017740249634, -0.1188611090183258, -0.11474203318357468, -0.11062295734882355, -0.10650388896465302, -0.10238481312990189, -0.09826573729515076, -0.09414666891098022, -0.0900275930762291, -0.08590851724147797, -0.08178944885730743, -0.0776703730225563, -0.07355129718780518, -0.06943222880363464, -0.06531315296888351, -0.06119408458471298, -0.05707500874996185, -0.05295593664050102, -0.04883686453104019, -0.04471778869628906, -0.04059871658682823, -0.0364796444773674, -0.03236057236790657, -0.02824149839580059, -0.02412242442369461, -0.02000335231423378, -0.01588428020477295, -0.01176520623266697, -0.007646132260560989, -0.003527045249938965, 0.0005920277908444405, 0.004711100831627846, 0.008830173872411251, 0.012949246913194656, 0.017068319022655487, 0.021187392994761467, 0.025306466966867447, 0.029425539076328278, 0.03354461118578911, 0.03766368329524994, 0.04178275913000107, 0.0459018312394619, 0.05002090334892273, 0.05413997918367386, 0.05825905129313469, 0.06237812340259552, 0.06649719923734665, 0.07061626762151718, 0.07473534345626831, 0.07885441184043884, 0.08297348767518997, 0.0870925635099411, 0.09121163189411163, 0.09533070772886276, 0.09944978356361389, 0.10356885194778442, 0.10768792778253555, 0.11180700361728668, 0.11592607200145721, 0.12004514783620834, 0.12416422367095947, 0.12828329205513]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 7.0, 7.0, 14.0, 12.0, 20.0, 43.0, 71.0, 111.0, 177.0, 281.0, 367.0, 644.0, 1000.0, 1630.0, 2538.0, 4170.0, 6904.0, 11173.0, 19670.0, 35993.0, 70141.0, 160563.0, 390267.0, 177708.0, 75080.0, 38474.0, 20715.0, 11970.0, 7206.0, 4518.0, 2668.0, 1625.0, 1030.0, 632.0, 404.0, 274.0, 152.0, 96.0, 63.0, 49.0, 24.0, 22.0, 18.0, 7.0, 6.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1339111328125, -0.1293792724609375, -0.124847412109375, -0.1203155517578125, -0.11578369140625, -0.1112518310546875, -0.106719970703125, -0.1021881103515625, -0.09765625, -0.0931243896484375, -0.088592529296875, -0.0840606689453125, -0.07952880859375, -0.0749969482421875, -0.070465087890625, -0.0659332275390625, -0.0614013671875, -0.0568695068359375, -0.052337646484375, -0.0478057861328125, -0.04327392578125, -0.0387420654296875, -0.034210205078125, -0.0296783447265625, -0.025146484375, -0.0206146240234375, -0.016082763671875, -0.0115509033203125, -0.00701904296875, -0.0024871826171875, 0.002044677734375, 0.0065765380859375, 0.0111083984375, 0.0156402587890625, 0.020172119140625, 0.0247039794921875, 0.02923583984375, 0.0337677001953125, 0.038299560546875, 0.0428314208984375, 0.04736328125, 0.0518951416015625, 0.056427001953125, 0.0609588623046875, 0.06549072265625, 0.0700225830078125, 0.074554443359375, 0.0790863037109375, 0.0836181640625, 0.0881500244140625, 0.092681884765625, 0.0972137451171875, 0.10174560546875, 0.1062774658203125, 0.110809326171875, 0.1153411865234375, 0.119873046875, 0.1244049072265625, 0.128936767578125, 0.1334686279296875, 0.13800048828125, 0.1425323486328125, 0.147064208984375, 0.1515960693359375, 0.1561279296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 3.0, 4.0, 4.0, 16.0, 5.0, 12.0, 17.0, 16.0, 16.0, 25.0, 21.0, 15.0, 22.0, 34.0, 29.0, 43.0, 42.0, 39.0, 37.0, 45.0, 48.0, 43.0, 32.0, 52.0, 48.0, 37.0, 32.0, 30.0, 32.0, 26.0, 28.0, 29.0, 22.0, 19.0, 12.0, 12.0, 11.0, 11.0, 7.0, 8.0, 6.0, 1.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.15966796875, -0.1551361083984375, -0.150604248046875, -0.1460723876953125, -0.14154052734375, -0.1370086669921875, -0.132476806640625, -0.1279449462890625, -0.1234130859375, -0.1188812255859375, -0.114349365234375, -0.1098175048828125, -0.10528564453125, -0.1007537841796875, -0.096221923828125, -0.0916900634765625, -0.087158203125, -0.0826263427734375, -0.078094482421875, -0.0735626220703125, -0.06903076171875, -0.0644989013671875, -0.059967041015625, -0.0554351806640625, -0.0509033203125, -0.0463714599609375, -0.041839599609375, -0.0373077392578125, -0.03277587890625, -0.0282440185546875, -0.023712158203125, -0.0191802978515625, -0.0146484375, -0.0101165771484375, -0.005584716796875, -0.0010528564453125, 0.00347900390625, 0.0080108642578125, 0.012542724609375, 0.0170745849609375, 0.0216064453125, 0.0261383056640625, 0.030670166015625, 0.0352020263671875, 0.03973388671875, 0.0442657470703125, 0.048797607421875, 0.0533294677734375, 0.057861328125, 0.0623931884765625, 0.066925048828125, 0.0714569091796875, 0.07598876953125, 0.0805206298828125, 0.085052490234375, 0.0895843505859375, 0.0941162109375, 0.0986480712890625, 0.103179931640625, 0.1077117919921875, 0.11224365234375, 0.1167755126953125, 0.121307373046875, 0.1258392333984375, 0.13037109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 1.0, 9.0, 8.0, 8.0, 21.0, 28.0, 37.0, 39.0, 41.0, 96.0, 122.0, 142.0, 204.0, 342.0, 439.0, 603.0, 816.0, 1272.0, 1990.0, 3100.0, 5097.0, 9106.0, 17931.0, 45952.0, 306173.0, 550969.0, 57468.0, 20677.0, 10226.0, 5548.0, 3387.0, 2113.0, 1370.0, 933.0, 653.0, 446.0, 341.0, 240.0, 172.0, 104.0, 91.0, 65.0, 55.0, 43.0, 26.0, 16.0, 10.0, 3.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2364501953125, -0.2290821075439453, -0.22171401977539062, -0.21434593200683594, -0.20697784423828125, -0.19960975646972656, -0.19224166870117188, -0.1848735809326172, -0.1775054931640625, -0.1701374053955078, -0.16276931762695312, -0.15540122985839844, -0.14803314208984375, -0.14066505432128906, -0.13329696655273438, -0.1259288787841797, -0.118560791015625, -0.11119270324707031, -0.10382461547851562, -0.09645652770996094, -0.08908843994140625, -0.08172035217285156, -0.07435226440429688, -0.06698417663574219, -0.0596160888671875, -0.05224800109863281, -0.044879913330078125, -0.03751182556152344, -0.03014373779296875, -0.022775650024414062, -0.015407562255859375, -0.008039474487304688, -0.00067138671875, 0.0066967010498046875, 0.014064788818359375, 0.021432876586914062, 0.02880096435546875, 0.03616905212402344, 0.043537139892578125, 0.05090522766113281, 0.0582733154296875, 0.06564140319824219, 0.07300949096679688, 0.08037757873535156, 0.08774566650390625, 0.09511375427246094, 0.10248184204101562, 0.10984992980957031, 0.117218017578125, 0.12458610534667969, 0.13195419311523438, 0.13932228088378906, 0.14669036865234375, 0.15405845642089844, 0.16142654418945312, 0.1687946319580078, 0.1761627197265625, 0.1835308074951172, 0.19089889526367188, 0.19826698303222656, 0.20563507080078125, 0.21300315856933594, 0.22037124633789062, 0.2277393341064453, 0.235107421875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 11.0, 10.0, 7.0, 10.0, 12.0, 13.0, 14.0, 11.0, 30.0, 20.0, 28.0, 29.0, 25.0, 31.0, 44.0, 35.0, 39.0, 37.0, 39.0, 37.0, 33.0, 42.0, 43.0, 32.0, 45.0, 46.0, 35.0, 32.0, 27.0, 15.0, 22.0, 12.0, 19.0, 12.0, 16.0, 16.0, 3.0, 10.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.08245849609375, -0.07993698120117188, -0.07741546630859375, -0.07489395141601562, -0.0723724365234375, -0.06985092163085938, -0.06732940673828125, -0.06480789184570312, -0.062286376953125, -0.059764862060546875, -0.05724334716796875, -0.054721832275390625, -0.0522003173828125, -0.049678802490234375, -0.04715728759765625, -0.044635772705078125, -0.0421142578125, -0.039592742919921875, -0.03707122802734375, -0.034549713134765625, -0.0320281982421875, -0.029506683349609375, -0.02698516845703125, -0.024463653564453125, -0.021942138671875, -0.019420623779296875, -0.01689910888671875, -0.014377593994140625, -0.0118560791015625, -0.009334564208984375, -0.00681304931640625, -0.004291534423828125, -0.00177001953125, 0.000751495361328125, 0.00327301025390625, 0.005794525146484375, 0.0083160400390625, 0.010837554931640625, 0.01335906982421875, 0.015880584716796875, 0.018402099609375, 0.020923614501953125, 0.02344512939453125, 0.025966644287109375, 0.0284881591796875, 0.031009674072265625, 0.03353118896484375, 0.036052703857421875, 0.03857421875, 0.041095733642578125, 0.04361724853515625, 0.046138763427734375, 0.0486602783203125, 0.051181793212890625, 0.05370330810546875, 0.056224822998046875, 0.058746337890625, 0.061267852783203125, 0.06378936767578125, 0.06631088256835938, 0.0688323974609375, 0.07135391235351562, 0.07387542724609375, 0.07639694213867188, 0.07891845703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 12.0, 5.0, 15.0, 11.0, 18.0, 35.0, 30.0, 40.0, 56.0, 56.0, 81.0, 128.0, 152.0, 172.0, 294.0, 406.0, 584.0, 944.0, 1399.0, 2244.0, 3863.0, 7151.0, 15765.0, 46931.0, 411690.0, 473630.0, 48510.0, 16250.0, 7270.0, 3975.0, 2284.0, 1492.0, 900.0, 664.0, 388.0, 284.0, 219.0, 161.0, 98.0, 76.0, 71.0, 58.0, 33.0, 25.0, 20.0, 15.0, 15.0, 10.0, 4.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.0184783935546875, -0.017882585525512695, -0.01728677749633789, -0.016690969467163086, -0.01609516143798828, -0.015499353408813477, -0.014903545379638672, -0.014307737350463867, -0.013711929321289062, -0.013116121292114258, -0.012520313262939453, -0.011924505233764648, -0.011328697204589844, -0.010732889175415039, -0.010137081146240234, -0.00954127311706543, -0.008945465087890625, -0.00834965705871582, -0.007753849029541016, -0.007158041000366211, -0.006562232971191406, -0.0059664249420166016, -0.005370616912841797, -0.004774808883666992, -0.0041790008544921875, -0.003583192825317383, -0.002987384796142578, -0.0023915767669677734, -0.0017957687377929688, -0.001199960708618164, -0.0006041526794433594, -8.344650268554688e-06, 0.00058746337890625, 0.0011832714080810547, 0.0017790794372558594, 0.002374887466430664, 0.0029706954956054688, 0.0035665035247802734, 0.004162311553955078, 0.004758119583129883, 0.0053539276123046875, 0.005949735641479492, 0.006545543670654297, 0.0071413516998291016, 0.007737159729003906, 0.008332967758178711, 0.008928775787353516, 0.00952458381652832, 0.010120391845703125, 0.01071619987487793, 0.011312007904052734, 0.011907815933227539, 0.012503623962402344, 0.013099431991577148, 0.013695240020751953, 0.014291048049926758, 0.014886856079101562, 0.015482664108276367, 0.016078472137451172, 0.016674280166625977, 0.01727008819580078, 0.017865896224975586, 0.01846170425415039, 0.019057512283325195, 0.0196533203125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 5.0, 7.0, 9.0, 15.0, 18.0, 12.0, 12.0, 13.0, 35.0, 86.0, 55.0, 53.0, 64.0, 65.0, 73.0, 138.0, 56.0, 47.0, 44.0, 38.0, 49.0, 19.0, 13.0, 13.0, 7.0, 9.0, 6.0, 6.0, 6.0, 1.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.8971040844917297e-06, -1.8272548913955688e-06, -1.757405698299408e-06, -1.687556505203247e-06, -1.6177073121070862e-06, -1.5478581190109253e-06, -1.4780089259147644e-06, -1.4081597328186035e-06, -1.3383105397224426e-06, -1.2684613466262817e-06, -1.1986121535301208e-06, -1.12876296043396e-06, -1.058913767337799e-06, -9.890645742416382e-07, -9.192153811454773e-07, -8.493661880493164e-07, -7.795169949531555e-07, -7.096678018569946e-07, -6.398186087608337e-07, -5.699694156646729e-07, -5.00120222568512e-07, -4.302710294723511e-07, -3.604218363761902e-07, -2.905726432800293e-07, -2.207234501838684e-07, -1.5087425708770752e-07, -8.102506399154663e-08, -1.1175870895385742e-08, 5.8673322200775146e-08, 1.2852251529693604e-07, 1.9837170839309692e-07, 2.682209014892578e-07, 3.380700945854187e-07, 4.079192876815796e-07, 4.777684807777405e-07, 5.476176738739014e-07, 6.174668669700623e-07, 6.873160600662231e-07, 7.57165253162384e-07, 8.270144462585449e-07, 8.968636393547058e-07, 9.667128324508667e-07, 1.0365620255470276e-06, 1.1064112186431885e-06, 1.1762604117393494e-06, 1.2461096048355103e-06, 1.3159587979316711e-06, 1.385807991027832e-06, 1.455657184123993e-06, 1.5255063772201538e-06, 1.5953555703163147e-06, 1.6652047634124756e-06, 1.7350539565086365e-06, 1.8049031496047974e-06, 1.8747523427009583e-06, 1.944601535797119e-06, 2.01445072889328e-06, 2.084299921989441e-06, 2.154149115085602e-06, 2.2239983081817627e-06, 2.2938475012779236e-06, 2.3636966943740845e-06, 2.4335458874702454e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 11.0, 16.0, 26.0, 35.0, 50.0, 80.0, 117.0, 169.0, 246.0, 366.0, 541.0, 861.0, 1430.0, 2436.0, 4170.0, 7692.0, 15507.0, 35306.0, 105479.0, 537098.0, 229614.0, 59384.0, 22996.0, 11024.0, 5690.0, 3181.0, 1852.0, 1100.0, 710.0, 456.0, 299.0, 202.0, 110.0, 84.0, 51.0, 42.0, 31.0, 23.0, 17.0, 16.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019073486328125, -0.018453359603881836, -0.017833232879638672, -0.017213106155395508, -0.016592979431152344, -0.01597285270690918, -0.015352725982666016, -0.014732599258422852, -0.014112472534179688, -0.013492345809936523, -0.01287221908569336, -0.012252092361450195, -0.011631965637207031, -0.011011838912963867, -0.010391712188720703, -0.009771585464477539, -0.009151458740234375, -0.008531332015991211, -0.007911205291748047, -0.007291078567504883, -0.006670951843261719, -0.006050825119018555, -0.005430698394775391, -0.0048105716705322266, -0.0041904449462890625, -0.0035703182220458984, -0.0029501914978027344, -0.0023300647735595703, -0.0017099380493164062, -0.0010898113250732422, -0.0004696846008300781, 0.00015044212341308594, 0.00077056884765625, 0.001390695571899414, 0.002010822296142578, 0.002630949020385742, 0.0032510757446289062, 0.0038712024688720703, 0.004491329193115234, 0.0051114559173583984, 0.0057315826416015625, 0.0063517093658447266, 0.006971836090087891, 0.007591962814331055, 0.008212089538574219, 0.008832216262817383, 0.009452342987060547, 0.010072469711303711, 0.010692596435546875, 0.011312723159790039, 0.011932849884033203, 0.012552976608276367, 0.013173103332519531, 0.013793230056762695, 0.01441335678100586, 0.015033483505249023, 0.015653610229492188, 0.01627373695373535, 0.016893863677978516, 0.01751399040222168, 0.018134117126464844, 0.018754243850708008, 0.019374370574951172, 0.019994497299194336, 0.0206146240234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 10.0, 7.0, 10.0, 12.0, 16.0, 37.0, 36.0, 93.0, 150.0, 211.0, 152.0, 87.0, 40.0, 27.0, 21.0, 17.0, 15.0, 5.0, 7.0, 6.0, 5.0, 4.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0110931396484375, -0.010818719863891602, -0.010544300079345703, -0.010269880294799805, -0.009995460510253906, -0.009721040725708008, -0.00944662094116211, -0.009172201156616211, -0.008897781372070312, -0.008623361587524414, -0.008348941802978516, -0.008074522018432617, -0.007800102233886719, -0.00752568244934082, -0.007251262664794922, -0.0069768428802490234, -0.006702423095703125, -0.0064280033111572266, -0.006153583526611328, -0.00587916374206543, -0.005604743957519531, -0.005330324172973633, -0.005055904388427734, -0.004781484603881836, -0.0045070648193359375, -0.004232645034790039, -0.003958225250244141, -0.003683805465698242, -0.0034093856811523438, -0.0031349658966064453, -0.002860546112060547, -0.0025861263275146484, -0.00231170654296875, -0.0020372867584228516, -0.0017628669738769531, -0.0014884471893310547, -0.0012140274047851562, -0.0009396076202392578, -0.0006651878356933594, -0.00039076805114746094, -0.0001163482666015625, 0.00015807151794433594, 0.0004324913024902344, 0.0007069110870361328, 0.0009813308715820312, 0.0012557506561279297, 0.0015301704406738281, 0.0018045902252197266, 0.002079010009765625, 0.0023534297943115234, 0.002627849578857422, 0.0029022693634033203, 0.0031766891479492188, 0.003451108932495117, 0.0037255287170410156, 0.003999948501586914, 0.0042743682861328125, 0.004548788070678711, 0.004823207855224609, 0.005097627639770508, 0.005372047424316406, 0.005646467208862305, 0.005920886993408203, 0.0061953067779541016, 0.0064697265625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 9.0, 11.0, 12.0, 23.0, 17.0, 32.0, 42.0, 50.0, 67.0, 85.0, 112.0, 121.0, 92.0, 79.0, 54.0, 48.0, 29.0, 25.0, 14.0, 18.0, 8.0, 7.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20207804441452026, -0.19492216408252716, -0.18776626884937286, -0.18061038851737976, -0.17345449328422546, -0.16629861295223236, -0.15914273262023926, -0.15198683738708496, -0.14483095705509186, -0.13767507672309875, -0.13051918148994446, -0.12336330115795135, -0.11620741337537766, -0.10905152559280396, -0.10189563781023026, -0.09473975002765656, -0.08758386224508286, -0.08042797446250916, -0.07327208667993546, -0.06611619889736176, -0.05896031856536865, -0.05180443078279495, -0.04464854300022125, -0.03749265894293785, -0.03033677116036415, -0.0231808852404356, -0.01602499932050705, -0.00886911153793335, -0.0017132256180047989, 0.005442660301923752, 0.012598548084497452, 0.019754432141780853, 0.026910319924354553, 0.03406620770692825, 0.041222091764211655, 0.048377979546785355, 0.055533863604068756, 0.06268975138664246, 0.06984563916921616, 0.07700152695178986, 0.08415740728378296, 0.09131329506635666, 0.09846918284893036, 0.10562506318092346, 0.11278095096349716, 0.11993683874607086, 0.12709271907806396, 0.13424861431121826, 0.14140450954437256, 0.14856038987636566, 0.15571628510951996, 0.16287216544151306, 0.17002806067466736, 0.17718394100666046, 0.18433982133865356, 0.19149571657180786, 0.19865159690380096, 0.20580747723579407, 0.21296337246894836, 0.22011925280094147, 0.22727514803409576, 0.23443102836608887, 0.24158692359924316, 0.24874280393123627, 0.25589868426322937]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 8.0, 5.0, 10.0, 13.0, 19.0, 14.0, 23.0, 21.0, 27.0, 22.0, 27.0, 31.0, 42.0, 37.0, 39.0, 38.0, 35.0, 38.0, 35.0, 33.0, 40.0, 45.0, 31.0, 36.0, 33.0, 34.0, 33.0, 22.0, 31.0, 27.0, 22.0, 20.0, 14.0, 10.0, 20.0, 5.0, 7.0, 9.0, 8.0, 3.0, 0.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1353679746389389, -0.13127759099006653, -0.12718720734119415, -0.12309681624174118, -0.1190064325928688, -0.11491604894399643, -0.11082565784454346, -0.10673527419567108, -0.1026448905467987, -0.09855450689792633, -0.09446412324905396, -0.09037373214960098, -0.08628334850072861, -0.08219296485185623, -0.07810257375240326, -0.07401219010353088, -0.06992180645465851, -0.06583142280578613, -0.06174103543162346, -0.057650648057460785, -0.05356026440858841, -0.049469880759716034, -0.04537949338555336, -0.041289106011390686, -0.03719872236251831, -0.033108338713645935, -0.02901795133948326, -0.024927565827965736, -0.02083718031644821, -0.016746794804930687, -0.012656409293413162, -0.008566023781895638, -0.004475638270378113, -0.0003852527588605881, 0.0037051327526569366, 0.007795518264174461, 0.011885903775691986, 0.01597628928720951, 0.020066674798727036, 0.02415706031024456, 0.028247445821762085, 0.03233782947063446, 0.036428216844797134, 0.04051860421895981, 0.044608987867832184, 0.04869937151670456, 0.05278975889086723, 0.05688014626502991, 0.06097052991390228, 0.06506091356277466, 0.06915129721164703, 0.0732416883111, 0.07733207195997238, 0.08142245560884476, 0.08551284670829773, 0.0896032303571701, 0.09369361400604248, 0.09778399765491486, 0.10187438130378723, 0.1059647724032402, 0.11005515605211258, 0.11414553970098495, 0.11823593080043793, 0.1223263144493103, 0.12641669809818268]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 14.0, 17.0, 28.0, 42.0, 78.0, 119.0, 169.0, 262.0, 384.0, 666.0, 1033.0, 1735.0, 2754.0, 4624.0, 7969.0, 13626.0, 24331.0, 44029.0, 82154.0, 164024.0, 295303.0, 193152.0, 95509.0, 50754.0, 27756.0, 15490.0, 9053.0, 5412.0, 3048.0, 1943.0, 1188.0, 760.0, 427.0, 274.0, 165.0, 100.0, 67.0, 32.0, 21.0, 14.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.33154296875, -0.3219642639160156, -0.31238555908203125, -0.3028068542480469, -0.2932281494140625, -0.2836494445800781, -0.27407073974609375, -0.2644920349121094, -0.254913330078125, -0.24533462524414062, -0.23575592041015625, -0.22617721557617188, -0.2165985107421875, -0.20701980590820312, -0.19744110107421875, -0.18786239624023438, -0.17828369140625, -0.16870498657226562, -0.15912628173828125, -0.14954757690429688, -0.1399688720703125, -0.13039016723632812, -0.12081146240234375, -0.11123275756835938, -0.101654052734375, -0.09207534790039062, -0.08249664306640625, -0.07291793823242188, -0.0633392333984375, -0.053760528564453125, -0.04418182373046875, -0.034603118896484375, -0.0250244140625, -0.015445709228515625, -0.00586700439453125, 0.003711700439453125, 0.0132904052734375, 0.022869110107421875, 0.03244781494140625, 0.042026519775390625, 0.051605224609375, 0.061183929443359375, 0.07076263427734375, 0.08034133911132812, 0.0899200439453125, 0.09949874877929688, 0.10907745361328125, 0.11865615844726562, 0.12823486328125, 0.13781356811523438, 0.14739227294921875, 0.15697097778320312, 0.1665496826171875, 0.17612838745117188, 0.18570709228515625, 0.19528579711914062, 0.204864501953125, 0.21444320678710938, 0.22402191162109375, 0.23360061645507812, 0.2431793212890625, 0.2527580261230469, 0.26233673095703125, 0.2719154357910156, 0.281494140625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 11.0, 4.0, 7.0, 6.0, 15.0, 14.0, 11.0, 16.0, 18.0, 22.0, 20.0, 35.0, 31.0, 36.0, 25.0, 32.0, 43.0, 27.0, 40.0, 39.0, 31.0, 32.0, 27.0, 39.0, 42.0, 36.0, 32.0, 34.0, 26.0, 36.0, 23.0, 24.0, 24.0, 21.0, 13.0, 19.0, 11.0, 10.0, 12.0, 8.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.109375, -0.10590553283691406, -0.10243606567382812, -0.09896659851074219, -0.09549713134765625, -0.09202766418457031, -0.08855819702148438, -0.08508872985839844, -0.0816192626953125, -0.07814979553222656, -0.07468032836914062, -0.07121086120605469, -0.06774139404296875, -0.06427192687988281, -0.060802459716796875, -0.05733299255371094, -0.053863525390625, -0.05039405822753906, -0.046924591064453125, -0.04345512390136719, -0.03998565673828125, -0.03651618957519531, -0.033046722412109375, -0.029577255249023438, -0.0261077880859375, -0.022638320922851562, -0.019168853759765625, -0.015699386596679688, -0.01222991943359375, -0.008760452270507812, -0.005290985107421875, -0.0018215179443359375, 0.00164794921875, 0.0051174163818359375, 0.008586883544921875, 0.012056350708007812, 0.01552581787109375, 0.018995285034179688, 0.022464752197265625, 0.025934219360351562, 0.0294036865234375, 0.03287315368652344, 0.036342620849609375, 0.03981208801269531, 0.04328155517578125, 0.04675102233886719, 0.050220489501953125, 0.05368995666503906, 0.057159423828125, 0.06062889099121094, 0.06409835815429688, 0.06756782531738281, 0.07103729248046875, 0.07450675964355469, 0.07797622680664062, 0.08144569396972656, 0.0849151611328125, 0.08838462829589844, 0.09185409545898438, 0.09532356262207031, 0.09879302978515625, 0.10226249694824219, 0.10573196411132812, 0.10920143127441406, 0.1126708984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 11.0, 16.0, 21.0, 26.0, 38.0, 45.0, 67.0, 88.0, 148.0, 219.0, 318.0, 492.0, 699.0, 1039.0, 1608.0, 2307.0, 3678.0, 5750.0, 9067.0, 14004.0, 22630.0, 37533.0, 63445.0, 112059.0, 214750.0, 243755.0, 130290.0, 72185.0, 42594.0, 25646.0, 15637.0, 9915.0, 6345.0, 4085.0, 2635.0, 1809.0, 1173.0, 800.0, 567.0, 340.0, 231.0, 156.0, 98.0, 71.0, 37.0, 42.0, 22.0, 23.0, 12.0, 9.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.26123046875, -0.2530975341796875, -0.244964599609375, -0.2368316650390625, -0.22869873046875, -0.2205657958984375, -0.212432861328125, -0.2042999267578125, -0.1961669921875, -0.1880340576171875, -0.179901123046875, -0.1717681884765625, -0.16363525390625, -0.1555023193359375, -0.147369384765625, -0.1392364501953125, -0.131103515625, -0.1229705810546875, -0.114837646484375, -0.1067047119140625, -0.09857177734375, -0.0904388427734375, -0.082305908203125, -0.0741729736328125, -0.0660400390625, -0.0579071044921875, -0.049774169921875, -0.0416412353515625, -0.03350830078125, -0.0253753662109375, -0.017242431640625, -0.0091094970703125, -0.0009765625, 0.0071563720703125, 0.015289306640625, 0.0234222412109375, 0.03155517578125, 0.0396881103515625, 0.047821044921875, 0.0559539794921875, 0.0640869140625, 0.0722198486328125, 0.080352783203125, 0.0884857177734375, 0.09661865234375, 0.1047515869140625, 0.112884521484375, 0.1210174560546875, 0.129150390625, 0.1372833251953125, 0.145416259765625, 0.1535491943359375, 0.16168212890625, 0.1698150634765625, 0.177947998046875, 0.1860809326171875, 0.1942138671875, 0.2023468017578125, 0.210479736328125, 0.2186126708984375, 0.22674560546875, 0.2348785400390625, 0.243011474609375, 0.2511444091796875, 0.25927734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 5.0, 9.0, 9.0, 14.0, 18.0, 11.0, 13.0, 20.0, 19.0, 20.0, 21.0, 32.0, 38.0, 31.0, 46.0, 44.0, 36.0, 21.0, 33.0, 35.0, 37.0, 29.0, 36.0, 51.0, 30.0, 38.0, 31.0, 21.0, 29.0, 23.0, 26.0, 17.0, 21.0, 23.0, 19.0, 17.0, 8.0, 8.0, 4.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0679931640625, -0.06567573547363281, -0.06335830688476562, -0.06104087829589844, -0.05872344970703125, -0.05640602111816406, -0.054088592529296875, -0.05177116394042969, -0.0494537353515625, -0.04713630676269531, -0.044818878173828125, -0.04250144958496094, -0.04018402099609375, -0.03786659240722656, -0.035549163818359375, -0.03323173522949219, -0.030914306640625, -0.028596878051757812, -0.026279449462890625, -0.023962020874023438, -0.02164459228515625, -0.019327163696289062, -0.017009735107421875, -0.014692306518554688, -0.0123748779296875, -0.010057449340820312, -0.007740020751953125, -0.0054225921630859375, -0.00310516357421875, -0.0007877349853515625, 0.001529693603515625, 0.0038471221923828125, 0.00616455078125, 0.008481979370117188, 0.010799407958984375, 0.013116836547851562, 0.01543426513671875, 0.017751693725585938, 0.020069122314453125, 0.022386550903320312, 0.0247039794921875, 0.027021408081054688, 0.029338836669921875, 0.03165626525878906, 0.03397369384765625, 0.03629112243652344, 0.038608551025390625, 0.04092597961425781, 0.043243408203125, 0.04556083679199219, 0.047878265380859375, 0.05019569396972656, 0.05251312255859375, 0.05483055114746094, 0.057147979736328125, 0.05946540832519531, 0.0617828369140625, 0.06410026550292969, 0.06641769409179688, 0.06873512268066406, 0.07105255126953125, 0.07336997985839844, 0.07568740844726562, 0.07800483703613281, 0.080322265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 11.0, 14.0, 19.0, 34.0, 41.0, 47.0, 83.0, 111.0, 152.0, 235.0, 322.0, 477.0, 711.0, 959.0, 1413.0, 1958.0, 2948.0, 4428.0, 6519.0, 10007.0, 16032.0, 28993.0, 66419.0, 613081.0, 182621.0, 47646.0, 23287.0, 13550.0, 8522.0, 5593.0, 3764.0, 2680.0, 1770.0, 1242.0, 847.0, 586.0, 425.0, 282.0, 217.0, 144.0, 111.0, 68.0, 53.0, 49.0, 24.0, 15.0, 11.0, 10.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.013031005859375, -0.01260828971862793, -0.01218557357788086, -0.011762857437133789, -0.011340141296386719, -0.010917425155639648, -0.010494709014892578, -0.010071992874145508, -0.009649276733398438, -0.009226560592651367, -0.008803844451904297, -0.008381128311157227, -0.007958412170410156, -0.007535696029663086, -0.007112979888916016, -0.006690263748168945, -0.006267547607421875, -0.005844831466674805, -0.005422115325927734, -0.004999399185180664, -0.004576683044433594, -0.0041539669036865234, -0.003731250762939453, -0.003308534622192383, -0.0028858184814453125, -0.002463102340698242, -0.002040386199951172, -0.0016176700592041016, -0.0011949539184570312, -0.0007722377777099609, -0.0003495216369628906, 7.319450378417969e-05, 0.00049591064453125, 0.0009186267852783203, 0.0013413429260253906, 0.001764059066772461, 0.0021867752075195312, 0.0026094913482666016, 0.003032207489013672, 0.003454923629760742, 0.0038776397705078125, 0.004300355911254883, 0.004723072052001953, 0.0051457881927490234, 0.005568504333496094, 0.005991220474243164, 0.006413936614990234, 0.006836652755737305, 0.007259368896484375, 0.007682085037231445, 0.008104801177978516, 0.008527517318725586, 0.008950233459472656, 0.009372949600219727, 0.009795665740966797, 0.010218381881713867, 0.010641098022460938, 0.011063814163208008, 0.011486530303955078, 0.011909246444702148, 0.012331962585449219, 0.012754678726196289, 0.01317739486694336, 0.01360011100769043, 0.0140228271484375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 13.0, 9.0, 11.0, 15.0, 15.0, 15.0, 82.0, 50.0, 54.0, 80.0, 102.0, 198.0, 75.0, 47.0, 41.0, 43.0, 22.0, 31.0, 15.0, 10.0, 8.0, 7.0, 3.0, 16.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.314336597919464e-06, -2.2444874048233032e-06, -2.1746382117271423e-06, -2.1047890186309814e-06, -2.0349398255348206e-06, -1.9650906324386597e-06, -1.8952414393424988e-06, -1.8253922462463379e-06, -1.755543053150177e-06, -1.6856938600540161e-06, -1.6158446669578552e-06, -1.5459954738616943e-06, -1.4761462807655334e-06, -1.4062970876693726e-06, -1.3364478945732117e-06, -1.2665987014770508e-06, -1.1967495083808899e-06, -1.126900315284729e-06, -1.0570511221885681e-06, -9.872019290924072e-07, -9.173527359962463e-07, -8.475035429000854e-07, -7.776543498039246e-07, -7.078051567077637e-07, -6.379559636116028e-07, -5.681067705154419e-07, -4.98257577419281e-07, -4.284083843231201e-07, -3.5855919122695923e-07, -2.8870999813079834e-07, -2.1886080503463745e-07, -1.4901161193847656e-07, -7.916241884231567e-08, -9.313225746154785e-09, 6.05359673500061e-08, 1.30385160446167e-07, 2.0023435354232788e-07, 2.7008354663848877e-07, 3.3993273973464966e-07, 4.0978193283081055e-07, 4.796311259269714e-07, 5.494803190231323e-07, 6.193295121192932e-07, 6.891787052154541e-07, 7.59027898311615e-07, 8.288770914077759e-07, 8.987262845039368e-07, 9.685754776000977e-07, 1.0384246706962585e-06, 1.1082738637924194e-06, 1.1781230568885803e-06, 1.2479722499847412e-06, 1.317821443080902e-06, 1.387670636177063e-06, 1.4575198292732239e-06, 1.5273690223693848e-06, 1.5972182154655457e-06, 1.6670674085617065e-06, 1.7369166016578674e-06, 1.8067657947540283e-06, 1.8766149878501892e-06, 1.94646418094635e-06, 2.016313374042511e-06, 2.086162567138672e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 6.0, 10.0, 6.0, 8.0, 15.0, 17.0, 36.0, 28.0, 64.0, 94.0, 112.0, 167.0, 171.0, 333.0, 485.0, 652.0, 992.0, 1462.0, 2236.0, 3562.0, 5931.0, 10158.0, 19535.0, 45413.0, 229873.0, 619254.0, 56497.0, 22348.0, 11312.0, 6450.0, 3929.0, 2418.0, 1610.0, 1013.0, 716.0, 455.0, 348.0, 236.0, 167.0, 108.0, 61.0, 66.0, 50.0, 45.0, 29.0, 23.0, 14.0, 13.0, 7.0, 11.0, 0.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01445770263671875, -0.013943076133728027, -0.013428449630737305, -0.012913823127746582, -0.01239919662475586, -0.011884570121765137, -0.011369943618774414, -0.010855317115783691, -0.010340690612792969, -0.009826064109802246, -0.009311437606811523, -0.0087968111038208, -0.008282184600830078, -0.0077675580978393555, -0.007252931594848633, -0.00673830509185791, -0.0062236785888671875, -0.005709052085876465, -0.005194425582885742, -0.0046797990798950195, -0.004165172576904297, -0.0036505460739135742, -0.0031359195709228516, -0.002621293067932129, -0.0021066665649414062, -0.0015920400619506836, -0.001077413558959961, -0.0005627870559692383, -4.8160552978515625e-05, 0.00046646595001220703, 0.0009810924530029297, 0.0014957189559936523, 0.002010345458984375, 0.0025249719619750977, 0.0030395984649658203, 0.003554224967956543, 0.004068851470947266, 0.004583477973937988, 0.005098104476928711, 0.005612730979919434, 0.006127357482910156, 0.006641983985900879, 0.0071566104888916016, 0.007671236991882324, 0.008185863494873047, 0.00870048999786377, 0.009215116500854492, 0.009729743003845215, 0.010244369506835938, 0.01075899600982666, 0.011273622512817383, 0.011788249015808105, 0.012302875518798828, 0.01281750202178955, 0.013332128524780273, 0.013846755027770996, 0.014361381530761719, 0.014876008033752441, 0.015390634536743164, 0.015905261039733887, 0.01641988754272461, 0.016934514045715332, 0.017449140548706055, 0.017963767051696777, 0.0184783935546875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 2.0, 7.0, 3.0, 6.0, 9.0, 13.0, 9.0, 11.0, 20.0, 11.0, 26.0, 29.0, 43.0, 84.0, 279.0, 116.0, 79.0, 47.0, 42.0, 24.0, 21.0, 14.0, 19.0, 10.0, 10.0, 9.0, 4.0, 6.0, 2.0, 1.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0038166046142578125, -0.003710329532623291, -0.0036040544509887695, -0.003497779369354248, -0.0033915042877197266, -0.003285229206085205, -0.0031789541244506836, -0.003072679042816162, -0.0029664039611816406, -0.002860128879547119, -0.0027538537979125977, -0.002647578716278076, -0.0025413036346435547, -0.002435028553009033, -0.0023287534713745117, -0.0022224783897399902, -0.0021162033081054688, -0.0020099282264709473, -0.0019036531448364258, -0.0017973780632019043, -0.0016911029815673828, -0.0015848278999328613, -0.0014785528182983398, -0.0013722777366638184, -0.0012660026550292969, -0.0011597275733947754, -0.001053452491760254, -0.0009471774101257324, -0.0008409023284912109, -0.0007346272468566895, -0.000628352165222168, -0.0005220770835876465, -0.000415802001953125, -0.0003095269203186035, -0.00020325183868408203, -9.697675704956055e-05, 9.298324584960938e-06, 0.00011557340621948242, 0.0002218484878540039, 0.0003281235694885254, 0.0004343986511230469, 0.0005406737327575684, 0.0006469488143920898, 0.0007532238960266113, 0.0008594989776611328, 0.0009657740592956543, 0.0010720491409301758, 0.0011783242225646973, 0.0012845993041992188, 0.0013908743858337402, 0.0014971494674682617, 0.0016034245491027832, 0.0017096996307373047, 0.0018159747123718262, 0.0019222497940063477, 0.002028524875640869, 0.0021347999572753906, 0.002241075038909912, 0.0023473501205444336, 0.002453625202178955, 0.0025599002838134766, 0.002666175365447998, 0.0027724504470825195, 0.002878725528717041, 0.0029850006103515625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 12.0, 9.0, 11.0, 16.0, 21.0, 33.0, 35.0, 72.0, 84.0, 103.0, 109.0, 122.0, 86.0, 61.0, 51.0, 37.0, 29.0, 24.0, 20.0, 13.0, 12.0, 6.0, 13.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17265063524246216, -0.1657581925392151, -0.1588657647371292, -0.15197333693504333, -0.14508089423179626, -0.1381884515285492, -0.13129602372646332, -0.12440358847379684, -0.11751115322113037, -0.1106187179684639, -0.10372628271579742, -0.09683384746313095, -0.08994141221046448, -0.083048976957798, -0.07615654170513153, -0.06926410645246506, -0.062371671199798584, -0.05547923594713211, -0.04858680069446564, -0.041694365441799164, -0.03480193018913269, -0.027909494936466217, -0.021017059683799744, -0.01412462443113327, -0.007232189178466797, -0.0003397539258003235, 0.00655268132686615, 0.013445116579532623, 0.020337551832199097, 0.02722998708486557, 0.03412242233753204, 0.04101485759019852, 0.04790729284286499, 0.054799728095531464, 0.06169216334819794, 0.06858459860086441, 0.07547703385353088, 0.08236946910619736, 0.08926190435886383, 0.0961543396115303, 0.10304677486419678, 0.10993921011686325, 0.11683164536952972, 0.1237240806221962, 0.13061651587486267, 0.13750895857810974, 0.14440138638019562, 0.1512938141822815, 0.15818625688552856, 0.16507869958877563, 0.1719711273908615, 0.1788635551929474, 0.18575599789619446, 0.19264844059944153, 0.1995408684015274, 0.20643329620361328, 0.21332573890686035, 0.22021818161010742, 0.2271106094121933, 0.23400303721427917, 0.24089547991752625, 0.24778792262077332, 0.254680335521698, 0.26157277822494507, 0.26846522092819214]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 9.0, 5.0, 14.0, 13.0, 12.0, 17.0, 24.0, 26.0, 19.0, 22.0, 37.0, 25.0, 35.0, 45.0, 40.0, 35.0, 48.0, 42.0, 41.0, 36.0, 46.0, 40.0, 38.0, 36.0, 32.0, 26.0, 30.0, 28.0, 28.0, 32.0, 19.0, 14.0, 13.0, 11.0, 17.0, 11.0, 10.0, 9.0, 2.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.13561442494392395, -0.13153374195098877, -0.1274530589580536, -0.12337237596511841, -0.11929168552160263, -0.11521100252866745, -0.11113031953573227, -0.10704963654279709, -0.10296894609928131, -0.09888826310634613, -0.09480758011341095, -0.09072689712047577, -0.08664620667695999, -0.08256552368402481, -0.07848484069108963, -0.07440415769815445, -0.07032347470521927, -0.06624279171228409, -0.06216210499405861, -0.05808142200112343, -0.05400073528289795, -0.04992005228996277, -0.04583936929702759, -0.04175868630409241, -0.03767799958586693, -0.03359731659293175, -0.02951662987470627, -0.025435946881771088, -0.021355262026190758, -0.017274577170610428, -0.013193894177675247, -0.009113209322094917, -0.005032524466514587, -0.0009518400765955448, 0.0031288443133234978, 0.007209528237581253, 0.011290213093161583, 0.015370897948741913, 0.019451580941677094, 0.023532265797257423, 0.027612950652837753, 0.031693633645772934, 0.03577432036399841, 0.039855003356933594, 0.043935686349868774, 0.048016373068094254, 0.052097056061029434, 0.05617774277925491, 0.060258425772190094, 0.06433910876512527, 0.06841979175806046, 0.07250048220157623, 0.07658116519451141, 0.0806618481874466, 0.08474253118038177, 0.08882321417331696, 0.09290389716625214, 0.09698458015918732, 0.1010652631521225, 0.10514594614505768, 0.10922663658857346, 0.11330731958150864, 0.11738800257444382, 0.121468685567379, 0.12554937601089478]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 14.0, 18.0, 27.0, 38.0, 49.0, 79.0, 116.0, 169.0, 280.0, 483.0, 766.0, 1196.0, 1912.0, 3087.0, 4934.0, 8453.0, 14211.0, 24927.0, 44613.0, 83326.0, 167692.0, 457502.0, 1750466.0, 1079334.0, 275135.0, 122749.0, 63905.0, 35755.0, 20613.0, 12227.0, 7358.0, 4588.0, 3035.0, 1832.0, 1166.0, 716.0, 500.0, 352.0, 200.0, 147.0, 93.0, 62.0, 42.0, 37.0, 28.0, 17.0, 10.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1734619140625, -0.16743850708007812, -0.16141510009765625, -0.15539169311523438, -0.1493682861328125, -0.14334487915039062, -0.13732147216796875, -0.13129806518554688, -0.125274658203125, -0.11925125122070312, -0.11322784423828125, -0.10720443725585938, -0.1011810302734375, -0.09515762329101562, -0.08913421630859375, -0.08311080932617188, -0.07708740234375, -0.07106399536132812, -0.06504058837890625, -0.059017181396484375, -0.0529937744140625, -0.046970367431640625, -0.04094696044921875, -0.034923553466796875, -0.028900146484375, -0.022876739501953125, -0.01685333251953125, -0.010829925537109375, -0.0048065185546875, 0.001216888427734375, 0.00724029541015625, 0.013263702392578125, 0.019287109375, 0.025310516357421875, 0.03133392333984375, 0.037357330322265625, 0.0433807373046875, 0.049404144287109375, 0.05542755126953125, 0.061450958251953125, 0.067474365234375, 0.07349777221679688, 0.07952117919921875, 0.08554458618164062, 0.0915679931640625, 0.09759140014648438, 0.10361480712890625, 0.10963821411132812, 0.11566162109375, 0.12168502807617188, 0.12770843505859375, 0.13373184204101562, 0.1397552490234375, 0.14577865600585938, 0.15180206298828125, 0.15782546997070312, 0.163848876953125, 0.16987228393554688, 0.17589569091796875, 0.18191909790039062, 0.1879425048828125, 0.19396591186523438, 0.19998931884765625, 0.20601272583007812, 0.2120361328125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 3.0, 8.0, 11.0, 17.0, 21.0, 21.0, 20.0, 23.0, 22.0, 30.0, 31.0, 35.0, 39.0, 37.0, 32.0, 43.0, 38.0, 33.0, 36.0, 47.0, 39.0, 36.0, 29.0, 36.0, 35.0, 28.0, 35.0, 29.0, 23.0, 12.0, 24.0, 16.0, 10.0, 8.0, 13.0, 17.0, 12.0, 3.0, 6.0, 7.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.07501220703125, -0.07277679443359375, -0.0705413818359375, -0.06830596923828125, -0.066070556640625, -0.06383514404296875, -0.0615997314453125, -0.05936431884765625, -0.05712890625, -0.05489349365234375, -0.0526580810546875, -0.05042266845703125, -0.048187255859375, -0.04595184326171875, -0.0437164306640625, -0.04148101806640625, -0.03924560546875, -0.03701019287109375, -0.0347747802734375, -0.03253936767578125, -0.030303955078125, -0.02806854248046875, -0.0258331298828125, -0.02359771728515625, -0.0213623046875, -0.01912689208984375, -0.0168914794921875, -0.01465606689453125, -0.012420654296875, -0.01018524169921875, -0.0079498291015625, -0.00571441650390625, -0.00347900390625, -0.00124359130859375, 0.0009918212890625, 0.00322723388671875, 0.005462646484375, 0.00769805908203125, 0.0099334716796875, 0.01216888427734375, 0.014404296875, 0.01663970947265625, 0.0188751220703125, 0.02111053466796875, 0.023345947265625, 0.02558135986328125, 0.0278167724609375, 0.03005218505859375, 0.03228759765625, 0.03452301025390625, 0.0367584228515625, 0.03899383544921875, 0.041229248046875, 0.04346466064453125, 0.0457000732421875, 0.04793548583984375, 0.0501708984375, 0.05240631103515625, 0.0546417236328125, 0.05687713623046875, 0.059112548828125, 0.06134796142578125, 0.0635833740234375, 0.06581878662109375, 0.06805419921875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 7.0, 9.0, 14.0, 18.0, 27.0, 41.0, 90.0, 144.0, 250.0, 495.0, 850.0, 1538.0, 2686.0, 4892.0, 8575.0, 15042.0, 27070.0, 51212.0, 102900.0, 217443.0, 523898.0, 1520316.0, 1021068.0, 366258.0, 162286.0, 78504.0, 39717.0, 21276.0, 12010.0, 6668.0, 3772.0, 2243.0, 1268.0, 741.0, 402.0, 236.0, 123.0, 68.0, 45.0, 35.0, 22.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.14039039611816406, -0.13551712036132812, -0.1306438446044922, -0.12577056884765625, -0.12089729309082031, -0.11602401733398438, -0.11115074157714844, -0.1062774658203125, -0.10140419006347656, -0.09653091430664062, -0.09165763854980469, -0.08678436279296875, -0.08191108703613281, -0.07703781127929688, -0.07216453552246094, -0.067291259765625, -0.06241798400878906, -0.057544708251953125, -0.05267143249511719, -0.04779815673828125, -0.04292488098144531, -0.038051605224609375, -0.03317832946777344, -0.0283050537109375, -0.023431777954101562, -0.018558502197265625, -0.013685226440429688, -0.00881195068359375, -0.0039386749267578125, 0.000934600830078125, 0.0058078765869140625, 0.01068115234375, 0.015554428100585938, 0.020427703857421875, 0.025300979614257812, 0.03017425537109375, 0.03504753112792969, 0.039920806884765625, 0.04479408264160156, 0.0496673583984375, 0.05454063415527344, 0.059413909912109375, 0.06428718566894531, 0.06916046142578125, 0.07403373718261719, 0.07890701293945312, 0.08378028869628906, 0.088653564453125, 0.09352684020996094, 0.09840011596679688, 0.10327339172363281, 0.10814666748046875, 0.11301994323730469, 0.11789321899414062, 0.12276649475097656, 0.1276397705078125, 0.13251304626464844, 0.13738632202148438, 0.1422595977783203, 0.14713287353515625, 0.1520061492919922, 0.15687942504882812, 0.16175270080566406, 0.1666259765625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 13.0, 13.0, 16.0, 20.0, 30.0, 31.0, 30.0, 50.0, 62.0, 63.0, 88.0, 111.0, 130.0, 151.0, 198.0, 226.0, 251.0, 301.0, 302.0, 321.0, 290.0, 266.0, 199.0, 188.0, 135.0, 114.0, 99.0, 77.0, 52.0, 64.0, 49.0, 41.0, 22.0, 27.0, 11.0, 13.0, 7.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03912353515625, -0.03771162033081055, -0.036299705505371094, -0.03488779067993164, -0.03347587585449219, -0.032063961029052734, -0.03065204620361328, -0.029240131378173828, -0.027828216552734375, -0.026416301727294922, -0.02500438690185547, -0.023592472076416016, -0.022180557250976562, -0.02076864242553711, -0.019356727600097656, -0.017944812774658203, -0.01653289794921875, -0.015120983123779297, -0.013709068298339844, -0.01229715347290039, -0.010885238647460938, -0.009473323822021484, -0.008061408996582031, -0.006649494171142578, -0.005237579345703125, -0.003825664520263672, -0.0024137496948242188, -0.0010018348693847656, 0.0004100799560546875, 0.0018219947814941406, 0.0032339096069335938, 0.004645824432373047, 0.0060577392578125, 0.007469654083251953, 0.008881568908691406, 0.01029348373413086, 0.011705398559570312, 0.013117313385009766, 0.014529228210449219, 0.015941143035888672, 0.017353057861328125, 0.018764972686767578, 0.02017688751220703, 0.021588802337646484, 0.023000717163085938, 0.02441263198852539, 0.025824546813964844, 0.027236461639404297, 0.02864837646484375, 0.030060291290283203, 0.031472206115722656, 0.03288412094116211, 0.03429603576660156, 0.035707950592041016, 0.03711986541748047, 0.03853178024291992, 0.039943695068359375, 0.04135560989379883, 0.04276752471923828, 0.044179439544677734, 0.04559135437011719, 0.04700326919555664, 0.048415184020996094, 0.04982709884643555, 0.051239013671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 10.0, 14.0, 14.0, 26.0, 32.0, 38.0, 44.0, 67.0, 73.0, 96.0, 122.0, 95.0, 88.0, 57.0, 52.0, 39.0, 31.0, 28.0, 16.0, 6.0, 9.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15770062804222107, -0.15328910946846008, -0.1488776057958603, -0.1444661021232605, -0.1400545835494995, -0.13564306497573853, -0.13123156130313873, -0.12682005763053894, -0.12240853905677795, -0.11799702793359756, -0.11358551681041718, -0.10917400568723679, -0.1047624945640564, -0.10035098344087601, -0.09593947231769562, -0.09152796119451523, -0.08711645007133484, -0.08270493894815445, -0.07829342782497406, -0.07388191670179367, -0.06947040557861328, -0.06505889445543289, -0.0606473833322525, -0.05623587220907211, -0.051824361085891724, -0.047412849962711334, -0.043001338839530945, -0.038589827716350555, -0.034178316593170166, -0.029766805469989777, -0.025355294346809387, -0.020943783223628998, -0.016532257199287415, -0.012120746076107025, -0.007709234952926636, -0.0032977238297462463, 0.001113787293434143, 0.0055252984166145325, 0.009936809539794922, 0.014348320662975311, 0.0187598317861557, 0.02317134290933609, 0.02758285403251648, 0.03199436515569687, 0.03640587627887726, 0.04081738740205765, 0.04522889852523804, 0.049640409648418427, 0.054051920771598816, 0.058463431894779205, 0.0628749430179596, 0.06728645414113998, 0.07169796526432037, 0.07610947638750076, 0.08052098751068115, 0.08493249863386154, 0.08934400975704193, 0.09375552088022232, 0.09816703200340271, 0.1025785431265831, 0.10699005424976349, 0.11140156537294388, 0.11581307649612427, 0.12022458761930466, 0.12463609874248505]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 12.0, 10.0, 18.0, 20.0, 21.0, 26.0, 27.0, 20.0, 30.0, 36.0, 32.0, 33.0, 41.0, 41.0, 46.0, 44.0, 34.0, 31.0, 37.0, 34.0, 48.0, 38.0, 31.0, 33.0, 32.0, 21.0, 25.0, 20.0, 20.0, 19.0, 12.0, 13.0, 11.0, 9.0, 13.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0746145099401474, -0.07216963171958923, -0.06972475349903107, -0.0672798752784729, -0.06483499705791473, -0.06239011883735657, -0.0599452406167984, -0.057500362396240234, -0.05505548417568207, -0.0526106059551239, -0.050165727734565735, -0.04772084951400757, -0.0452759712934494, -0.042831093072891235, -0.04038621485233307, -0.0379413366317749, -0.035496458411216736, -0.03305158019065857, -0.030606701970100403, -0.028161823749542236, -0.02571694552898407, -0.023272067308425903, -0.020827189087867737, -0.01838231086730957, -0.015937432646751404, -0.013492554426193237, -0.01104767620563507, -0.008602797985076904, -0.006157919764518738, -0.0037130415439605713, -0.0012681633234024048, 0.0011767148971557617, 0.0036215856671333313, 0.006066463887691498, 0.008511342108249664, 0.01095622032880783, 0.013401098549365997, 0.015845976769924164, 0.01829085499048233, 0.020735733211040497, 0.023180611431598663, 0.02562548965215683, 0.028070367872714996, 0.030515246093273163, 0.03296012431383133, 0.035405002534389496, 0.03784988075494766, 0.04029475897550583, 0.042739637196063995, 0.04518451541662216, 0.04762939363718033, 0.050074271857738495, 0.05251915007829666, 0.05496402829885483, 0.057408906519412994, 0.05985378473997116, 0.06229866296052933, 0.0647435411810875, 0.06718841940164566, 0.06963329762220383, 0.072078175842762, 0.07452305406332016, 0.07696793228387833, 0.07941281050443649, 0.08185768872499466]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 8.0, 9.0, 13.0, 26.0, 31.0, 51.0, 67.0, 104.0, 118.0, 170.0, 269.0, 391.0, 526.0, 716.0, 1080.0, 1549.0, 2186.0, 3189.0, 4722.0, 6984.0, 10432.0, 15883.0, 24693.0, 39588.0, 66535.0, 125504.0, 288971.0, 210413.0, 95628.0, 53274.0, 32960.0, 21038.0, 13409.0, 8878.0, 5905.0, 4130.0, 2759.0, 1893.0, 1303.0, 959.0, 641.0, 454.0, 344.0, 215.0, 184.0, 108.0, 73.0, 53.0, 32.0, 30.0, 19.0, 12.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.058197021484375, -0.0562443733215332, -0.054291725158691406, -0.05233907699584961, -0.05038642883300781, -0.048433780670166016, -0.04648113250732422, -0.04452848434448242, -0.042575836181640625, -0.04062318801879883, -0.03867053985595703, -0.036717891693115234, -0.03476524353027344, -0.03281259536743164, -0.030859947204589844, -0.028907299041748047, -0.02695465087890625, -0.025002002716064453, -0.023049354553222656, -0.02109670639038086, -0.019144058227539062, -0.017191410064697266, -0.015238761901855469, -0.013286113739013672, -0.011333465576171875, -0.009380817413330078, -0.007428169250488281, -0.005475521087646484, -0.0035228729248046875, -0.0015702247619628906, 0.00038242340087890625, 0.002335071563720703, 0.0042877197265625, 0.006240367889404297, 0.008193016052246094, 0.01014566421508789, 0.012098312377929688, 0.014050960540771484, 0.01600360870361328, 0.017956256866455078, 0.019908905029296875, 0.021861553192138672, 0.02381420135498047, 0.025766849517822266, 0.027719497680664062, 0.02967214584350586, 0.031624794006347656, 0.03357744216918945, 0.03553009033203125, 0.03748273849487305, 0.039435386657714844, 0.04138803482055664, 0.04334068298339844, 0.045293331146240234, 0.04724597930908203, 0.04919862747192383, 0.051151275634765625, 0.05310392379760742, 0.05505657196044922, 0.057009220123291016, 0.05896186828613281, 0.06091451644897461, 0.0628671646118164, 0.0648198127746582, 0.0667724609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 13.0, 11.0, 14.0, 19.0, 19.0, 17.0, 28.0, 25.0, 16.0, 34.0, 39.0, 30.0, 45.0, 43.0, 46.0, 39.0, 48.0, 41.0, 43.0, 38.0, 47.0, 44.0, 34.0, 33.0, 27.0, 28.0, 25.0, 24.0, 12.0, 24.0, 12.0, 11.0, 14.0, 7.0, 7.0, 11.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07819080352783203, -0.07551002502441406, -0.0728292465209961, -0.07014846801757812, -0.06746768951416016, -0.06478691101074219, -0.06210613250732422, -0.05942535400390625, -0.05674457550048828, -0.05406379699707031, -0.051383018493652344, -0.048702239990234375, -0.046021461486816406, -0.04334068298339844, -0.04065990447998047, -0.0379791259765625, -0.03529834747314453, -0.03261756896972656, -0.029936790466308594, -0.027256011962890625, -0.024575233459472656, -0.021894454956054688, -0.01921367645263672, -0.01653289794921875, -0.013852119445800781, -0.011171340942382812, -0.008490562438964844, -0.005809783935546875, -0.0031290054321289062, -0.0004482269287109375, 0.0022325515747070312, 0.004913330078125, 0.007594108581542969, 0.010274887084960938, 0.012955665588378906, 0.015636444091796875, 0.018317222595214844, 0.020998001098632812, 0.02367877960205078, 0.02635955810546875, 0.02904033660888672, 0.03172111511230469, 0.034401893615722656, 0.037082672119140625, 0.039763450622558594, 0.04244422912597656, 0.04512500762939453, 0.0478057861328125, 0.05048656463623047, 0.05316734313964844, 0.055848121643066406, 0.058528900146484375, 0.061209678649902344, 0.06389045715332031, 0.06657123565673828, 0.06925201416015625, 0.07193279266357422, 0.07461357116699219, 0.07729434967041016, 0.07997512817382812, 0.0826559066772461, 0.08533668518066406, 0.08801746368408203, 0.0906982421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 16.0, 27.0, 26.0, 34.0, 51.0, 81.0, 116.0, 149.0, 203.0, 308.0, 451.0, 655.0, 987.0, 1376.0, 2116.0, 3398.0, 5613.0, 10016.0, 19942.0, 50333.0, 447987.0, 410706.0, 49219.0, 19486.0, 9775.0, 5513.0, 3347.0, 2142.0, 1353.0, 954.0, 689.0, 448.0, 323.0, 211.0, 153.0, 106.0, 72.0, 51.0, 31.0, 21.0, 20.0, 13.0, 12.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.14453125, -0.1401500701904297, -0.13576889038085938, -0.13138771057128906, -0.12700653076171875, -0.12262535095214844, -0.11824417114257812, -0.11386299133300781, -0.1094818115234375, -0.10510063171386719, -0.10071945190429688, -0.09633827209472656, -0.09195709228515625, -0.08757591247558594, -0.08319473266601562, -0.07881355285644531, -0.074432373046875, -0.07005119323730469, -0.06567001342773438, -0.06128883361816406, -0.05690765380859375, -0.05252647399902344, -0.048145294189453125, -0.04376411437988281, -0.0393829345703125, -0.03500175476074219, -0.030620574951171875, -0.026239395141601562, -0.02185821533203125, -0.017477035522460938, -0.013095855712890625, -0.008714675903320312, -0.00433349609375, 4.76837158203125e-05, 0.004428863525390625, 0.008810043334960938, 0.01319122314453125, 0.017572402954101562, 0.021953582763671875, 0.026334762573242188, 0.0307159423828125, 0.03509712219238281, 0.039478302001953125, 0.04385948181152344, 0.04824066162109375, 0.05262184143066406, 0.057003021240234375, 0.06138420104980469, 0.065765380859375, 0.07014656066894531, 0.07452774047851562, 0.07890892028808594, 0.08329010009765625, 0.08767127990722656, 0.09205245971679688, 0.09643363952636719, 0.1008148193359375, 0.10519599914550781, 0.10957717895507812, 0.11395835876464844, 0.11833953857421875, 0.12272071838378906, 0.12710189819335938, 0.1314830780029297, 0.1358642578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 5.0, 8.0, 9.0, 13.0, 10.0, 8.0, 13.0, 14.0, 20.0, 15.0, 23.0, 34.0, 25.0, 24.0, 27.0, 52.0, 43.0, 31.0, 32.0, 44.0, 33.0, 28.0, 38.0, 37.0, 41.0, 32.0, 34.0, 28.0, 28.0, 31.0, 26.0, 27.0, 15.0, 24.0, 10.0, 16.0, 19.0, 16.0, 13.0, 8.0, 6.0, 7.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.051849365234375, -0.05031299591064453, -0.04877662658691406, -0.047240257263183594, -0.045703887939453125, -0.044167518615722656, -0.04263114929199219, -0.04109477996826172, -0.03955841064453125, -0.03802204132080078, -0.03648567199707031, -0.034949302673339844, -0.033412933349609375, -0.031876564025878906, -0.030340194702148438, -0.02880382537841797, -0.0272674560546875, -0.02573108673095703, -0.024194717407226562, -0.022658348083496094, -0.021121978759765625, -0.019585609436035156, -0.018049240112304688, -0.01651287078857422, -0.01497650146484375, -0.013440132141113281, -0.011903762817382812, -0.010367393493652344, -0.008831024169921875, -0.007294654846191406, -0.0057582855224609375, -0.004221916198730469, -0.002685546875, -0.0011491775512695312, 0.0003871917724609375, 0.0019235610961914062, 0.003459930419921875, 0.004996299743652344, 0.0065326690673828125, 0.008069038391113281, 0.00960540771484375, 0.011141777038574219, 0.012678146362304688, 0.014214515686035156, 0.015750885009765625, 0.017287254333496094, 0.018823623657226562, 0.02035999298095703, 0.0218963623046875, 0.02343273162841797, 0.024969100952148438, 0.026505470275878906, 0.028041839599609375, 0.029578208923339844, 0.031114578247070312, 0.03265094757080078, 0.03418731689453125, 0.03572368621826172, 0.03726005554199219, 0.038796424865722656, 0.040332794189453125, 0.041869163513183594, 0.04340553283691406, 0.04494190216064453, 0.046478271484375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 7.0, 7.0, 20.0, 22.0, 24.0, 26.0, 51.0, 65.0, 89.0, 104.0, 170.0, 230.0, 338.0, 483.0, 729.0, 1171.0, 1960.0, 3414.0, 6722.0, 15035.0, 49372.0, 738534.0, 177888.0, 29041.0, 10621.0, 5086.0, 2683.0, 1625.0, 950.0, 602.0, 419.0, 281.0, 213.0, 150.0, 105.0, 84.0, 77.0, 41.0, 32.0, 24.0, 13.0, 12.0, 7.0, 11.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.024383544921875, -0.023591995239257812, -0.022800445556640625, -0.022008895874023438, -0.02121734619140625, -0.020425796508789062, -0.019634246826171875, -0.018842697143554688, -0.0180511474609375, -0.017259597778320312, -0.016468048095703125, -0.015676498413085938, -0.01488494873046875, -0.014093399047851562, -0.013301849365234375, -0.012510299682617188, -0.01171875, -0.010927200317382812, -0.010135650634765625, -0.009344100952148438, -0.00855255126953125, -0.0077610015869140625, -0.006969451904296875, -0.0061779022216796875, -0.0053863525390625, -0.0045948028564453125, -0.003803253173828125, -0.0030117034912109375, -0.00222015380859375, -0.0014286041259765625, -0.000637054443359375, 0.0001544952392578125, 0.000946044921875, 0.0017375946044921875, 0.002529144287109375, 0.0033206939697265625, 0.00411224365234375, 0.0049037933349609375, 0.005695343017578125, 0.0064868927001953125, 0.0072784423828125, 0.008069992065429688, 0.008861541748046875, 0.009653091430664062, 0.01044464111328125, 0.011236190795898438, 0.012027740478515625, 0.012819290161132812, 0.01361083984375, 0.014402389526367188, 0.015193939208984375, 0.015985488891601562, 0.01677703857421875, 0.017568588256835938, 0.018360137939453125, 0.019151687622070312, 0.0199432373046875, 0.020734786987304688, 0.021526336669921875, 0.022317886352539062, 0.02310943603515625, 0.023900985717773438, 0.024692535400390625, 0.025484085083007812, 0.026275634765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 7.0, 3.0, 3.0, 10.0, 11.0, 9.0, 0.0, 16.0, 19.0, 25.0, 33.0, 53.0, 54.0, 0.0, 79.0, 62.0, 78.0, 81.0, 91.0, 67.0, 0.0, 56.0, 62.0, 36.0, 45.0, 24.0, 15.0, 0.0, 19.0, 12.0, 11.0, 9.0, 4.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6177073121070862e-06, -1.5664845705032349e-06, -1.5152618288993835e-06, -1.4640390872955322e-06, -1.412816345691681e-06, -1.3615936040878296e-06, -1.3103708624839783e-06, -1.259148120880127e-06, -1.2079253792762756e-06, -1.1567026376724243e-06, -1.105479896068573e-06, -1.0542571544647217e-06, -1.0030344128608704e-06, -9.51811671257019e-07, -9.005889296531677e-07, -8.493661880493164e-07, -7.981434464454651e-07, -7.469207048416138e-07, -6.956979632377625e-07, -6.444752216339111e-07, -5.932524800300598e-07, -5.420297384262085e-07, -4.908069968223572e-07, -4.3958425521850586e-07, -3.8836151361465454e-07, -3.371387720108032e-07, -2.859160304069519e-07, -2.3469328880310059e-07, -1.8347054719924927e-07, -1.3224780559539795e-07, -8.102506399154663e-08, -2.9802322387695312e-08, 2.1420419216156006e-08, 7.264316082000732e-08, 1.2386590242385864e-07, 1.7508864402770996e-07, 2.2631138563156128e-07, 2.775341272354126e-07, 3.287568688392639e-07, 3.7997961044311523e-07, 4.3120235204696655e-07, 4.824250936508179e-07, 5.336478352546692e-07, 5.848705768585205e-07, 6.360933184623718e-07, 6.873160600662231e-07, 7.385388016700745e-07, 7.897615432739258e-07, 8.409842848777771e-07, 8.922070264816284e-07, 9.434297680854797e-07, 9.94652509689331e-07, 1.0458752512931824e-06, 1.0970979928970337e-06, 1.148320734500885e-06, 1.1995434761047363e-06, 1.2507662177085876e-06, 1.301988959312439e-06, 1.3532117009162903e-06, 1.4044344425201416e-06, 1.455657184123993e-06, 1.5068799257278442e-06, 1.5581026673316956e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 16.0, 22.0, 28.0, 43.0, 43.0, 78.0, 113.0, 130.0, 176.0, 257.0, 347.0, 456.0, 735.0, 996.0, 1495.0, 2182.0, 3590.0, 5763.0, 10035.0, 18632.0, 39298.0, 112001.0, 540392.0, 198547.0, 56671.0, 24407.0, 12511.0, 6987.0, 4249.0, 2632.0, 1741.0, 1147.0, 800.0, 530.0, 441.0, 276.0, 214.0, 158.0, 98.0, 78.0, 60.0, 38.0, 34.0, 31.0, 17.0, 12.0, 9.0, 10.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.01617431640625, -0.015679597854614258, -0.015184879302978516, -0.014690160751342773, -0.014195442199707031, -0.013700723648071289, -0.013206005096435547, -0.012711286544799805, -0.012216567993164062, -0.01172184944152832, -0.011227130889892578, -0.010732412338256836, -0.010237693786621094, -0.009742975234985352, -0.00924825668334961, -0.008753538131713867, -0.008258819580078125, -0.007764101028442383, -0.007269382476806641, -0.0067746639251708984, -0.006279945373535156, -0.005785226821899414, -0.005290508270263672, -0.00479578971862793, -0.0043010711669921875, -0.0038063526153564453, -0.003311634063720703, -0.002816915512084961, -0.0023221969604492188, -0.0018274784088134766, -0.0013327598571777344, -0.0008380413055419922, -0.00034332275390625, 0.0001513957977294922, 0.0006461143493652344, 0.0011408329010009766, 0.0016355514526367188, 0.002130270004272461, 0.002624988555908203, 0.0031197071075439453, 0.0036144256591796875, 0.00410914421081543, 0.004603862762451172, 0.005098581314086914, 0.005593299865722656, 0.0060880184173583984, 0.006582736968994141, 0.007077455520629883, 0.007572174072265625, 0.008066892623901367, 0.00856161117553711, 0.009056329727172852, 0.009551048278808594, 0.010045766830444336, 0.010540485382080078, 0.01103520393371582, 0.011529922485351562, 0.012024641036987305, 0.012519359588623047, 0.013014078140258789, 0.013508796691894531, 0.014003515243530273, 0.014498233795166016, 0.014992952346801758, 0.0154876708984375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 8.0, 3.0, 5.0, 3.0, 7.0, 15.0, 16.0, 26.0, 19.0, 43.0, 35.0, 63.0, 125.0, 198.0, 123.0, 62.0, 55.0, 37.0, 35.0, 17.0, 21.0, 10.0, 15.0, 8.0, 3.0, 11.0, 8.0, 2.0, 4.0, 1.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038089752197265625, -0.0036701858043670654, -0.0035313963890075684, -0.0033926069736480713, -0.0032538175582885742, -0.003115028142929077, -0.00297623872756958, -0.002837449312210083, -0.002698659896850586, -0.002559870481491089, -0.002421081066131592, -0.0022822916507720947, -0.0021435022354125977, -0.0020047128200531006, -0.0018659234046936035, -0.0017271339893341064, -0.0015883445739746094, -0.0014495551586151123, -0.0013107657432556152, -0.0011719763278961182, -0.001033186912536621, -0.000894397497177124, -0.000755608081817627, -0.0006168186664581299, -0.0004780292510986328, -0.00033923983573913574, -0.00020045042037963867, -6.16610050201416e-05, 7.712841033935547e-05, 0.00021591782569885254, 0.0003547072410583496, 0.0004934966564178467, 0.0006322860717773438, 0.0007710754871368408, 0.0009098649024963379, 0.001048654317855835, 0.001187443733215332, 0.001326233148574829, 0.0014650225639343262, 0.0016038119792938232, 0.0017426013946533203, 0.0018813908100128174, 0.0020201802253723145, 0.0021589696407318115, 0.0022977590560913086, 0.0024365484714508057, 0.0025753378868103027, 0.0027141273021698, 0.002852916717529297, 0.002991706132888794, 0.003130495548248291, 0.003269284963607788, 0.003408074378967285, 0.0035468637943267822, 0.0036856532096862793, 0.0038244426250457764, 0.0039632320404052734, 0.0041020214557647705, 0.004240810871124268, 0.004379600286483765, 0.004518389701843262, 0.004657179117202759, 0.004795968532562256, 0.004934757947921753, 0.00507354736328125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 11.0, 13.0, 34.0, 19.0, 40.0, 37.0, 65.0, 78.0, 84.0, 128.0, 103.0, 90.0, 51.0, 57.0, 35.0, 34.0, 28.0, 14.0, 11.0, 17.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15215714275836945, -0.14779318869113922, -0.1434292495250702, -0.13906529545783997, -0.13470134139060974, -0.13033738732337952, -0.12597344815731049, -0.12160949409008026, -0.11724554747343063, -0.112881600856781, -0.10851764678955078, -0.10415370017290115, -0.09978975355625153, -0.0954257994890213, -0.09106185287237167, -0.08669790625572205, -0.08233395218849182, -0.0779700055718422, -0.07360605150461197, -0.06924210488796234, -0.06487815082073212, -0.06051420420408249, -0.05615025758743286, -0.051786307245492935, -0.04742235690355301, -0.04305840656161308, -0.03869445621967316, -0.03433050960302353, -0.029966559261083603, -0.025602608919143677, -0.0212386604398489, -0.016874711960554123, -0.01251077651977539, -0.008146827109158039, -0.0037828776985406876, 0.000581071712076664, 0.0049450211226940155, 0.009308971464633942, 0.013672919943928719, 0.018036868423223495, 0.02240081876516342, 0.026764769107103348, 0.031128717586398125, 0.0354926660656929, 0.03985661640763283, 0.044220566749572754, 0.04858451336622238, 0.05294846370816231, 0.057312414050102234, 0.06167636439204216, 0.06604031473398209, 0.07040426135063171, 0.07476821541786194, 0.07913216203451157, 0.0834961086511612, 0.08786006271839142, 0.09222400933504105, 0.09658795595169067, 0.1009519100189209, 0.10531585663557053, 0.10967980325222015, 0.11404375731945038, 0.1184077039361, 0.12277165055274963, 0.12713560461997986]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 13.0, 14.0, 17.0, 21.0, 18.0, 25.0, 32.0, 13.0, 34.0, 45.0, 25.0, 35.0, 41.0, 36.0, 54.0, 38.0, 34.0, 36.0, 34.0, 40.0, 43.0, 33.0, 34.0, 31.0, 35.0, 16.0, 29.0, 17.0, 18.0, 22.0, 13.0, 9.0, 13.0, 11.0, 11.0, 4.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0738101676106453, -0.07139213383197784, -0.0689741000533104, -0.06655605882406235, -0.0641380250453949, -0.06171999126672745, -0.05930195748806, -0.05688392370939255, -0.0544658862054348, -0.05204785242676735, -0.0496298149228096, -0.04721178114414215, -0.0447937473654747, -0.04237570986151695, -0.0399576760828495, -0.037539638578891754, -0.035121604800224304, -0.032703571021556854, -0.030285533517599106, -0.027867499738931656, -0.025449464097619057, -0.023031428456306458, -0.020613394677639008, -0.01819535903632641, -0.01577732339501381, -0.01335928775370121, -0.010941253043711185, -0.008523218333721161, -0.006105182692408562, -0.0036871470510959625, -0.001269112341105938, 0.0011489223688840866, 0.003566958010196686, 0.005984993185847998, 0.00840302836149931, 0.010821063071489334, 0.013239098712801933, 0.015657134354114532, 0.018075168132781982, 0.02049320377409458, 0.02291123941540718, 0.02532927505671978, 0.02774731069803238, 0.03016534447669983, 0.03258337825536728, 0.03500141575932503, 0.03741944953799248, 0.039837487041950226, 0.042255520820617676, 0.044673554599285126, 0.047091592103242874, 0.049509625881910324, 0.05192766338586807, 0.05434569716453552, 0.05676373094320297, 0.05918176472187042, 0.06159980222582817, 0.06401783972978592, 0.06643587350845337, 0.06885390728712082, 0.07127194106578827, 0.07368998229503632, 0.07610801607370377, 0.07852604985237122, 0.08094408363103867]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 11.0, 13.0, 26.0, 27.0, 47.0, 78.0, 112.0, 165.0, 251.0, 339.0, 542.0, 727.0, 1104.0, 1662.0, 2405.0, 3494.0, 5021.0, 7391.0, 11305.0, 16828.0, 26332.0, 42945.0, 74577.0, 139964.0, 258417.0, 198415.0, 102063.0, 56690.0, 33999.0, 21174.0, 13857.0, 9113.0, 6076.0, 4289.0, 2937.0, 1908.0, 1351.0, 890.0, 620.0, 423.0, 299.0, 197.0, 137.0, 109.0, 74.0, 47.0, 30.0, 24.0, 21.0, 14.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.15283203125, -0.14816665649414062, -0.14350128173828125, -0.13883590698242188, -0.1341705322265625, -0.12950515747070312, -0.12483978271484375, -0.12017440795898438, -0.115509033203125, -0.11084365844726562, -0.10617828369140625, -0.10151290893554688, -0.0968475341796875, -0.09218215942382812, -0.08751678466796875, -0.08285140991210938, -0.07818603515625, -0.07352066040039062, -0.06885528564453125, -0.06418991088867188, -0.0595245361328125, -0.054859161376953125, -0.05019378662109375, -0.045528411865234375, -0.040863037109375, -0.036197662353515625, -0.03153228759765625, -0.026866912841796875, -0.0222015380859375, -0.017536163330078125, -0.01287078857421875, -0.008205413818359375, -0.0035400390625, 0.001125335693359375, 0.00579071044921875, 0.010456085205078125, 0.0151214599609375, 0.019786834716796875, 0.02445220947265625, 0.029117584228515625, 0.033782958984375, 0.038448333740234375, 0.04311370849609375, 0.047779083251953125, 0.0524444580078125, 0.057109832763671875, 0.06177520751953125, 0.06644058227539062, 0.07110595703125, 0.07577133178710938, 0.08043670654296875, 0.08510208129882812, 0.0897674560546875, 0.09443283081054688, 0.09909820556640625, 0.10376358032226562, 0.108428955078125, 0.11309432983398438, 0.11775970458984375, 0.12242507934570312, 0.1270904541015625, 0.13175582885742188, 0.13642120361328125, 0.14108657836914062, 0.145751953125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 9.0, 4.0, 7.0, 9.0, 12.0, 15.0, 17.0, 17.0, 14.0, 19.0, 29.0, 28.0, 33.0, 29.0, 29.0, 40.0, 30.0, 41.0, 43.0, 34.0, 34.0, 34.0, 30.0, 35.0, 50.0, 35.0, 43.0, 29.0, 26.0, 24.0, 26.0, 23.0, 20.0, 21.0, 17.0, 8.0, 13.0, 21.0, 6.0, 6.0, 5.0, 6.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.060394287109375, -0.05832529067993164, -0.05625629425048828, -0.05418729782104492, -0.05211830139160156, -0.0500493049621582, -0.047980308532714844, -0.045911312103271484, -0.043842315673828125, -0.041773319244384766, -0.039704322814941406, -0.03763532638549805, -0.03556632995605469, -0.03349733352661133, -0.03142833709716797, -0.02935934066772461, -0.02729034423828125, -0.02522134780883789, -0.02315235137939453, -0.021083354949951172, -0.019014358520507812, -0.016945362091064453, -0.014876365661621094, -0.012807369232177734, -0.010738372802734375, -0.008669376373291016, -0.006600379943847656, -0.004531383514404297, -0.0024623870849609375, -0.0003933906555175781, 0.0016756057739257812, 0.0037446022033691406, 0.0058135986328125, 0.00788259506225586, 0.009951591491699219, 0.012020587921142578, 0.014089584350585938, 0.016158580780029297, 0.018227577209472656, 0.020296573638916016, 0.022365570068359375, 0.024434566497802734, 0.026503562927246094, 0.028572559356689453, 0.030641555786132812, 0.03271055221557617, 0.03477954864501953, 0.03684854507446289, 0.03891754150390625, 0.04098653793334961, 0.04305553436279297, 0.04512453079223633, 0.04719352722167969, 0.04926252365112305, 0.051331520080566406, 0.053400516510009766, 0.055469512939453125, 0.057538509368896484, 0.059607505798339844, 0.0616765022277832, 0.06374549865722656, 0.06581449508666992, 0.06788349151611328, 0.06995248794555664, 0.072021484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 10.0, 5.0, 17.0, 28.0, 27.0, 41.0, 53.0, 82.0, 110.0, 169.0, 251.0, 421.0, 653.0, 969.0, 1359.0, 2187.0, 3418.0, 5212.0, 8300.0, 12996.0, 21035.0, 34087.0, 55117.0, 93511.0, 174342.0, 271348.0, 149019.0, 82978.0, 48885.0, 30310.0, 18872.0, 11792.0, 7349.0, 4754.0, 3052.0, 2005.0, 1278.0, 804.0, 527.0, 368.0, 242.0, 157.0, 110.0, 91.0, 66.0, 44.0, 22.0, 29.0, 15.0, 12.0, 8.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.14013671875, -0.13552474975585938, -0.13091278076171875, -0.12630081176757812, -0.1216888427734375, -0.11707687377929688, -0.11246490478515625, -0.10785293579101562, -0.103240966796875, -0.09862899780273438, -0.09401702880859375, -0.08940505981445312, -0.0847930908203125, -0.08018112182617188, -0.07556915283203125, -0.07095718383789062, -0.06634521484375, -0.061733245849609375, -0.05712127685546875, -0.052509307861328125, -0.0478973388671875, -0.043285369873046875, -0.03867340087890625, -0.034061431884765625, -0.029449462890625, -0.024837493896484375, -0.02022552490234375, -0.015613555908203125, -0.0110015869140625, -0.006389617919921875, -0.00177764892578125, 0.002834320068359375, 0.0074462890625, 0.012058258056640625, 0.01667022705078125, 0.021282196044921875, 0.0258941650390625, 0.030506134033203125, 0.03511810302734375, 0.039730072021484375, 0.044342041015625, 0.048954010009765625, 0.05356597900390625, 0.058177947998046875, 0.0627899169921875, 0.06740188598632812, 0.07201385498046875, 0.07662582397460938, 0.08123779296875, 0.08584976196289062, 0.09046173095703125, 0.09507369995117188, 0.0996856689453125, 0.10429763793945312, 0.10890960693359375, 0.11352157592773438, 0.118133544921875, 0.12274551391601562, 0.12735748291015625, 0.13196945190429688, 0.1365814208984375, 0.14119338989257812, 0.14580535888671875, 0.15041732788085938, 0.155029296875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 10.0, 14.0, 8.0, 12.0, 12.0, 15.0, 11.0, 23.0, 29.0, 30.0, 28.0, 29.0, 30.0, 32.0, 29.0, 37.0, 42.0, 35.0, 40.0, 45.0, 31.0, 33.0, 30.0, 52.0, 34.0, 31.0, 40.0, 50.0, 24.0, 27.0, 23.0, 13.0, 23.0, 16.0, 12.0, 12.0, 10.0, 6.0, 5.0, 8.0, 4.0, 6.0, 0.0, 1.0, 2.0], "bins": [-0.05352783203125, -0.052135467529296875, -0.05074310302734375, -0.049350738525390625, -0.0479583740234375, -0.046566009521484375, -0.04517364501953125, -0.043781280517578125, -0.042388916015625, -0.040996551513671875, -0.03960418701171875, -0.038211822509765625, -0.0368194580078125, -0.035427093505859375, -0.03403472900390625, -0.032642364501953125, -0.03125, -0.029857635498046875, -0.02846527099609375, -0.027072906494140625, -0.0256805419921875, -0.024288177490234375, -0.02289581298828125, -0.021503448486328125, -0.020111083984375, -0.018718719482421875, -0.01732635498046875, -0.015933990478515625, -0.0145416259765625, -0.013149261474609375, -0.01175689697265625, -0.010364532470703125, -0.00897216796875, -0.007579803466796875, -0.00618743896484375, -0.004795074462890625, -0.0034027099609375, -0.002010345458984375, -0.00061798095703125, 0.000774383544921875, 0.002166748046875, 0.003559112548828125, 0.00495147705078125, 0.006343841552734375, 0.0077362060546875, 0.009128570556640625, 0.01052093505859375, 0.011913299560546875, 0.0133056640625, 0.014698028564453125, 0.01609039306640625, 0.017482757568359375, 0.0188751220703125, 0.020267486572265625, 0.02165985107421875, 0.023052215576171875, 0.024444580078125, 0.025836944580078125, 0.02722930908203125, 0.028621673583984375, 0.0300140380859375, 0.031406402587890625, 0.03279876708984375, 0.034191131591796875, 0.03558349609375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 12.0, 10.0, 12.0, 18.0, 24.0, 34.0, 45.0, 61.0, 73.0, 109.0, 125.0, 191.0, 275.0, 345.0, 428.0, 600.0, 824.0, 1202.0, 1690.0, 2525.0, 3894.0, 6400.0, 10692.0, 22999.0, 754571.0, 192073.0, 21070.0, 10114.0, 6002.0, 3813.0, 2476.0, 1572.0, 1176.0, 789.0, 601.0, 438.0, 313.0, 245.0, 173.0, 135.0, 105.0, 82.0, 64.0, 44.0, 35.0, 22.0, 9.0, 13.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.03753662109375, -0.036397457122802734, -0.03525829315185547, -0.0341191291809082, -0.03297996520996094, -0.03184080123901367, -0.030701637268066406, -0.02956247329711914, -0.028423309326171875, -0.02728414535522461, -0.026144981384277344, -0.025005817413330078, -0.023866653442382812, -0.022727489471435547, -0.02158832550048828, -0.020449161529541016, -0.01930999755859375, -0.018170833587646484, -0.01703166961669922, -0.015892505645751953, -0.014753341674804688, -0.013614177703857422, -0.012475013732910156, -0.01133584976196289, -0.010196685791015625, -0.00905752182006836, -0.007918357849121094, -0.006779193878173828, -0.0056400299072265625, -0.004500865936279297, -0.0033617019653320312, -0.0022225379943847656, -0.0010833740234375, 5.5789947509765625e-05, 0.0011949539184570312, 0.002334117889404297, 0.0034732818603515625, 0.004612445831298828, 0.005751609802246094, 0.006890773773193359, 0.008029937744140625, 0.00916910171508789, 0.010308265686035156, 0.011447429656982422, 0.012586593627929688, 0.013725757598876953, 0.014864921569824219, 0.016004085540771484, 0.01714324951171875, 0.018282413482666016, 0.01942157745361328, 0.020560741424560547, 0.021699905395507812, 0.022839069366455078, 0.023978233337402344, 0.02511739730834961, 0.026256561279296875, 0.02739572525024414, 0.028534889221191406, 0.029674053192138672, 0.030813217163085938, 0.0319523811340332, 0.03309154510498047, 0.034230709075927734, 0.035369873046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 4.0, 7.0, 7.0, 5.0, 14.0, 19.0, 16.0, 30.0, 52.0, 69.0, 85.0, 118.0, 127.0, 106.0, 83.0, 79.0, 54.0, 29.0, 35.0, 18.0, 8.0, 7.0, 9.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06, 1.9073486328125e-06, 1.9669532775878906e-06, 2.0265579223632812e-06, 2.086162567138672e-06, 2.1457672119140625e-06, 2.205371856689453e-06, 2.2649765014648438e-06, 2.3245811462402344e-06, 2.384185791015625e-06, 2.4437904357910156e-06, 2.5033950805664062e-06, 2.562999725341797e-06, 2.6226043701171875e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 2.0, 2.0, 4.0, 17.0, 17.0, 27.0, 27.0, 41.0, 74.0, 91.0, 94.0, 147.0, 206.0, 315.0, 416.0, 628.0, 925.0, 1172.0, 1758.0, 2562.0, 3815.0, 6016.0, 9907.0, 21196.0, 548224.0, 401435.0, 21188.0, 9925.0, 5927.0, 3877.0, 2494.0, 1837.0, 1198.0, 874.0, 609.0, 442.0, 303.0, 226.0, 140.0, 101.0, 96.0, 60.0, 38.0, 24.0, 23.0, 19.0, 10.0, 7.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033447265625, -0.03236818313598633, -0.031289100646972656, -0.030210018157958984, -0.029130935668945312, -0.02805185317993164, -0.02697277069091797, -0.025893688201904297, -0.024814605712890625, -0.023735523223876953, -0.02265644073486328, -0.02157735824584961, -0.020498275756835938, -0.019419193267822266, -0.018340110778808594, -0.017261028289794922, -0.01618194580078125, -0.015102863311767578, -0.014023780822753906, -0.012944698333740234, -0.011865615844726562, -0.01078653335571289, -0.009707450866699219, -0.008628368377685547, -0.007549285888671875, -0.006470203399658203, -0.005391120910644531, -0.004312038421630859, -0.0032329559326171875, -0.0021538734436035156, -0.0010747909545898438, 4.291534423828125e-06, 0.0010833740234375, 0.002162456512451172, 0.0032415390014648438, 0.004320621490478516, 0.0053997039794921875, 0.006478786468505859, 0.007557868957519531, 0.008636951446533203, 0.009716033935546875, 0.010795116424560547, 0.011874198913574219, 0.01295328140258789, 0.014032363891601562, 0.015111446380615234, 0.016190528869628906, 0.017269611358642578, 0.01834869384765625, 0.019427776336669922, 0.020506858825683594, 0.021585941314697266, 0.022665023803710938, 0.02374410629272461, 0.02482318878173828, 0.025902271270751953, 0.026981353759765625, 0.028060436248779297, 0.02913951873779297, 0.03021860122680664, 0.03129768371582031, 0.032376766204833984, 0.033455848693847656, 0.03453493118286133, 0.035614013671875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 7.0, 12.0, 10.0, 40.0, 493.0, 292.0, 28.0, 22.0, 13.0, 6.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01102447509765625, -0.010689973831176758, -0.010355472564697266, -0.010020971298217773, -0.009686470031738281, -0.009351968765258789, -0.009017467498779297, -0.008682966232299805, -0.008348464965820312, -0.00801396369934082, -0.007679462432861328, -0.007344961166381836, -0.007010459899902344, -0.0066759586334228516, -0.006341457366943359, -0.006006956100463867, -0.005672454833984375, -0.005337953567504883, -0.005003452301025391, -0.0046689510345458984, -0.004334449768066406, -0.003999948501586914, -0.003665447235107422, -0.0033309459686279297, -0.0029964447021484375, -0.0026619434356689453, -0.002327442169189453, -0.001992940902709961, -0.0016584396362304688, -0.0013239383697509766, -0.0009894371032714844, -0.0006549358367919922, -0.0003204345703125, 1.4066696166992188e-05, 0.0003485679626464844, 0.0006830692291259766, 0.0010175704956054688, 0.001352071762084961, 0.0016865730285644531, 0.0020210742950439453, 0.0023555755615234375, 0.0026900768280029297, 0.003024578094482422, 0.003359079360961914, 0.0036935806274414062, 0.0040280818939208984, 0.004362583160400391, 0.004697084426879883, 0.005031585693359375, 0.005366086959838867, 0.005700588226318359, 0.0060350894927978516, 0.006369590759277344, 0.006704092025756836, 0.007038593292236328, 0.00737309455871582, 0.0077075958251953125, 0.008042097091674805, 0.008376598358154297, 0.008711099624633789, 0.009045600891113281, 0.009380102157592773, 0.009714603424072266, 0.010049104690551758, 0.01038360595703125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 16.0, 18.0, 19.0, 18.0, 36.0, 31.0, 53.0, 79.0, 106.0, 106.0, 113.0, 83.0, 72.0, 51.0, 42.0, 27.0, 33.0, 19.0, 13.0, 14.0, 4.0, 6.0, 13.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.145944744348526, -0.14200077950954437, -0.13805681467056274, -0.13411284983158112, -0.1301688849925995, -0.12622492015361786, -0.12228095531463623, -0.1183369904756546, -0.11439302563667297, -0.11044906079769135, -0.10650509595870972, -0.10256113111972809, -0.09861716628074646, -0.09467320144176483, -0.0907292366027832, -0.08678527176380157, -0.08284130692481995, -0.07889734208583832, -0.07495337724685669, -0.07100941240787506, -0.06706544756889343, -0.0631214827299118, -0.059177517890930176, -0.05523355305194855, -0.05128958821296692, -0.04734562337398529, -0.04340165853500366, -0.039457693696022034, -0.035513728857040405, -0.03156976401805878, -0.02762579917907715, -0.02368183434009552, -0.019737862050533295, -0.015793897211551666, -0.011849932372570038, -0.00790596753358841, -0.003962002694606781, -1.8037855625152588e-05, 0.003925926983356476, 0.007869891822338104, 0.011813856661319733, 0.01575782150030136, 0.01970178633928299, 0.023645751178264618, 0.027589716017246246, 0.031533680856227875, 0.0354776456952095, 0.03942161053419113, 0.04336557537317276, 0.04730954021215439, 0.05125350505113602, 0.055197469890117645, 0.059141434729099274, 0.0630853995680809, 0.06702936440706253, 0.07097332924604416, 0.07491729408502579, 0.07886125892400742, 0.08280522376298904, 0.08674918860197067, 0.0906931534409523, 0.09463711827993393, 0.09858108311891556, 0.10252504795789719, 0.10646901279687881]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 5.0, 7.0, 9.0, 15.0, 17.0, 13.0, 22.0, 22.0, 24.0, 35.0, 20.0, 36.0, 34.0, 42.0, 35.0, 36.0, 34.0, 43.0, 32.0, 42.0, 48.0, 43.0, 28.0, 45.0, 28.0, 34.0, 29.0, 20.0, 31.0, 20.0, 21.0, 17.0, 17.0, 19.0, 12.0, 12.0, 9.0, 7.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.06962723284959793, -0.06739553809165955, -0.06516385078430176, -0.06293215602636337, -0.060700464993715286, -0.0584687739610672, -0.056237079203128815, -0.05400538817048073, -0.05177369713783264, -0.049542006105184555, -0.04731031134724617, -0.045078620314598083, -0.04284692928195, -0.04061523824930191, -0.038383543491363525, -0.03615185245871544, -0.033920157700777054, -0.03168846666812897, -0.02945677377283573, -0.027225080877542496, -0.02499338984489441, -0.022761696949601173, -0.020530004054307938, -0.01829831302165985, -0.016066620126366615, -0.013834928162395954, -0.011603236198425293, -0.009371543303132057, -0.007139851339161396, -0.004908159375190735, -0.002676466479897499, -0.0004447745159268379, 0.0017869174480438232, 0.004018609412014484, 0.006250301841646433, 0.008481994271278381, 0.010713686235249043, 0.012945378199219704, 0.01517707109451294, 0.017408762127161026, 0.019640455022454262, 0.021872147917747498, 0.024103838950395584, 0.02633553184568882, 0.028567224740982056, 0.030798915773630142, 0.03303060680627823, 0.035262301564216614, 0.0374939925968647, 0.03972568362951279, 0.04195737838745117, 0.04418906942009926, 0.046420760452747345, 0.04865245521068573, 0.050884146243333817, 0.0531158372759819, 0.05534753203392029, 0.057579223066568375, 0.05981091782450676, 0.062042608857154846, 0.06427430361509323, 0.06650599092245102, 0.0687376856803894, 0.07096938043832779, 0.07320106774568558]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 7.0, 20.0, 17.0, 38.0, 48.0, 67.0, 103.0, 160.0, 196.0, 336.0, 508.0, 767.0, 1131.0, 1605.0, 2481.0, 3761.0, 5748.0, 8795.0, 13722.0, 22019.0, 36605.0, 62027.0, 112830.0, 233546.0, 691462.0, 1717806.0, 741250.0, 241729.0, 119969.0, 66840.0, 39569.0, 24144.0, 15030.0, 9798.0, 6512.0, 4298.0, 2787.0, 1988.0, 1362.0, 906.0, 648.0, 461.0, 352.0, 237.0, 171.0, 141.0, 83.0, 69.0, 55.0, 24.0, 17.0, 15.0, 8.0, 10.0, 4.0, 4.0, 3.0], "bins": [-0.0975341796875, -0.09453678131103516, -0.09153938293457031, -0.08854198455810547, -0.08554458618164062, -0.08254718780517578, -0.07954978942871094, -0.0765523910522461, -0.07355499267578125, -0.0705575942993164, -0.06756019592285156, -0.06456279754638672, -0.061565399169921875, -0.05856800079345703, -0.05557060241699219, -0.052573204040527344, -0.0495758056640625, -0.046578407287597656, -0.04358100891113281, -0.04058361053466797, -0.037586212158203125, -0.03458881378173828, -0.03159141540527344, -0.028594017028808594, -0.02559661865234375, -0.022599220275878906, -0.019601821899414062, -0.01660442352294922, -0.013607025146484375, -0.010609626770019531, -0.0076122283935546875, -0.004614830017089844, -0.001617431640625, 0.0013799667358398438, 0.0043773651123046875, 0.007374763488769531, 0.010372161865234375, 0.013369560241699219, 0.016366958618164062, 0.019364356994628906, 0.02236175537109375, 0.025359153747558594, 0.028356552124023438, 0.03135395050048828, 0.034351348876953125, 0.03734874725341797, 0.04034614562988281, 0.043343544006347656, 0.0463409423828125, 0.049338340759277344, 0.05233573913574219, 0.05533313751220703, 0.058330535888671875, 0.06132793426513672, 0.06432533264160156, 0.0673227310180664, 0.07032012939453125, 0.0733175277709961, 0.07631492614746094, 0.07931232452392578, 0.08230972290039062, 0.08530712127685547, 0.08830451965332031, 0.09130191802978516, 0.09429931640625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 7.0, 6.0, 9.0, 10.0, 11.0, 15.0, 22.0, 23.0, 20.0, 37.0, 31.0, 43.0, 21.0, 49.0, 46.0, 40.0, 51.0, 43.0, 38.0, 45.0, 42.0, 42.0, 30.0, 35.0, 37.0, 48.0, 21.0, 28.0, 21.0, 17.0, 20.0, 14.0, 18.0, 8.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046966552734375, -0.04551553726196289, -0.04406452178955078, -0.04261350631713867, -0.04116249084472656, -0.03971147537231445, -0.038260459899902344, -0.036809444427490234, -0.035358428955078125, -0.033907413482666016, -0.032456398010253906, -0.031005382537841797, -0.029554367065429688, -0.028103351593017578, -0.02665233612060547, -0.02520132064819336, -0.02375030517578125, -0.02229928970336914, -0.02084827423095703, -0.019397258758544922, -0.017946243286132812, -0.016495227813720703, -0.015044212341308594, -0.013593196868896484, -0.012142181396484375, -0.010691165924072266, -0.009240150451660156, -0.007789134979248047, -0.0063381195068359375, -0.004887104034423828, -0.0034360885620117188, -0.0019850730895996094, -0.0005340576171875, 0.0009169578552246094, 0.0023679733276367188, 0.003818988800048828, 0.0052700042724609375, 0.006721019744873047, 0.008172035217285156, 0.009623050689697266, 0.011074066162109375, 0.012525081634521484, 0.013976097106933594, 0.015427112579345703, 0.016878128051757812, 0.018329143524169922, 0.01978015899658203, 0.02123117446899414, 0.02268218994140625, 0.02413320541381836, 0.02558422088623047, 0.027035236358642578, 0.028486251831054688, 0.029937267303466797, 0.031388282775878906, 0.032839298248291016, 0.034290313720703125, 0.035741329193115234, 0.037192344665527344, 0.03864336013793945, 0.04009437561035156, 0.04154539108276367, 0.04299640655517578, 0.04444742202758789, 0.0458984375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 7.0, 11.0, 12.0, 13.0, 30.0, 39.0, 55.0, 87.0, 124.0, 195.0, 280.0, 356.0, 581.0, 874.0, 1247.0, 1877.0, 2718.0, 4245.0, 6464.0, 9780.0, 15426.0, 23939.0, 38498.0, 63745.0, 108837.0, 194450.0, 380632.0, 877534.0, 1299523.0, 543932.0, 263314.0, 141957.0, 81345.0, 48432.0, 29786.0, 18861.0, 11946.0, 7804.0, 4974.0, 3372.0, 2246.0, 1520.0, 1033.0, 692.0, 500.0, 314.0, 236.0, 148.0, 98.0, 75.0, 39.0, 35.0, 25.0, 11.0, 7.0, 11.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.06768798828125, -0.06558799743652344, -0.06348800659179688, -0.06138801574707031, -0.05928802490234375, -0.05718803405761719, -0.055088043212890625, -0.05298805236816406, -0.0508880615234375, -0.04878807067871094, -0.046688079833984375, -0.04458808898925781, -0.04248809814453125, -0.04038810729980469, -0.038288116455078125, -0.03618812561035156, -0.034088134765625, -0.03198814392089844, -0.029888153076171875, -0.027788162231445312, -0.02568817138671875, -0.023588180541992188, -0.021488189697265625, -0.019388198852539062, -0.0172882080078125, -0.015188217163085938, -0.013088226318359375, -0.010988235473632812, -0.00888824462890625, -0.0067882537841796875, -0.004688262939453125, -0.0025882720947265625, -0.00048828125, 0.0016117095947265625, 0.003711700439453125, 0.0058116912841796875, 0.00791168212890625, 0.010011672973632812, 0.012111663818359375, 0.014211654663085938, 0.0163116455078125, 0.018411636352539062, 0.020511627197265625, 0.022611618041992188, 0.02471160888671875, 0.026811599731445312, 0.028911590576171875, 0.031011581420898438, 0.033111572265625, 0.03521156311035156, 0.037311553955078125, 0.03941154479980469, 0.04151153564453125, 0.04361152648925781, 0.045711517333984375, 0.04781150817871094, 0.0499114990234375, 0.05201148986816406, 0.054111480712890625, 0.05621147155761719, 0.05831146240234375, 0.06041145324707031, 0.06251144409179688, 0.06461143493652344, 0.06671142578125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 3.0, 7.0, 7.0, 12.0, 15.0, 11.0, 15.0, 37.0, 33.0, 43.0, 55.0, 71.0, 64.0, 105.0, 150.0, 128.0, 156.0, 156.0, 205.0, 233.0, 227.0, 282.0, 282.0, 266.0, 246.0, 180.0, 195.0, 149.0, 150.0, 90.0, 77.0, 73.0, 72.0, 47.0, 53.0, 38.0, 26.0, 27.0, 21.0, 13.0, 13.0, 10.0, 11.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0221099853515625, -0.02139878273010254, -0.020687580108642578, -0.019976377487182617, -0.019265174865722656, -0.018553972244262695, -0.017842769622802734, -0.017131567001342773, -0.016420364379882812, -0.01570916175842285, -0.01499795913696289, -0.01428675651550293, -0.013575553894042969, -0.012864351272583008, -0.012153148651123047, -0.011441946029663086, -0.010730743408203125, -0.010019540786743164, -0.009308338165283203, -0.008597135543823242, -0.007885932922363281, -0.00717473030090332, -0.006463527679443359, -0.0057523250579833984, -0.0050411224365234375, -0.0043299198150634766, -0.0036187171936035156, -0.0029075145721435547, -0.0021963119506835938, -0.0014851093292236328, -0.0007739067077636719, -6.270408630371094e-05, 0.00064849853515625, 0.001359701156616211, 0.002070903778076172, 0.002782106399536133, 0.0034933090209960938, 0.004204511642456055, 0.004915714263916016, 0.0056269168853759766, 0.0063381195068359375, 0.0070493221282958984, 0.007760524749755859, 0.00847172737121582, 0.009182929992675781, 0.009894132614135742, 0.010605335235595703, 0.011316537857055664, 0.012027740478515625, 0.012738943099975586, 0.013450145721435547, 0.014161348342895508, 0.014872550964355469, 0.01558375358581543, 0.01629495620727539, 0.01700615882873535, 0.017717361450195312, 0.018428564071655273, 0.019139766693115234, 0.019850969314575195, 0.020562171936035156, 0.021273374557495117, 0.021984577178955078, 0.02269577980041504, 0.023406982421875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 5.0, 14.0, 36.0, 33.0, 34.0, 43.0, 67.0, 83.0, 113.0, 111.0, 104.0, 57.0, 65.0, 40.0, 39.0, 18.0, 24.0, 19.0, 21.0, 12.0, 11.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0841507539153099, -0.08156321197748184, -0.07897566258907318, -0.07638812065124512, -0.07380057126283646, -0.07121302932500839, -0.06862547993659973, -0.06603793799877167, -0.063450388610363, -0.060862842947244644, -0.05827529728412628, -0.05568775162100792, -0.05310020595788956, -0.050512660294771194, -0.04792511463165283, -0.04533757269382477, -0.042750027030706406, -0.04016248136758804, -0.03757493570446968, -0.03498739004135132, -0.032399844378232956, -0.029812298715114594, -0.02722475491464138, -0.024637209251523018, -0.022049663588404655, -0.019462117925286293, -0.01687457226216793, -0.014287027530372143, -0.01169948186725378, -0.009111936204135418, -0.00652439147233963, -0.003936845809221268, -0.0013493001461029053, 0.0012382452841848135, 0.0038257907144725323, 0.006413335911929607, 0.00900088157504797, 0.011588427238166332, 0.01417597196996212, 0.016763517633080482, 0.019351063296198845, 0.021938608959317207, 0.02452615462243557, 0.027113698422908783, 0.029701244086027145, 0.03228878974914551, 0.03487633541226387, 0.03746388107538223, 0.040051426738500595, 0.04263897240161896, 0.04522651806473732, 0.04781406372785568, 0.050401609390974045, 0.05298915505409241, 0.05557669699192047, 0.05816424638032913, 0.060751788318157196, 0.06333933025598526, 0.06592687964439392, 0.06851442158222198, 0.07110197097063065, 0.07368951290845871, 0.07627706229686737, 0.07886460423469543, 0.0814521536231041]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 7.0, 11.0, 12.0, 16.0, 15.0, 19.0, 16.0, 20.0, 22.0, 21.0, 35.0, 27.0, 41.0, 34.0, 34.0, 31.0, 34.0, 36.0, 48.0, 37.0, 38.0, 31.0, 27.0, 39.0, 36.0, 30.0, 29.0, 27.0, 29.0, 29.0, 23.0, 18.0, 10.0, 21.0, 17.0, 12.0, 5.0, 13.0, 10.0, 2.0, 9.0, 7.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.04850662872195244, -0.04713018238544464, -0.045753732323646545, -0.04437728598713875, -0.04300083592534065, -0.041624389588832855, -0.04024793952703476, -0.03887149319052696, -0.037495046854019165, -0.03611860051751137, -0.03474215045571327, -0.033365704119205475, -0.03198925405740738, -0.030612807720899582, -0.029236359521746635, -0.02785991132259369, -0.026483461260795593, -0.025107013061642647, -0.0237305648624897, -0.022354118525981903, -0.020977668464183807, -0.01960122212767601, -0.018224773928523064, -0.016848325729370117, -0.01547187753021717, -0.014095429331064224, -0.012718981131911278, -0.011342533864080906, -0.00996608566492796, -0.008589637465775013, -0.007213190197944641, -0.005836741998791695, -0.004460293799638748, -0.0030838458333164454, -0.0017073978669941425, -0.00033095013350248337, 0.001045498065650463, 0.0024219462648034096, 0.0037983935326337814, 0.005174841731786728, 0.006551289930939674, 0.00792773813009262, 0.009304186329245567, 0.01068063359707594, 0.012057081796228886, 0.013433529995381832, 0.014809977263212204, 0.01618642546236515, 0.017562873661518097, 0.018939321860671043, 0.02031577005982399, 0.021692216396331787, 0.023068666458129883, 0.02444511279463768, 0.025821560993790627, 0.027198009192943573, 0.02857445739209652, 0.029950905591249466, 0.03132735192775726, 0.03270380198955536, 0.034080248326063156, 0.03545669838786125, 0.03683314472436905, 0.038209594786167145, 0.03958604112267494]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 9.0, 14.0, 22.0, 29.0, 43.0, 58.0, 85.0, 134.0, 188.0, 276.0, 412.0, 657.0, 985.0, 1491.0, 2245.0, 3632.0, 5556.0, 9031.0, 14299.0, 23449.0, 40254.0, 73565.0, 156883.0, 351654.0, 175235.0, 79085.0, 43113.0, 24875.0, 14931.0, 9658.0, 5867.0, 3793.0, 2429.0, 1529.0, 1030.0, 661.0, 463.0, 275.0, 207.0, 136.0, 91.0, 69.0, 53.0, 30.0, 12.0, 9.0, 12.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.04278564453125, -0.04147148132324219, -0.040157318115234375, -0.03884315490722656, -0.03752899169921875, -0.03621482849121094, -0.034900665283203125, -0.03358650207519531, -0.0322723388671875, -0.030958175659179688, -0.029644012451171875, -0.028329849243164062, -0.02701568603515625, -0.025701522827148438, -0.024387359619140625, -0.023073196411132812, -0.021759033203125, -0.020444869995117188, -0.019130706787109375, -0.017816543579101562, -0.01650238037109375, -0.015188217163085938, -0.013874053955078125, -0.012559890747070312, -0.0112457275390625, -0.009931564331054688, -0.008617401123046875, -0.0073032379150390625, -0.00598907470703125, -0.0046749114990234375, -0.003360748291015625, -0.0020465850830078125, -0.000732421875, 0.0005817413330078125, 0.001895904541015625, 0.0032100677490234375, 0.00452423095703125, 0.0058383941650390625, 0.007152557373046875, 0.008466720581054688, 0.0097808837890625, 0.011095046997070312, 0.012409210205078125, 0.013723373413085938, 0.01503753662109375, 0.016351699829101562, 0.017665863037109375, 0.018980026245117188, 0.020294189453125, 0.021608352661132812, 0.022922515869140625, 0.024236679077148438, 0.02555084228515625, 0.026865005493164062, 0.028179168701171875, 0.029493331909179688, 0.0308074951171875, 0.03212165832519531, 0.033435821533203125, 0.03474998474121094, 0.03606414794921875, 0.03737831115722656, 0.038692474365234375, 0.04000663757324219, 0.04132080078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 7.0, 7.0, 9.0, 14.0, 14.0, 22.0, 19.0, 21.0, 20.0, 31.0, 31.0, 32.0, 40.0, 36.0, 38.0, 34.0, 38.0, 37.0, 31.0, 40.0, 45.0, 41.0, 42.0, 39.0, 24.0, 29.0, 30.0, 30.0, 28.0, 29.0, 23.0, 19.0, 19.0, 11.0, 10.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.053314208984375, -0.05182504653930664, -0.05033588409423828, -0.04884672164916992, -0.04735755920410156, -0.0458683967590332, -0.044379234313964844, -0.042890071868896484, -0.041400909423828125, -0.039911746978759766, -0.038422584533691406, -0.03693342208862305, -0.03544425964355469, -0.03395509719848633, -0.03246593475341797, -0.03097677230834961, -0.02948760986328125, -0.02799844741821289, -0.02650928497314453, -0.025020122528076172, -0.023530960083007812, -0.022041797637939453, -0.020552635192871094, -0.019063472747802734, -0.017574310302734375, -0.016085147857666016, -0.014595985412597656, -0.013106822967529297, -0.011617660522460938, -0.010128498077392578, -0.008639335632324219, -0.007150173187255859, -0.0056610107421875, -0.004171848297119141, -0.0026826858520507812, -0.0011935234069824219, 0.0002956390380859375, 0.0017848014831542969, 0.0032739639282226562, 0.004763126373291016, 0.006252288818359375, 0.007741451263427734, 0.009230613708496094, 0.010719776153564453, 0.012208938598632812, 0.013698101043701172, 0.015187263488769531, 0.01667642593383789, 0.01816558837890625, 0.01965475082397461, 0.02114391326904297, 0.022633075714111328, 0.024122238159179688, 0.025611400604248047, 0.027100563049316406, 0.028589725494384766, 0.030078887939453125, 0.031568050384521484, 0.033057212829589844, 0.0345463752746582, 0.03603553771972656, 0.03752470016479492, 0.03901386260986328, 0.04050302505493164, 0.0419921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 13.0, 11.0, 20.0, 21.0, 24.0, 17.0, 45.0, 70.0, 105.0, 126.0, 152.0, 232.0, 336.0, 402.0, 604.0, 833.0, 1150.0, 1739.0, 2305.0, 3428.0, 5080.0, 7995.0, 14046.0, 27066.0, 69928.0, 597846.0, 217818.0, 44570.0, 20325.0, 11036.0, 6727.0, 4233.0, 2981.0, 2148.0, 1413.0, 1081.0, 762.0, 496.0, 366.0, 286.0, 222.0, 141.0, 98.0, 76.0, 49.0, 35.0, 35.0, 22.0, 16.0, 8.0, 5.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0], "bins": [-0.06890869140625, -0.06680774688720703, -0.06470680236816406, -0.0626058578491211, -0.060504913330078125, -0.058403968811035156, -0.05630302429199219, -0.05420207977294922, -0.05210113525390625, -0.05000019073486328, -0.04789924621582031, -0.045798301696777344, -0.043697357177734375, -0.041596412658691406, -0.03949546813964844, -0.03739452362060547, -0.0352935791015625, -0.03319263458251953, -0.031091690063476562, -0.028990745544433594, -0.026889801025390625, -0.024788856506347656, -0.022687911987304688, -0.02058696746826172, -0.01848602294921875, -0.01638507843017578, -0.014284133911132812, -0.012183189392089844, -0.010082244873046875, -0.007981300354003906, -0.0058803558349609375, -0.0037794113159179688, -0.001678466796875, 0.00042247772216796875, 0.0025234222412109375, 0.004624366760253906, 0.006725311279296875, 0.008826255798339844, 0.010927200317382812, 0.013028144836425781, 0.01512908935546875, 0.01723003387451172, 0.019330978393554688, 0.021431922912597656, 0.023532867431640625, 0.025633811950683594, 0.027734756469726562, 0.02983570098876953, 0.0319366455078125, 0.03403759002685547, 0.03613853454589844, 0.038239479064941406, 0.040340423583984375, 0.042441368103027344, 0.04454231262207031, 0.04664325714111328, 0.04874420166015625, 0.05084514617919922, 0.05294609069824219, 0.055047035217285156, 0.057147979736328125, 0.059248924255371094, 0.06134986877441406, 0.06345081329345703, 0.0655517578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 4.0, 5.0, 10.0, 12.0, 10.0, 10.0, 13.0, 19.0, 19.0, 17.0, 25.0, 24.0, 20.0, 26.0, 37.0, 35.0, 30.0, 46.0, 51.0, 27.0, 50.0, 33.0, 42.0, 49.0, 34.0, 31.0, 37.0, 37.0, 26.0, 26.0, 33.0, 22.0, 21.0, 18.0, 19.0, 18.0, 9.0, 13.0, 5.0, 9.0, 5.0, 3.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03216552734375, -0.031189441680908203, -0.030213356018066406, -0.02923727035522461, -0.028261184692382812, -0.027285099029541016, -0.02630901336669922, -0.025332927703857422, -0.024356842041015625, -0.023380756378173828, -0.02240467071533203, -0.021428585052490234, -0.020452499389648438, -0.01947641372680664, -0.018500328063964844, -0.017524242401123047, -0.01654815673828125, -0.015572071075439453, -0.014595985412597656, -0.01361989974975586, -0.012643814086914062, -0.011667728424072266, -0.010691642761230469, -0.009715557098388672, -0.008739471435546875, -0.007763385772705078, -0.006787300109863281, -0.005811214447021484, -0.0048351287841796875, -0.0038590431213378906, -0.0028829574584960938, -0.0019068717956542969, -0.0009307861328125, 4.5299530029296875e-05, 0.0010213851928710938, 0.0019974708557128906, 0.0029735565185546875, 0.003949642181396484, 0.004925727844238281, 0.005901813507080078, 0.006877899169921875, 0.007853984832763672, 0.008830070495605469, 0.009806156158447266, 0.010782241821289062, 0.01175832748413086, 0.012734413146972656, 0.013710498809814453, 0.01468658447265625, 0.015662670135498047, 0.016638755798339844, 0.01761484146118164, 0.018590927124023438, 0.019567012786865234, 0.02054309844970703, 0.021519184112548828, 0.022495269775390625, 0.023471355438232422, 0.02444744110107422, 0.025423526763916016, 0.026399612426757812, 0.02737569808959961, 0.028351783752441406, 0.029327869415283203, 0.030303955078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 10.0, 12.0, 9.0, 21.0, 25.0, 35.0, 52.0, 75.0, 94.0, 138.0, 200.0, 253.0, 470.0, 653.0, 1091.0, 1844.0, 3213.0, 6180.0, 14754.0, 52389.0, 789888.0, 133710.0, 24005.0, 9061.0, 4310.0, 2276.0, 1339.0, 847.0, 509.0, 334.0, 218.0, 165.0, 101.0, 76.0, 53.0, 40.0, 18.0, 22.0, 17.0, 7.0, 11.0, 10.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01611328125, -0.015588760375976562, -0.015064239501953125, -0.014539718627929688, -0.01401519775390625, -0.013490676879882812, -0.012966156005859375, -0.012441635131835938, -0.0119171142578125, -0.011392593383789062, -0.010868072509765625, -0.010343551635742188, -0.00981903076171875, -0.009294509887695312, -0.008769989013671875, -0.008245468139648438, -0.007720947265625, -0.0071964263916015625, -0.006671905517578125, -0.0061473846435546875, -0.00562286376953125, -0.0050983428955078125, -0.004573822021484375, -0.0040493011474609375, -0.0035247802734375, -0.0030002593994140625, -0.002475738525390625, -0.0019512176513671875, -0.00142669677734375, -0.0009021759033203125, -0.000377655029296875, 0.0001468658447265625, 0.00067138671875, 0.0011959075927734375, 0.001720428466796875, 0.0022449493408203125, 0.00276947021484375, 0.0032939910888671875, 0.003818511962890625, 0.0043430328369140625, 0.0048675537109375, 0.0053920745849609375, 0.005916595458984375, 0.0064411163330078125, 0.00696563720703125, 0.0074901580810546875, 0.008014678955078125, 0.008539199829101562, 0.009063720703125, 0.009588241577148438, 0.010112762451171875, 0.010637283325195312, 0.01116180419921875, 0.011686325073242188, 0.012210845947265625, 0.012735366821289062, 0.0132598876953125, 0.013784408569335938, 0.014308929443359375, 0.014833450317382812, 0.01535797119140625, 0.015882492065429688, 0.016407012939453125, 0.016931533813476562, 0.0174560546875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 1.0, 7.0, 6.0, 5.0, 7.0, 10.0, 19.0, 24.0, 28.0, 25.0, 28.0, 49.0, 49.0, 51.0, 62.0, 67.0, 69.0, 84.0, 0.0, 79.0, 57.0, 55.0, 43.0, 40.0, 30.0, 19.0, 17.0, 19.0, 8.0, 8.0, 7.0, 6.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6707926988601685e-06, -1.6130506992340088e-06, -1.5553086996078491e-06, -1.4975666999816895e-06, -1.4398247003555298e-06, -1.3820827007293701e-06, -1.3243407011032104e-06, -1.2665987014770508e-06, -1.2088567018508911e-06, -1.1511147022247314e-06, -1.0933727025985718e-06, -1.0356307029724121e-06, -9.778887033462524e-07, -9.201467037200928e-07, -8.624047040939331e-07, -8.046627044677734e-07, -7.469207048416138e-07, -6.891787052154541e-07, -6.314367055892944e-07, -5.736947059631348e-07, -5.159527063369751e-07, -4.5821070671081543e-07, -4.0046870708465576e-07, -3.427267074584961e-07, -2.849847078323364e-07, -2.2724270820617676e-07, -1.695007085800171e-07, -1.1175870895385742e-07, -5.4016709327697754e-08, 3.725290298461914e-09, 6.146728992462158e-08, 1.1920928955078125e-07, 1.7695128917694092e-07, 2.3469328880310059e-07, 2.9243528842926025e-07, 3.501772880554199e-07, 4.079192876815796e-07, 4.6566128730773926e-07, 5.234032869338989e-07, 5.811452865600586e-07, 6.388872861862183e-07, 6.966292858123779e-07, 7.543712854385376e-07, 8.121132850646973e-07, 8.698552846908569e-07, 9.275972843170166e-07, 9.853392839431763e-07, 1.043081283569336e-06, 1.1008232831954956e-06, 1.1585652828216553e-06, 1.216307282447815e-06, 1.2740492820739746e-06, 1.3317912817001343e-06, 1.389533281326294e-06, 1.4472752809524536e-06, 1.5050172805786133e-06, 1.562759280204773e-06, 1.6205012798309326e-06, 1.6782432794570923e-06, 1.735985279083252e-06, 1.7937272787094116e-06, 1.8514692783355713e-06, 1.909211277961731e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 18.0, 19.0, 32.0, 49.0, 52.0, 86.0, 122.0, 186.0, 258.0, 343.0, 521.0, 698.0, 1136.0, 1690.0, 2466.0, 4161.0, 7411.0, 14531.0, 33325.0, 110807.0, 641404.0, 151240.0, 40109.0, 16696.0, 8222.0, 4570.0, 2742.0, 1779.0, 1194.0, 784.0, 572.0, 380.0, 289.0, 194.0, 136.0, 101.0, 61.0, 44.0, 32.0, 26.0, 22.0, 14.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0135955810546875, -0.01316523551940918, -0.01273488998413086, -0.012304544448852539, -0.011874198913574219, -0.011443853378295898, -0.011013507843017578, -0.010583162307739258, -0.010152816772460938, -0.009722471237182617, -0.009292125701904297, -0.008861780166625977, -0.008431434631347656, -0.008001089096069336, -0.007570743560791016, -0.007140398025512695, -0.006710052490234375, -0.006279706954956055, -0.005849361419677734, -0.005419015884399414, -0.004988670349121094, -0.0045583248138427734, -0.004127979278564453, -0.003697633743286133, -0.0032672882080078125, -0.002836942672729492, -0.002406597137451172, -0.0019762516021728516, -0.0015459060668945312, -0.001115560531616211, -0.0006852149963378906, -0.0002548694610595703, 0.00017547607421875, 0.0006058216094970703, 0.0010361671447753906, 0.001466512680053711, 0.0018968582153320312, 0.0023272037506103516, 0.002757549285888672, 0.003187894821166992, 0.0036182403564453125, 0.004048585891723633, 0.004478931427001953, 0.0049092769622802734, 0.005339622497558594, 0.005769968032836914, 0.006200313568115234, 0.006630659103393555, 0.007061004638671875, 0.007491350173950195, 0.007921695709228516, 0.008352041244506836, 0.008782386779785156, 0.009212732315063477, 0.009643077850341797, 0.010073423385620117, 0.010503768920898438, 0.010934114456176758, 0.011364459991455078, 0.011794805526733398, 0.012225151062011719, 0.012655496597290039, 0.01308584213256836, 0.01351618766784668, 0.013946533203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 9.0, 9.0, 20.0, 35.0, 37.0, 76.0, 164.0, 282.0, 136.0, 81.0, 47.0, 28.0, 15.0, 22.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006641387939453125, -0.006463825702667236, -0.006286263465881348, -0.006108701229095459, -0.00593113899230957, -0.005753576755523682, -0.005576014518737793, -0.005398452281951904, -0.005220890045166016, -0.005043327808380127, -0.004865765571594238, -0.00468820333480835, -0.004510641098022461, -0.004333078861236572, -0.004155516624450684, -0.003977954387664795, -0.0038003921508789062, -0.0036228299140930176, -0.003445267677307129, -0.0032677054405212402, -0.0030901432037353516, -0.002912580966949463, -0.0027350187301635742, -0.0025574564933776855, -0.002379894256591797, -0.002202332019805908, -0.0020247697830200195, -0.0018472075462341309, -0.0016696453094482422, -0.0014920830726623535, -0.0013145208358764648, -0.0011369585990905762, -0.0009593963623046875, -0.0007818341255187988, -0.0006042718887329102, -0.0004267096519470215, -0.0002491474151611328, -7.158517837524414e-05, 0.00010597705841064453, 0.0002835392951965332, 0.0004611015319824219, 0.0006386637687683105, 0.0008162260055541992, 0.0009937882423400879, 0.0011713504791259766, 0.0013489127159118652, 0.001526474952697754, 0.0017040371894836426, 0.0018815994262695312, 0.00205916166305542, 0.0022367238998413086, 0.0024142861366271973, 0.002591848373413086, 0.0027694106101989746, 0.0029469728469848633, 0.003124535083770752, 0.0033020973205566406, 0.0034796595573425293, 0.003657221794128418, 0.0038347840309143066, 0.004012346267700195, 0.004189908504486084, 0.004367470741271973, 0.004545032978057861, 0.00472259521484375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 4.0, 8.0, 8.0, 7.0, 11.0, 15.0, 21.0, 42.0, 33.0, 45.0, 64.0, 76.0, 116.0, 109.0, 110.0, 63.0, 58.0, 42.0, 41.0, 23.0, 23.0, 18.0, 17.0, 13.0, 7.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08309037238359451, -0.08054132014513016, -0.0779922679066658, -0.07544320821762085, -0.0728941559791565, -0.07034510374069214, -0.06779605150222778, -0.06524699926376343, -0.06269793957471848, -0.06014888733625412, -0.057599831372499466, -0.05505077913403511, -0.05250172317028046, -0.0499526709318161, -0.047403618693351746, -0.04485456272959709, -0.042305510491132736, -0.03975645825266838, -0.03720740228891373, -0.03465835005044937, -0.03210929408669472, -0.029560241848230362, -0.027011187747120857, -0.024462133646011353, -0.021913079544901848, -0.019364025443792343, -0.01681497134268284, -0.014265918172895908, -0.011716864071786404, -0.009167809970676899, -0.006618756800889969, -0.004069702699780464, -0.0015206485986709595, 0.0010284052696079016, 0.0035774591378867626, 0.00612651277333498, 0.008675566874444485, 0.01122462097555399, 0.01377367414534092, 0.016322728246450424, 0.01887178234755993, 0.021420836448669434, 0.02396989054977894, 0.026518944650888443, 0.0290679968893528, 0.03161705285310745, 0.03416610509157181, 0.03671515733003616, 0.03926421329379082, 0.04181326553225517, 0.04436232149600983, 0.04691137373447418, 0.049460429698228836, 0.05200948193669319, 0.054558537900447845, 0.0571075901389122, 0.059656642377376556, 0.06220569461584091, 0.06475474685430527, 0.06730380654335022, 0.06985285878181458, 0.07240191102027893, 0.07495096325874329, 0.07750001549720764, 0.0800490751862526]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 14.0, 13.0, 15.0, 19.0, 18.0, 23.0, 21.0, 18.0, 37.0, 26.0, 35.0, 37.0, 36.0, 24.0, 42.0, 30.0, 49.0, 36.0, 40.0, 34.0, 33.0, 36.0, 35.0, 31.0, 20.0, 32.0, 32.0, 25.0, 24.0, 21.0, 12.0, 18.0, 16.0, 14.0, 6.0, 12.0, 6.0, 8.0, 8.0, 7.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0], "bins": [-0.04802699387073517, -0.046669792383909225, -0.04531259462237358, -0.04395539313554764, -0.04259819537401199, -0.04124099388718605, -0.03988379240036011, -0.03852659463882446, -0.03716939687728882, -0.035812195390462875, -0.03445499762892723, -0.03309779614210129, -0.03174059838056564, -0.0303833968937397, -0.029026197269558907, -0.027668997645378113, -0.02631179615855217, -0.024954596534371376, -0.023597396910190582, -0.02224019542336464, -0.020882997661828995, -0.019525796175003052, -0.018168596550822258, -0.016811396926641464, -0.01545419730246067, -0.014096997678279877, -0.012739798054099083, -0.011382597498595715, -0.01002539787441492, -0.008668198250234127, -0.007310997694730759, -0.005953798070549965, -0.004596598446369171, -0.0032393985893577337, -0.0018821987323462963, -0.0005249986425042152, 0.0008322009816765785, 0.0021894006058573723, 0.0035466011613607407, 0.004903800785541534, 0.006261000409722328, 0.007618200033903122, 0.008975399658083916, 0.010332600213587284, 0.011689799837768078, 0.013046999461948872, 0.01440420001745224, 0.015761399641633034, 0.017118599265813828, 0.01847579888999462, 0.019832998514175415, 0.021190200001001358, 0.022547397762537003, 0.023904599249362946, 0.02526179887354374, 0.026618998497724533, 0.027976198121905327, 0.02933339774608612, 0.030690597370266914, 0.03204779699444771, 0.03340499848127365, 0.034762196242809296, 0.03611939772963524, 0.03747659921646118, 0.038833796977996826]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 6.0, 8.0, 8.0, 16.0, 20.0, 34.0, 53.0, 72.0, 98.0, 162.0, 237.0, 329.0, 494.0, 672.0, 1012.0, 1511.0, 2255.0, 3443.0, 5034.0, 7904.0, 11917.0, 18486.0, 29381.0, 47827.0, 80739.0, 141791.0, 252644.0, 183487.0, 100467.0, 58899.0, 35640.0, 22076.0, 14319.0, 9238.0, 6003.0, 4104.0, 2609.0, 1795.0, 1194.0, 809.0, 570.0, 364.0, 251.0, 174.0, 136.0, 79.0, 57.0, 48.0, 19.0, 23.0, 16.0, 9.0, 10.0, 5.0, 5.0, 2.0, 1.0], "bins": [-0.0906982421875, -0.08800697326660156, -0.08531570434570312, -0.08262443542480469, -0.07993316650390625, -0.07724189758300781, -0.07455062866210938, -0.07185935974121094, -0.0691680908203125, -0.06647682189941406, -0.06378555297851562, -0.06109428405761719, -0.05840301513671875, -0.05571174621582031, -0.053020477294921875, -0.05032920837402344, -0.047637939453125, -0.04494667053222656, -0.042255401611328125, -0.03956413269042969, -0.03687286376953125, -0.03418159484863281, -0.031490325927734375, -0.028799057006835938, -0.0261077880859375, -0.023416519165039062, -0.020725250244140625, -0.018033981323242188, -0.01534271240234375, -0.012651443481445312, -0.009960174560546875, -0.0072689056396484375, -0.00457763671875, -0.0018863677978515625, 0.000804901123046875, 0.0034961700439453125, 0.00618743896484375, 0.008878707885742188, 0.011569976806640625, 0.014261245727539062, 0.0169525146484375, 0.019643783569335938, 0.022335052490234375, 0.025026321411132812, 0.02771759033203125, 0.030408859252929688, 0.033100128173828125, 0.03579139709472656, 0.038482666015625, 0.04117393493652344, 0.043865203857421875, 0.04655647277832031, 0.04924774169921875, 0.05193901062011719, 0.054630279541015625, 0.05732154846191406, 0.0600128173828125, 0.06270408630371094, 0.06539535522460938, 0.06808662414550781, 0.07077789306640625, 0.07346916198730469, 0.07616043090820312, 0.07885169982910156, 0.08154296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 5.0, 7.0, 10.0, 20.0, 19.0, 24.0, 9.0, 21.0, 20.0, 21.0, 21.0, 43.0, 35.0, 33.0, 34.0, 33.0, 29.0, 44.0, 39.0, 44.0, 45.0, 35.0, 28.0, 39.0, 35.0, 31.0, 30.0, 33.0, 24.0, 28.0, 20.0, 21.0, 19.0, 18.0, 11.0, 7.0, 10.0, 12.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.04443359375, -0.04314279556274414, -0.04185199737548828, -0.04056119918823242, -0.03927040100097656, -0.0379796028137207, -0.036688804626464844, -0.035398006439208984, -0.034107208251953125, -0.032816410064697266, -0.031525611877441406, -0.030234813690185547, -0.028944015502929688, -0.027653217315673828, -0.02636241912841797, -0.02507162094116211, -0.02378082275390625, -0.02249002456665039, -0.02119922637939453, -0.019908428192138672, -0.018617630004882812, -0.017326831817626953, -0.016036033630371094, -0.014745235443115234, -0.013454437255859375, -0.012163639068603516, -0.010872840881347656, -0.009582042694091797, -0.008291244506835938, -0.007000446319580078, -0.005709648132324219, -0.004418849945068359, -0.0031280517578125, -0.0018372535705566406, -0.0005464553833007812, 0.0007443428039550781, 0.0020351409912109375, 0.003325939178466797, 0.004616737365722656, 0.005907535552978516, 0.007198333740234375, 0.008489131927490234, 0.009779930114746094, 0.011070728302001953, 0.012361526489257812, 0.013652324676513672, 0.014943122863769531, 0.01623392105102539, 0.01752471923828125, 0.01881551742553711, 0.02010631561279297, 0.021397113800048828, 0.022687911987304688, 0.023978710174560547, 0.025269508361816406, 0.026560306549072266, 0.027851104736328125, 0.029141902923583984, 0.030432701110839844, 0.0317234992980957, 0.03301429748535156, 0.03430509567260742, 0.03559589385986328, 0.03688669204711914, 0.038177490234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 11.0, 12.0, 11.0, 27.0, 41.0, 36.0, 71.0, 105.0, 139.0, 187.0, 310.0, 425.0, 641.0, 914.0, 1330.0, 1831.0, 2657.0, 3791.0, 5697.0, 8171.0, 12325.0, 18231.0, 28113.0, 43466.0, 70862.0, 122972.0, 232401.0, 203333.0, 108196.0, 63848.0, 39835.0, 26020.0, 16931.0, 11310.0, 7529.0, 5167.0, 3628.0, 2421.0, 1711.0, 1194.0, 819.0, 552.0, 383.0, 274.0, 210.0, 126.0, 102.0, 63.0, 45.0, 28.0, 20.0, 17.0, 9.0, 6.0, 2.0, 9.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07684326171875, -0.0743560791015625, -0.071868896484375, -0.0693817138671875, -0.06689453125, -0.0644073486328125, -0.061920166015625, -0.0594329833984375, -0.05694580078125, -0.0544586181640625, -0.051971435546875, -0.0494842529296875, -0.0469970703125, -0.0445098876953125, -0.042022705078125, -0.0395355224609375, -0.03704833984375, -0.0345611572265625, -0.032073974609375, -0.0295867919921875, -0.027099609375, -0.0246124267578125, -0.022125244140625, -0.0196380615234375, -0.01715087890625, -0.0146636962890625, -0.012176513671875, -0.0096893310546875, -0.0072021484375, -0.0047149658203125, -0.002227783203125, 0.0002593994140625, 0.00274658203125, 0.0052337646484375, 0.007720947265625, 0.0102081298828125, 0.0126953125, 0.0151824951171875, 0.017669677734375, 0.0201568603515625, 0.02264404296875, 0.0251312255859375, 0.027618408203125, 0.0301055908203125, 0.0325927734375, 0.0350799560546875, 0.037567138671875, 0.0400543212890625, 0.04254150390625, 0.0450286865234375, 0.047515869140625, 0.0500030517578125, 0.052490234375, 0.0549774169921875, 0.057464599609375, 0.0599517822265625, 0.06243896484375, 0.0649261474609375, 0.067413330078125, 0.0699005126953125, 0.0723876953125, 0.0748748779296875, 0.077362060546875, 0.0798492431640625, 0.08233642578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 8.0, 9.0, 13.0, 11.0, 7.0, 20.0, 15.0, 16.0, 21.0, 26.0, 24.0, 22.0, 24.0, 31.0, 26.0, 22.0, 28.0, 41.0, 20.0, 37.0, 45.0, 42.0, 32.0, 39.0, 39.0, 32.0, 37.0, 38.0, 28.0, 27.0, 28.0, 17.0, 28.0, 28.0, 21.0, 19.0, 18.0, 13.0, 11.0, 8.0, 6.0, 4.0, 2.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0250396728515625, -0.024225711822509766, -0.02341175079345703, -0.022597789764404297, -0.021783828735351562, -0.020969867706298828, -0.020155906677246094, -0.01934194564819336, -0.018527984619140625, -0.01771402359008789, -0.016900062561035156, -0.016086101531982422, -0.015272140502929688, -0.014458179473876953, -0.013644218444824219, -0.012830257415771484, -0.01201629638671875, -0.011202335357666016, -0.010388374328613281, -0.009574413299560547, -0.008760452270507812, -0.007946491241455078, -0.007132530212402344, -0.006318569183349609, -0.005504608154296875, -0.004690647125244141, -0.0038766860961914062, -0.003062725067138672, -0.0022487640380859375, -0.0014348030090332031, -0.0006208419799804688, 0.00019311904907226562, 0.001007080078125, 0.0018210411071777344, 0.0026350021362304688, 0.003448963165283203, 0.0042629241943359375, 0.005076885223388672, 0.005890846252441406, 0.006704807281494141, 0.007518768310546875, 0.00833272933959961, 0.009146690368652344, 0.009960651397705078, 0.010774612426757812, 0.011588573455810547, 0.012402534484863281, 0.013216495513916016, 0.01403045654296875, 0.014844417572021484, 0.01565837860107422, 0.016472339630126953, 0.017286300659179688, 0.018100261688232422, 0.018914222717285156, 0.01972818374633789, 0.020542144775390625, 0.02135610580444336, 0.022170066833496094, 0.022984027862548828, 0.023797988891601562, 0.024611949920654297, 0.02542591094970703, 0.026239871978759766, 0.0270538330078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 17.0, 11.0, 22.0, 15.0, 31.0, 34.0, 41.0, 67.0, 99.0, 145.0, 197.0, 277.0, 440.0, 697.0, 1159.0, 2087.0, 3937.0, 7622.0, 16049.0, 43339.0, 266025.0, 622205.0, 48128.0, 18089.0, 8038.0, 4090.0, 2185.0, 1269.0, 751.0, 507.0, 284.0, 199.0, 134.0, 95.0, 76.0, 43.0, 48.0, 27.0, 19.0, 10.0, 16.0, 7.0, 7.0, 3.0, 3.0, 0.0, 4.0, 0.0, 5.0, 1.0, 2.0], "bins": [-0.0277252197265625, -0.026911020278930664, -0.026096820831298828, -0.025282621383666992, -0.024468421936035156, -0.02365422248840332, -0.022840023040771484, -0.02202582359313965, -0.021211624145507812, -0.020397424697875977, -0.01958322525024414, -0.018769025802612305, -0.01795482635498047, -0.017140626907348633, -0.016326427459716797, -0.015512228012084961, -0.014698028564453125, -0.013883829116821289, -0.013069629669189453, -0.012255430221557617, -0.011441230773925781, -0.010627031326293945, -0.00981283187866211, -0.008998632431030273, -0.008184432983398438, -0.0073702335357666016, -0.006556034088134766, -0.00574183464050293, -0.004927635192871094, -0.004113435745239258, -0.003299236297607422, -0.002485036849975586, -0.00167083740234375, -0.0008566379547119141, -4.2438507080078125e-05, 0.0007717609405517578, 0.0015859603881835938, 0.0024001598358154297, 0.0032143592834472656, 0.0040285587310791016, 0.0048427581787109375, 0.0056569576263427734, 0.006471157073974609, 0.007285356521606445, 0.008099555969238281, 0.008913755416870117, 0.009727954864501953, 0.010542154312133789, 0.011356353759765625, 0.012170553207397461, 0.012984752655029297, 0.013798952102661133, 0.014613151550292969, 0.015427350997924805, 0.01624155044555664, 0.017055749893188477, 0.017869949340820312, 0.01868414878845215, 0.019498348236083984, 0.02031254768371582, 0.021126747131347656, 0.021940946578979492, 0.022755146026611328, 0.023569345474243164, 0.024383544921875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 10.0, 3.0, 0.0, 10.0, 14.0, 20.0, 0.0, 19.0, 29.0, 30.0, 0.0, 58.0, 66.0, 76.0, 0.0, 94.0, 111.0, 113.0, 0.0, 78.0, 59.0, 53.0, 0.0, 40.0, 32.0, 19.0, 0.0, 22.0, 7.0, 9.0, 0.0, 10.0, 6.0, 5.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.087784767150879e-06, -1.043081283569336e-06, -9.98377799987793e-07, -9.5367431640625e-07, -9.08970832824707e-07, -8.642673492431641e-07, -8.195638656616211e-07, -7.748603820800781e-07, -7.301568984985352e-07, -6.854534149169922e-07, -6.407499313354492e-07, -5.960464477539062e-07, -5.513429641723633e-07, -5.066394805908203e-07, -4.6193599700927734e-07, -4.172325134277344e-07, -3.725290298461914e-07, -3.2782554626464844e-07, -2.8312206268310547e-07, -2.384185791015625e-07, -1.9371509552001953e-07, -1.4901161193847656e-07, -1.043081283569336e-07, -5.960464477539063e-08, -1.4901161193847656e-08, 2.9802322387695312e-08, 7.450580596923828e-08, 1.1920928955078125e-07, 1.6391277313232422e-07, 2.086162567138672e-07, 2.5331974029541016e-07, 2.980232238769531e-07, 3.427267074584961e-07, 3.8743019104003906e-07, 4.3213367462158203e-07, 4.76837158203125e-07, 5.21540641784668e-07, 5.662441253662109e-07, 6.109476089477539e-07, 6.556510925292969e-07, 7.003545761108398e-07, 7.450580596923828e-07, 7.897615432739258e-07, 8.344650268554688e-07, 8.791685104370117e-07, 9.238719940185547e-07, 9.685754776000977e-07, 1.0132789611816406e-06, 1.0579824447631836e-06, 1.1026859283447266e-06, 1.1473894119262695e-06, 1.1920928955078125e-06, 1.2367963790893555e-06, 1.2814998626708984e-06, 1.3262033462524414e-06, 1.3709068298339844e-06, 1.4156103134155273e-06, 1.4603137969970703e-06, 1.5050172805786133e-06, 1.5497207641601562e-06, 1.5944242477416992e-06, 1.6391277313232422e-06, 1.6838312149047852e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 11.0, 13.0, 14.0, 21.0, 25.0, 46.0, 46.0, 61.0, 107.0, 111.0, 146.0, 225.0, 328.0, 433.0, 589.0, 889.0, 1166.0, 1822.0, 2753.0, 4578.0, 8386.0, 17792.0, 46568.0, 539066.0, 339213.0, 45435.0, 17444.0, 8101.0, 4426.0, 2728.0, 1698.0, 1206.0, 871.0, 590.0, 457.0, 286.0, 265.0, 165.0, 124.0, 102.0, 67.0, 42.0, 34.0, 33.0, 23.0, 14.0, 13.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261383056640625, -0.025294780731201172, -0.024451255798339844, -0.023607730865478516, -0.022764205932617188, -0.02192068099975586, -0.02107715606689453, -0.020233631134033203, -0.019390106201171875, -0.018546581268310547, -0.01770305633544922, -0.01685953140258789, -0.016016006469726562, -0.015172481536865234, -0.014328956604003906, -0.013485431671142578, -0.01264190673828125, -0.011798381805419922, -0.010954856872558594, -0.010111331939697266, -0.009267807006835938, -0.00842428207397461, -0.007580757141113281, -0.006737232208251953, -0.005893707275390625, -0.005050182342529297, -0.004206657409667969, -0.0033631324768066406, -0.0025196075439453125, -0.0016760826110839844, -0.0008325576782226562, 1.0967254638671875e-05, 0.0008544921875, 0.0016980171203613281, 0.0025415420532226562, 0.0033850669860839844, 0.0042285919189453125, 0.005072116851806641, 0.005915641784667969, 0.006759166717529297, 0.007602691650390625, 0.008446216583251953, 0.009289741516113281, 0.01013326644897461, 0.010976791381835938, 0.011820316314697266, 0.012663841247558594, 0.013507366180419922, 0.01435089111328125, 0.015194416046142578, 0.016037940979003906, 0.016881465911865234, 0.017724990844726562, 0.01856851577758789, 0.01941204071044922, 0.020255565643310547, 0.021099090576171875, 0.021942615509033203, 0.02278614044189453, 0.02362966537475586, 0.024473190307617188, 0.025316715240478516, 0.026160240173339844, 0.027003765106201172, 0.0278472900390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 8.0, 15.0, 17.0, 24.0, 34.0, 36.0, 58.0, 190.0, 373.0, 59.0, 47.0, 36.0, 26.0, 16.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00820159912109375, -0.007937908172607422, -0.007674217224121094, -0.007410526275634766, -0.0071468353271484375, -0.006883144378662109, -0.006619453430175781, -0.006355762481689453, -0.006092071533203125, -0.005828380584716797, -0.005564689636230469, -0.005300998687744141, -0.0050373077392578125, -0.004773616790771484, -0.004509925842285156, -0.004246234893798828, -0.0039825439453125, -0.003718852996826172, -0.0034551620483398438, -0.0031914710998535156, -0.0029277801513671875, -0.0026640892028808594, -0.0024003982543945312, -0.002136707305908203, -0.001873016357421875, -0.0016093254089355469, -0.0013456344604492188, -0.0010819435119628906, -0.0008182525634765625, -0.0005545616149902344, -0.00029087066650390625, -2.7179718017578125e-05, 0.00023651123046875, 0.0005002021789550781, 0.0007638931274414062, 0.0010275840759277344, 0.0012912750244140625, 0.0015549659729003906, 0.0018186569213867188, 0.002082347869873047, 0.002346038818359375, 0.002609729766845703, 0.0028734207153320312, 0.0031371116638183594, 0.0034008026123046875, 0.0036644935607910156, 0.003928184509277344, 0.004191875457763672, 0.00445556640625, 0.004719257354736328, 0.004982948303222656, 0.005246639251708984, 0.0055103302001953125, 0.005774021148681641, 0.006037712097167969, 0.006301403045654297, 0.006565093994140625, 0.006828784942626953, 0.007092475891113281, 0.007356166839599609, 0.0076198577880859375, 0.007883548736572266, 0.008147239685058594, 0.008410930633544922, 0.00867462158203125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 14.0, 12.0, 27.0, 33.0, 31.0, 37.0, 51.0, 57.0, 83.0, 112.0, 114.0, 95.0, 53.0, 53.0, 38.0, 28.0, 27.0, 25.0, 21.0, 14.0, 9.0, 10.0, 7.0, 8.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.07726425677537918, -0.07508154213428497, -0.07289882004261017, -0.07071610540151596, -0.06853339076042175, -0.06635066866874695, -0.06416795402765274, -0.061985235661268234, -0.05980251729488373, -0.05761979892849922, -0.055437084287405014, -0.05325436592102051, -0.051071647554636, -0.048888929188251495, -0.04670621454715729, -0.04452349618077278, -0.042340781539678574, -0.04015806317329407, -0.03797534853219986, -0.03579263016581535, -0.03360991179943085, -0.03142719715833664, -0.029244478791952133, -0.027061760425567627, -0.02487904392182827, -0.022696327418088913, -0.020513609051704407, -0.01833089254796505, -0.016148176044225693, -0.013965457677841187, -0.01178274117410183, -0.009600023739039898, -0.007417306303977966, -0.005234588868916035, -0.0030518718995153904, -0.0008691549301147461, 0.0013135625049471855, 0.003496279940009117, 0.005678996443748474, 0.007861713878810406, 0.010044431313872337, 0.012227148748934269, 0.0144098661839962, 0.016592582687735558, 0.018775299191474915, 0.02095801755785942, 0.023140734061598778, 0.025323450565338135, 0.02750616893172264, 0.029688885435461998, 0.031871601939201355, 0.03405432030558586, 0.03623703867197037, 0.038419753313064575, 0.04060247167944908, 0.04278519004583359, 0.044967904686927795, 0.0471506230533123, 0.04933333769440651, 0.051516056060791016, 0.05369877442717552, 0.05588149279356003, 0.058064207434654236, 0.06024692580103874, 0.06242964416742325]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 4.0, 11.0, 9.0, 9.0, 14.0, 15.0, 20.0, 31.0, 26.0, 33.0, 32.0, 33.0, 38.0, 42.0, 32.0, 42.0, 44.0, 45.0, 49.0, 35.0, 26.0, 52.0, 30.0, 35.0, 33.0, 26.0, 29.0, 34.0, 22.0, 18.0, 29.0, 14.0, 13.0, 4.0, 12.0, 13.0, 13.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0441107414662838, -0.0426083467900753, -0.041105952113866806, -0.03960356116294861, -0.03810116648674011, -0.036598771810531616, -0.03509637713432312, -0.033593982458114624, -0.03209158778190613, -0.030589193105697632, -0.029086800292134285, -0.02758440561592579, -0.026082012802362442, -0.024579618126153946, -0.02307722344994545, -0.021574828773736954, -0.020072437822818756, -0.01857004314661026, -0.017067650333046913, -0.015565255656838417, -0.014062861911952496, -0.012560468167066574, -0.011058073490858078, -0.009555679745972157, -0.008053286001086235, -0.006550892256200314, -0.005048498045653105, -0.003546103835105896, -0.0020437100902199745, -0.000541316345334053, 0.000961078330874443, 0.0024634720757603645, 0.003965865820646286, 0.0054682595655322075, 0.006970653776079416, 0.008473047986626625, 0.009975441731512547, 0.011477835476398468, 0.012980230152606964, 0.014482623897492886, 0.015985017642378807, 0.017487412318587303, 0.01898980513215065, 0.020492199808359146, 0.021994594484567642, 0.02349698729813099, 0.024999381974339485, 0.026501774787902832, 0.028004169464111328, 0.029506564140319824, 0.03100895695388317, 0.032511353492736816, 0.034013744443655014, 0.03551613911986351, 0.037018533796072006, 0.0385209284722805, 0.0400233194231987, 0.041525714099407196, 0.04302810877561569, 0.04453050345182419, 0.046032894402742386, 0.04753528907895088, 0.04903768375515938, 0.050540078431367874, 0.05204247310757637]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 17.0, 21.0, 29.0, 39.0, 74.0, 111.0, 201.0, 362.0, 549.0, 946.0, 1685.0, 2976.0, 5392.0, 9979.0, 19442.0, 38387.0, 82333.0, 195171.0, 702662.0, 2213048.0, 598569.0, 176360.0, 75013.0, 34715.0, 16984.0, 8659.0, 4613.0, 2452.0, 1388.0, 841.0, 459.0, 286.0, 175.0, 112.0, 75.0, 57.0, 30.0, 12.0, 15.0, 8.0, 9.0, 5.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07157421112060547, -0.06886863708496094, -0.0661630630493164, -0.06345748901367188, -0.060751914978027344, -0.05804634094238281, -0.05534076690673828, -0.05263519287109375, -0.04992961883544922, -0.04722404479980469, -0.044518470764160156, -0.041812896728515625, -0.039107322692871094, -0.03640174865722656, -0.03369617462158203, -0.0309906005859375, -0.02828502655029297, -0.025579452514648438, -0.022873878479003906, -0.020168304443359375, -0.017462730407714844, -0.014757156372070312, -0.012051582336425781, -0.00934600830078125, -0.006640434265136719, -0.0039348602294921875, -0.0012292861938476562, 0.001476287841796875, 0.004181861877441406, 0.0068874359130859375, 0.009593009948730469, 0.012298583984375, 0.015004158020019531, 0.017709732055664062, 0.020415306091308594, 0.023120880126953125, 0.025826454162597656, 0.028532028198242188, 0.03123760223388672, 0.03394317626953125, 0.03664875030517578, 0.03935432434082031, 0.042059898376464844, 0.044765472412109375, 0.047471046447753906, 0.05017662048339844, 0.05288219451904297, 0.0555877685546875, 0.05829334259033203, 0.06099891662597656, 0.0637044906616211, 0.06641006469726562, 0.06911563873291016, 0.07182121276855469, 0.07452678680419922, 0.07723236083984375, 0.07993793487548828, 0.08264350891113281, 0.08534908294677734, 0.08805465698242188, 0.0907602310180664, 0.09346580505371094, 0.09617137908935547, 0.098876953125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 12.0, 12.0, 16.0, 14.0, 17.0, 27.0, 24.0, 29.0, 32.0, 27.0, 42.0, 47.0, 42.0, 39.0, 42.0, 43.0, 40.0, 45.0, 41.0, 42.0, 47.0, 31.0, 36.0, 30.0, 27.0, 32.0, 19.0, 27.0, 17.0, 16.0, 17.0, 10.0, 9.0, 6.0, 11.0, 5.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026947021484375, -0.026000022888183594, -0.025053024291992188, -0.02410602569580078, -0.023159027099609375, -0.02221202850341797, -0.021265029907226562, -0.020318031311035156, -0.01937103271484375, -0.018424034118652344, -0.017477035522460938, -0.01653003692626953, -0.015583038330078125, -0.014636039733886719, -0.013689041137695312, -0.012742042541503906, -0.0117950439453125, -0.010848045349121094, -0.009901046752929688, -0.008954048156738281, -0.008007049560546875, -0.007060050964355469, -0.0061130523681640625, -0.005166053771972656, -0.00421905517578125, -0.0032720565795898438, -0.0023250579833984375, -0.0013780593872070312, -0.000431060791015625, 0.0005159378051757812, 0.0014629364013671875, 0.0024099349975585938, 0.00335693359375, 0.004303932189941406, 0.0052509307861328125, 0.006197929382324219, 0.007144927978515625, 0.008091926574707031, 0.009038925170898438, 0.009985923767089844, 0.01093292236328125, 0.011879920959472656, 0.012826919555664062, 0.013773918151855469, 0.014720916748046875, 0.01566791534423828, 0.016614913940429688, 0.017561912536621094, 0.0185089111328125, 0.019455909729003906, 0.020402908325195312, 0.02134990692138672, 0.022296905517578125, 0.02324390411376953, 0.024190902709960938, 0.025137901306152344, 0.02608489990234375, 0.027031898498535156, 0.027978897094726562, 0.02892589569091797, 0.029872894287109375, 0.03081989288330078, 0.03176689147949219, 0.032713890075683594, 0.033660888671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 16.0, 19.0, 36.0, 47.0, 70.0, 133.0, 161.0, 236.0, 357.0, 496.0, 743.0, 1127.0, 1768.0, 2549.0, 3846.0, 5761.0, 8882.0, 13972.0, 21848.0, 35093.0, 57969.0, 100597.0, 181565.0, 350136.0, 780443.0, 1349892.0, 611569.0, 289916.0, 152402.0, 86096.0, 51173.0, 30824.0, 19165.0, 12298.0, 7952.0, 5039.0, 3239.0, 2288.0, 1432.0, 1002.0, 681.0, 474.0, 307.0, 197.0, 138.0, 113.0, 69.0, 44.0, 26.0, 28.0, 12.0, 16.0, 5.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.043731689453125, -0.042380332946777344, -0.04102897644042969, -0.03967761993408203, -0.038326263427734375, -0.03697490692138672, -0.03562355041503906, -0.034272193908691406, -0.03292083740234375, -0.031569480895996094, -0.030218124389648438, -0.02886676788330078, -0.027515411376953125, -0.02616405487060547, -0.024812698364257812, -0.023461341857910156, -0.0221099853515625, -0.020758628845214844, -0.019407272338867188, -0.01805591583251953, -0.016704559326171875, -0.015353202819824219, -0.014001846313476562, -0.012650489807128906, -0.01129913330078125, -0.009947776794433594, -0.008596420288085938, -0.007245063781738281, -0.005893707275390625, -0.004542350769042969, -0.0031909942626953125, -0.0018396377563476562, -0.00048828125, 0.0008630752563476562, 0.0022144317626953125, 0.0035657882690429688, 0.004917144775390625, 0.006268501281738281, 0.0076198577880859375, 0.008971214294433594, 0.01032257080078125, 0.011673927307128906, 0.013025283813476562, 0.014376640319824219, 0.015727996826171875, 0.01707935333251953, 0.018430709838867188, 0.019782066345214844, 0.0211334228515625, 0.022484779357910156, 0.023836135864257812, 0.02518749237060547, 0.026538848876953125, 0.02789020538330078, 0.029241561889648438, 0.030592918395996094, 0.03194427490234375, 0.033295631408691406, 0.03464698791503906, 0.03599834442138672, 0.037349700927734375, 0.03870105743408203, 0.04005241394042969, 0.041403770446777344, 0.042755126953125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 9.0, 5.0, 9.0, 16.0, 12.0, 11.0, 22.0, 29.0, 31.0, 44.0, 60.0, 72.0, 61.0, 85.0, 88.0, 141.0, 152.0, 186.0, 204.0, 208.0, 223.0, 258.0, 287.0, 274.0, 239.0, 214.0, 178.0, 158.0, 129.0, 131.0, 83.0, 71.0, 74.0, 61.0, 44.0, 53.0, 37.0, 36.0, 16.0, 13.0, 12.0, 16.0, 5.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01509857177734375, -0.014648079872131348, -0.014197587966918945, -0.013747096061706543, -0.01329660415649414, -0.012846112251281738, -0.012395620346069336, -0.011945128440856934, -0.011494636535644531, -0.011044144630432129, -0.010593652725219727, -0.010143160820007324, -0.009692668914794922, -0.00924217700958252, -0.008791685104370117, -0.008341193199157715, -0.007890701293945312, -0.00744020938873291, -0.006989717483520508, -0.0065392255783081055, -0.006088733673095703, -0.005638241767883301, -0.0051877498626708984, -0.004737257957458496, -0.004286766052246094, -0.0038362741470336914, -0.003385782241821289, -0.0029352903366088867, -0.0024847984313964844, -0.002034306526184082, -0.0015838146209716797, -0.0011333227157592773, -0.000682830810546875, -0.00023233890533447266, 0.0002181529998779297, 0.000668644905090332, 0.0011191368103027344, 0.0015696287155151367, 0.002020120620727539, 0.0024706125259399414, 0.0029211044311523438, 0.003371596336364746, 0.0038220882415771484, 0.004272580146789551, 0.004723072052001953, 0.0051735639572143555, 0.005624055862426758, 0.00607454776763916, 0.0065250396728515625, 0.006975531578063965, 0.007426023483276367, 0.00787651538848877, 0.008327007293701172, 0.008777499198913574, 0.009227991104125977, 0.009678483009338379, 0.010128974914550781, 0.010579466819763184, 0.011029958724975586, 0.011480450630187988, 0.01193094253540039, 0.012381434440612793, 0.012831926345825195, 0.013282418251037598, 0.01373291015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 12.0, 18.0, 21.0, 23.0, 18.0, 46.0, 37.0, 60.0, 68.0, 53.0, 86.0, 81.0, 82.0, 84.0, 66.0, 40.0, 43.0, 31.0, 16.0, 18.0, 23.0, 8.0, 12.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0431818813085556, -0.041818127036094666, -0.04045437276363373, -0.03909061849117279, -0.03772686421871185, -0.036363113671541214, -0.034999359399080276, -0.03363560512661934, -0.0322718508541584, -0.030908096581697464, -0.029544342309236526, -0.028180589899420738, -0.0268168356269598, -0.025453081354498863, -0.024089328944683075, -0.022725574672222137, -0.0213618203997612, -0.019998066127300262, -0.018634311854839325, -0.017270559445023537, -0.0159068051725626, -0.014543050900101662, -0.013179297558963299, -0.011815544217824936, -0.010451789945363998, -0.009088035672903061, -0.007724282331764698, -0.006360528524965048, -0.004996774718165398, -0.0036330209113657475, -0.0022692671045660973, -0.0009055137634277344, 0.0004582405090332031, 0.0018219943158328533, 0.0031857481226325035, 0.004549501929432154, 0.005913255736231804, 0.007277009543031454, 0.008640763349831104, 0.010004516690969467, 0.011368270963430405, 0.012732025235891342, 0.014095778577029705, 0.015459531918168068, 0.016823286190629005, 0.018187040463089943, 0.01955079287290573, 0.02091454714536667, 0.022278301417827606, 0.023642055690288544, 0.02500580996274948, 0.02636956237256527, 0.027733316645026207, 0.029097070917487144, 0.030460823327302933, 0.03182457759976387, 0.03318833187222481, 0.034552086144685745, 0.03591584041714668, 0.03727959468960762, 0.03864334523677826, 0.0400070995092392, 0.041370853781700134, 0.04273460805416107, 0.04409836232662201]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 5.0, 8.0, 7.0, 10.0, 18.0, 15.0, 16.0, 23.0, 18.0, 33.0, 31.0, 36.0, 40.0, 23.0, 42.0, 40.0, 45.0, 35.0, 39.0, 40.0, 39.0, 39.0, 45.0, 45.0, 28.0, 22.0, 30.0, 25.0, 22.0, 30.0, 27.0, 23.0, 20.0, 12.0, 10.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03274519369006157, -0.031783267855644226, -0.030821340158581734, -0.02985941432416439, -0.028897486627101898, -0.027935560792684555, -0.026973634958267212, -0.02601170726120472, -0.025049779564142227, -0.024087853729724884, -0.02312592603266239, -0.02216400019824505, -0.021202072501182556, -0.020240146666765213, -0.01927822083234787, -0.018316293135285378, -0.017354367300868034, -0.01639244146645069, -0.015430513769388199, -0.014468587934970856, -0.013506660237908363, -0.01254473440349102, -0.011582807637751102, -0.010620880872011185, -0.009658954106271267, -0.00869702734053135, -0.007735100574791431, -0.006773174274712801, -0.005811247508972883, -0.0048493207432329655, -0.003887394443154335, -0.0029254676774144173, -0.0019635427743196487, -0.0010016161249950528, -3.9689475670456886e-05, 0.0009222370572388172, 0.001884163822978735, 0.0028460905887186527, 0.003808016888797283, 0.004769943654537201, 0.005731870420277119, 0.0066937971860170364, 0.007655723951756954, 0.008617650717496872, 0.009579576551914215, 0.010541504248976707, 0.01150343008339405, 0.012465356849133968, 0.013427283614873886, 0.014389210380613804, 0.015351137146353722, 0.016313062980771065, 0.017274990677833557, 0.0182369165122509, 0.019198842346668243, 0.020160770043730736, 0.021122697740793228, 0.02208462357521057, 0.023046551272273064, 0.024008477106690407, 0.0249704048037529, 0.025932330638170242, 0.026894256472587585, 0.027856184169650078, 0.02881811000406742]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 10.0, 16.0, 22.0, 36.0, 70.0, 84.0, 125.0, 193.0, 280.0, 455.0, 585.0, 866.0, 1295.0, 1885.0, 2899.0, 4187.0, 6437.0, 9815.0, 15223.0, 24261.0, 40061.0, 71628.0, 144258.0, 333571.0, 182722.0, 83715.0, 46323.0, 27643.0, 17251.0, 11023.0, 7220.0, 4725.0, 3174.0, 2064.0, 1392.0, 926.0, 673.0, 479.0, 299.0, 190.0, 128.0, 103.0, 83.0, 34.0, 46.0, 19.0, 15.0, 14.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.0281829833984375, -0.027344942092895508, -0.026506900787353516, -0.025668859481811523, -0.02483081817626953, -0.02399277687072754, -0.023154735565185547, -0.022316694259643555, -0.021478652954101562, -0.02064061164855957, -0.019802570343017578, -0.018964529037475586, -0.018126487731933594, -0.0172884464263916, -0.01645040512084961, -0.015612363815307617, -0.014774322509765625, -0.013936281204223633, -0.01309823989868164, -0.012260198593139648, -0.011422157287597656, -0.010584115982055664, -0.009746074676513672, -0.00890803337097168, -0.008069992065429688, -0.007231950759887695, -0.006393909454345703, -0.005555868148803711, -0.004717826843261719, -0.0038797855377197266, -0.0030417442321777344, -0.002203702926635742, -0.00136566162109375, -0.0005276203155517578, 0.0003104209899902344, 0.0011484622955322266, 0.0019865036010742188, 0.002824544906616211, 0.003662586212158203, 0.004500627517700195, 0.0053386688232421875, 0.00617671012878418, 0.007014751434326172, 0.007852792739868164, 0.008690834045410156, 0.009528875350952148, 0.01036691665649414, 0.011204957962036133, 0.012042999267578125, 0.012881040573120117, 0.01371908187866211, 0.014557123184204102, 0.015395164489746094, 0.016233205795288086, 0.017071247100830078, 0.01790928840637207, 0.018747329711914062, 0.019585371017456055, 0.020423412322998047, 0.02126145362854004, 0.02209949493408203, 0.022937536239624023, 0.023775577545166016, 0.024613618850708008, 0.02545166015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 12.0, 12.0, 13.0, 26.0, 22.0, 25.0, 21.0, 40.0, 38.0, 34.0, 35.0, 37.0, 45.0, 51.0, 49.0, 42.0, 42.0, 36.0, 34.0, 47.0, 32.0, 30.0, 29.0, 32.0, 27.0, 31.0, 21.0, 22.0, 18.0, 13.0, 15.0, 10.0, 8.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036651611328125, -0.03561520576477051, -0.034578800201416016, -0.03354239463806152, -0.03250598907470703, -0.03146958351135254, -0.030433177947998047, -0.029396772384643555, -0.028360366821289062, -0.02732396125793457, -0.026287555694580078, -0.025251150131225586, -0.024214744567871094, -0.0231783390045166, -0.02214193344116211, -0.021105527877807617, -0.020069122314453125, -0.019032716751098633, -0.01799631118774414, -0.01695990562438965, -0.015923500061035156, -0.014887094497680664, -0.013850688934326172, -0.01281428337097168, -0.011777877807617188, -0.010741472244262695, -0.009705066680908203, -0.008668661117553711, -0.007632255554199219, -0.0065958499908447266, -0.005559444427490234, -0.004523038864135742, -0.00348663330078125, -0.002450227737426758, -0.0014138221740722656, -0.00037741661071777344, 0.0006589889526367188, 0.001695394515991211, 0.002731800079345703, 0.0037682056427001953, 0.0048046112060546875, 0.00584101676940918, 0.006877422332763672, 0.007913827896118164, 0.008950233459472656, 0.009986639022827148, 0.01102304458618164, 0.012059450149536133, 0.013095855712890625, 0.014132261276245117, 0.01516866683959961, 0.0162050724029541, 0.017241477966308594, 0.018277883529663086, 0.019314289093017578, 0.02035069465637207, 0.021387100219726562, 0.022423505783081055, 0.023459911346435547, 0.02449631690979004, 0.02553272247314453, 0.026569128036499023, 0.027605533599853516, 0.028641939163208008, 0.0296783447265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 15.0, 16.0, 38.0, 39.0, 57.0, 73.0, 107.0, 137.0, 200.0, 319.0, 397.0, 582.0, 849.0, 1077.0, 1686.0, 2541.0, 3943.0, 6417.0, 11595.0, 23837.0, 63133.0, 622364.0, 223757.0, 42126.0, 17918.0, 9458.0, 5331.0, 3404.0, 2193.0, 1470.0, 964.0, 735.0, 522.0, 390.0, 250.0, 167.0, 117.0, 104.0, 55.0, 50.0, 34.0, 29.0, 17.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.051116943359375, -0.04945850372314453, -0.04780006408691406, -0.046141624450683594, -0.044483184814453125, -0.042824745178222656, -0.04116630554199219, -0.03950786590576172, -0.03784942626953125, -0.03619098663330078, -0.03453254699707031, -0.032874107360839844, -0.031215667724609375, -0.029557228088378906, -0.027898788452148438, -0.02624034881591797, -0.0245819091796875, -0.02292346954345703, -0.021265029907226562, -0.019606590270996094, -0.017948150634765625, -0.016289710998535156, -0.014631271362304688, -0.012972831726074219, -0.01131439208984375, -0.009655952453613281, -0.007997512817382812, -0.006339073181152344, -0.004680633544921875, -0.0030221939086914062, -0.0013637542724609375, 0.00029468536376953125, 0.001953125, 0.0036115646362304688, 0.0052700042724609375, 0.006928443908691406, 0.008586883544921875, 0.010245323181152344, 0.011903762817382812, 0.013562202453613281, 0.01522064208984375, 0.01687908172607422, 0.018537521362304688, 0.020195960998535156, 0.021854400634765625, 0.023512840270996094, 0.025171279907226562, 0.02682971954345703, 0.0284881591796875, 0.03014659881591797, 0.03180503845214844, 0.033463478088378906, 0.035121917724609375, 0.036780357360839844, 0.03843879699707031, 0.04009723663330078, 0.04175567626953125, 0.04341411590576172, 0.04507255554199219, 0.046730995178222656, 0.048389434814453125, 0.050047874450683594, 0.05170631408691406, 0.05336475372314453, 0.055023193359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 13.0, 12.0, 15.0, 14.0, 17.0, 18.0, 16.0, 12.0, 24.0, 21.0, 20.0, 20.0, 47.0, 32.0, 32.0, 45.0, 40.0, 38.0, 53.0, 28.0, 46.0, 44.0, 26.0, 35.0, 23.0, 34.0, 27.0, 35.0, 30.0, 28.0, 19.0, 18.0, 21.0, 22.0, 16.0, 11.0, 9.0, 6.0, 7.0, 4.0, 2.0, 9.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.0212554931640625, -0.020656585693359375, -0.02005767822265625, -0.019458770751953125, -0.01885986328125, -0.018260955810546875, -0.01766204833984375, -0.017063140869140625, -0.0164642333984375, -0.015865325927734375, -0.01526641845703125, -0.014667510986328125, -0.014068603515625, -0.013469696044921875, -0.01287078857421875, -0.012271881103515625, -0.0116729736328125, -0.011074066162109375, -0.01047515869140625, -0.009876251220703125, -0.00927734375, -0.008678436279296875, -0.00807952880859375, -0.007480621337890625, -0.0068817138671875, -0.006282806396484375, -0.00568389892578125, -0.005084991455078125, -0.004486083984375, -0.003887176513671875, -0.00328826904296875, -0.002689361572265625, -0.0020904541015625, -0.001491546630859375, -0.00089263916015625, -0.000293731689453125, 0.00030517578125, 0.000904083251953125, 0.00150299072265625, 0.002101898193359375, 0.0027008056640625, 0.003299713134765625, 0.00389862060546875, 0.004497528076171875, 0.005096435546875, 0.005695343017578125, 0.00629425048828125, 0.006893157958984375, 0.0074920654296875, 0.008090972900390625, 0.00868988037109375, 0.009288787841796875, 0.0098876953125, 0.010486602783203125, 0.01108551025390625, 0.011684417724609375, 0.0122833251953125, 0.012882232666015625, 0.01348114013671875, 0.014080047607421875, 0.014678955078125, 0.015277862548828125, 0.01587677001953125, 0.016475677490234375, 0.0170745849609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 4.0, 7.0, 17.0, 21.0, 27.0, 31.0, 54.0, 57.0, 74.0, 126.0, 144.0, 230.0, 308.0, 446.0, 665.0, 899.0, 1456.0, 2245.0, 3856.0, 6728.0, 13441.0, 33737.0, 204481.0, 689828.0, 51661.0, 17306.0, 8203.0, 4491.0, 2651.0, 1713.0, 1103.0, 769.0, 511.0, 365.0, 265.0, 171.0, 122.0, 103.0, 59.0, 45.0, 35.0, 23.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0059051513671875, -0.005715668201446533, -0.005526185035705566, -0.0053367018699646, -0.005147218704223633, -0.004957735538482666, -0.004768252372741699, -0.004578769207000732, -0.004389286041259766, -0.004199802875518799, -0.004010319709777832, -0.0038208365440368652, -0.0036313533782958984, -0.0034418702125549316, -0.003252387046813965, -0.003062903881072998, -0.0028734207153320312, -0.0026839375495910645, -0.0024944543838500977, -0.002304971218109131, -0.002115488052368164, -0.0019260048866271973, -0.0017365217208862305, -0.0015470385551452637, -0.0013575553894042969, -0.00116807222366333, -0.0009785890579223633, -0.0007891058921813965, -0.0005996227264404297, -0.0004101395606994629, -0.0002206563949584961, -3.11732292175293e-05, 0.0001583099365234375, 0.0003477931022644043, 0.0005372762680053711, 0.0007267594337463379, 0.0009162425994873047, 0.0011057257652282715, 0.0012952089309692383, 0.001484692096710205, 0.0016741752624511719, 0.0018636584281921387, 0.0020531415939331055, 0.0022426247596740723, 0.002432107925415039, 0.002621591091156006, 0.0028110742568969727, 0.0030005574226379395, 0.0031900405883789062, 0.003379523754119873, 0.00356900691986084, 0.0037584900856018066, 0.0039479732513427734, 0.00413745641708374, 0.004326939582824707, 0.004516422748565674, 0.004705905914306641, 0.004895389080047607, 0.005084872245788574, 0.005274355411529541, 0.005463838577270508, 0.005653321743011475, 0.005842804908752441, 0.006032288074493408, 0.006221771240234375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 13.0, 11.0, 9.0, 33.0, 18.0, 37.0, 113.0, 72.0, 70.0, 157.0, 68.0, 71.0, 143.0, 44.0, 33.0, 44.0, 13.0, 10.0, 11.0, 5.0, 8.0, 9.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.6030465960502625e-06, -2.5238841772079468e-06, -2.444721758365631e-06, -2.3655593395233154e-06, -2.2863969206809998e-06, -2.207234501838684e-06, -2.1280720829963684e-06, -2.0489096641540527e-06, -1.969747245311737e-06, -1.8905848264694214e-06, -1.8114224076271057e-06, -1.73225998878479e-06, -1.6530975699424744e-06, -1.5739351511001587e-06, -1.494772732257843e-06, -1.4156103134155273e-06, -1.3364478945732117e-06, -1.257285475730896e-06, -1.1781230568885803e-06, -1.0989606380462646e-06, -1.019798219203949e-06, -9.406358003616333e-07, -8.614733815193176e-07, -7.82310962677002e-07, -7.031485438346863e-07, -6.239861249923706e-07, -5.448237061500549e-07, -4.6566128730773926e-07, -3.864988684654236e-07, -3.073364496231079e-07, -2.2817403078079224e-07, -1.4901161193847656e-07, -6.984919309616089e-08, 9.313225746154785e-09, 8.847564458847046e-08, 1.6763806343078613e-07, 2.468004822731018e-07, 3.259629011154175e-07, 4.0512531995773315e-07, 4.842877388000488e-07, 5.634501576423645e-07, 6.426125764846802e-07, 7.217749953269958e-07, 8.009374141693115e-07, 8.800998330116272e-07, 9.592622518539429e-07, 1.0384246706962585e-06, 1.1175870895385742e-06, 1.1967495083808899e-06, 1.2759119272232056e-06, 1.3550743460655212e-06, 1.434236764907837e-06, 1.5133991837501526e-06, 1.5925616025924683e-06, 1.671724021434784e-06, 1.7508864402770996e-06, 1.8300488591194153e-06, 1.909211277961731e-06, 1.9883736968040466e-06, 2.0675361156463623e-06, 2.146698534488678e-06, 2.2258609533309937e-06, 2.3050233721733093e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 5.0, 4.0, 2.0, 7.0, 3.0, 11.0, 18.0, 21.0, 25.0, 48.0, 69.0, 115.0, 160.0, 255.0, 404.0, 617.0, 927.0, 1558.0, 2586.0, 4445.0, 7654.0, 13956.0, 27585.0, 64863.0, 261142.0, 502970.0, 85899.0, 34564.0, 16707.0, 8940.0, 5131.0, 3002.0, 1846.0, 1125.0, 660.0, 434.0, 276.0, 165.0, 103.0, 84.0, 51.0, 38.0, 28.0, 20.0, 10.0, 10.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.004726409912109375, -0.004569590091705322, -0.0044127702713012695, -0.004255950450897217, -0.004099130630493164, -0.003942310810089111, -0.0037854909896850586, -0.003628671169281006, -0.003471851348876953, -0.0033150315284729004, -0.0031582117080688477, -0.003001391887664795, -0.002844572067260742, -0.0026877522468566895, -0.0025309324264526367, -0.002374112606048584, -0.0022172927856445312, -0.0020604729652404785, -0.0019036531448364258, -0.001746833324432373, -0.0015900135040283203, -0.0014331936836242676, -0.0012763738632202148, -0.0011195540428161621, -0.0009627342224121094, -0.0008059144020080566, -0.0006490945816040039, -0.0004922747611999512, -0.00033545494079589844, -0.0001786351203918457, -2.181529998779297e-05, 0.00013500452041625977, 0.0002918243408203125, 0.00044864416122436523, 0.000605463981628418, 0.0007622838020324707, 0.0009191036224365234, 0.0010759234428405762, 0.001232743263244629, 0.0013895630836486816, 0.0015463829040527344, 0.0017032027244567871, 0.0018600225448608398, 0.0020168423652648926, 0.0021736621856689453, 0.002330482006072998, 0.0024873018264770508, 0.0026441216468811035, 0.0028009414672851562, 0.002957761287689209, 0.0031145811080932617, 0.0032714009284973145, 0.003428220748901367, 0.00358504056930542, 0.0037418603897094727, 0.0038986802101135254, 0.004055500030517578, 0.004212319850921631, 0.004369139671325684, 0.004525959491729736, 0.004682779312133789, 0.004839599132537842, 0.0049964189529418945, 0.005153238773345947, 0.00531005859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 4.0, 6.0, 4.0, 3.0, 7.0, 7.0, 7.0, 13.0, 10.0, 24.0, 25.0, 26.0, 45.0, 55.0, 84.0, 140.0, 169.0, 97.0, 76.0, 44.0, 38.0, 21.0, 20.0, 14.0, 8.0, 9.0, 10.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.0018768310546875, -0.001826271414756775, -0.0017757117748260498, -0.0017251521348953247, -0.0016745924949645996, -0.0016240328550338745, -0.0015734732151031494, -0.0015229135751724243, -0.0014723539352416992, -0.0014217942953109741, -0.001371234655380249, -0.001320675015449524, -0.0012701153755187988, -0.0012195557355880737, -0.0011689960956573486, -0.0011184364557266235, -0.0010678768157958984, -0.0010173171758651733, -0.0009667575359344482, -0.0009161978960037231, -0.000865638256072998, -0.000815078616142273, -0.0007645189762115479, -0.0007139593362808228, -0.0006633996963500977, -0.0006128400564193726, -0.0005622804164886475, -0.0005117207765579224, -0.00046116113662719727, -0.00041060149669647217, -0.00036004185676574707, -0.00030948221683502197, -0.0002589225769042969, -0.00020836293697357178, -0.00015780329704284668, -0.00010724365711212158, -5.6684017181396484e-05, -6.124377250671387e-06, 4.443526268005371e-05, 9.499490261077881e-05, 0.0001455545425415039, 0.000196114182472229, 0.0002466738224029541, 0.0002972334623336792, 0.0003477931022644043, 0.0003983527421951294, 0.0004489123821258545, 0.0004994720220565796, 0.0005500316619873047, 0.0006005913019180298, 0.0006511509418487549, 0.00070171058177948, 0.0007522702217102051, 0.0008028298616409302, 0.0008533895015716553, 0.0009039491415023804, 0.0009545087814331055, 0.0010050684213638306, 0.0010556280612945557, 0.0011061877012252808, 0.0011567473411560059, 0.001207306981086731, 0.001257866621017456, 0.0013084262609481812, 0.0013589859008789062]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 9.0, 20.0, 28.0, 23.0, 24.0, 36.0, 40.0, 76.0, 61.0, 72.0, 95.0, 85.0, 96.0, 63.0, 59.0, 41.0, 35.0, 17.0, 23.0, 15.0, 12.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044713977724313736, -0.04331965744495392, -0.0419253371655941, -0.04053101688623428, -0.039136696606874466, -0.03774237632751465, -0.03634805232286453, -0.03495373576879501, -0.0335594117641449, -0.03216509148478508, -0.030770771205425262, -0.029376450926065445, -0.027982130646705627, -0.02658781036734581, -0.025193488225340843, -0.023799167945981026, -0.022404849529266357, -0.02101052924990654, -0.019616208970546722, -0.018221888691186905, -0.016827568411827087, -0.015433247201144695, -0.014038925990462303, -0.012644605711102486, -0.011250285431742668, -0.00985596515238285, -0.008461644873023033, -0.007067323662340641, -0.0056730033829808235, -0.004278683103621006, -0.002884361892938614, -0.0014900416135787964, -9.572133421897888e-05, 0.0012985991779714823, 0.0026929196901619434, 0.004087240435183048, 0.005481560714542866, 0.006875880993902683, 0.008270202204585075, 0.009664522483944893, 0.01105884276330471, 0.012453163042664528, 0.013847483322024345, 0.015241804532706738, 0.01663612574338913, 0.018030446022748947, 0.019424766302108765, 0.020819086581468582, 0.0222134068608284, 0.023607727140188217, 0.025002047419548035, 0.026396367698907852, 0.02779068797826767, 0.029185008257627487, 0.030579330399632454, 0.03197365254163742, 0.03336796909570694, 0.03476228937506676, 0.036156609654426575, 0.03755092993378639, 0.03894525021314621, 0.04033957049250603, 0.041733890771865845, 0.04312821477651596, 0.04452253505587578]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 6.0, 9.0, 8.0, 17.0, 14.0, 17.0, 23.0, 17.0, 31.0, 32.0, 37.0, 34.0, 32.0, 38.0, 40.0, 46.0, 36.0, 41.0, 40.0, 37.0, 35.0, 47.0, 47.0, 28.0, 23.0, 32.0, 23.0, 25.0, 34.0, 22.0, 24.0, 18.0, 14.0, 10.0, 14.0, 11.0, 7.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03296642005443573, -0.03200586512684822, -0.03104531019926071, -0.030084755271673203, -0.029124202206730843, -0.028163647279143333, -0.027203092351555824, -0.026242537423968315, -0.025281984359025955, -0.024321429431438446, -0.023360874503850937, -0.022400319576263428, -0.021439766511321068, -0.02047921158373356, -0.01951865665614605, -0.01855810172855854, -0.01759754680097103, -0.016636991873383522, -0.015676436945796013, -0.014715882949531078, -0.013755328953266144, -0.012794774025678635, -0.011834219098091125, -0.010873664170503616, -0.009913110174238682, -0.008952555246651173, -0.007992001250386238, -0.007031446322798729, -0.006070891860872507, -0.005110337398946285, -0.004149782471358776, -0.0031892280094325542, -0.002228671684861183, -0.0012681171065196395, -0.0003075625281780958, 0.0006529921665787697, 0.0016135466285049915, 0.0025741010904312134, 0.0035346560180187225, 0.004495210479944944, 0.005455764941871166, 0.006416319403797388, 0.00737687386572361, 0.008337428793311119, 0.009297983720898628, 0.010258537717163563, 0.011219092644751072, 0.012179646641016006, 0.013140201568603516, 0.014100756496191025, 0.01506131049245596, 0.016021866351366043, 0.016982419416308403, 0.017942974343895912, 0.01890352927148342, 0.01986408419907093, 0.02082463726401329, 0.0217851921916008, 0.02274574711918831, 0.023706302046775818, 0.024666855111718178, 0.025627410039305687, 0.026587964966893196, 0.027548519894480705, 0.028509074822068214]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 16.0, 21.0, 39.0, 43.0, 82.0, 98.0, 165.0, 252.0, 369.0, 604.0, 803.0, 1231.0, 1777.0, 2791.0, 4320.0, 6852.0, 10281.0, 16095.0, 25456.0, 40783.0, 68503.0, 123042.0, 237594.0, 221326.0, 114747.0, 64555.0, 38818.0, 24316.0, 15282.0, 9860.0, 6277.0, 4195.0, 2656.0, 1763.0, 1221.0, 762.0, 494.0, 339.0, 254.0, 153.0, 112.0, 56.0, 44.0, 30.0, 18.0, 17.0, 8.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.058013916015625, -0.05625295639038086, -0.05449199676513672, -0.05273103713989258, -0.05097007751464844, -0.0492091178894043, -0.047448158264160156, -0.045687198638916016, -0.043926239013671875, -0.042165279388427734, -0.040404319763183594, -0.03864336013793945, -0.03688240051269531, -0.03512144088745117, -0.03336048126220703, -0.03159952163696289, -0.02983856201171875, -0.02807760238647461, -0.02631664276123047, -0.024555683135986328, -0.022794723510742188, -0.021033763885498047, -0.019272804260253906, -0.017511844635009766, -0.015750885009765625, -0.013989925384521484, -0.012228965759277344, -0.010468006134033203, -0.008707046508789062, -0.006946086883544922, -0.005185127258300781, -0.0034241676330566406, -0.0016632080078125, 9.775161743164062e-05, 0.0018587112426757812, 0.003619670867919922, 0.0053806304931640625, 0.007141590118408203, 0.008902549743652344, 0.010663509368896484, 0.012424468994140625, 0.014185428619384766, 0.015946388244628906, 0.017707347869873047, 0.019468307495117188, 0.021229267120361328, 0.02299022674560547, 0.02475118637084961, 0.02651214599609375, 0.02827310562133789, 0.03003406524658203, 0.03179502487182617, 0.03355598449707031, 0.03531694412231445, 0.037077903747558594, 0.038838863372802734, 0.040599822998046875, 0.042360782623291016, 0.044121742248535156, 0.0458827018737793, 0.04764366149902344, 0.04940462112426758, 0.05116558074951172, 0.05292654037475586, 0.0546875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 7.0, 6.0, 9.0, 13.0, 9.0, 16.0, 22.0, 15.0, 24.0, 25.0, 23.0, 26.0, 33.0, 40.0, 37.0, 42.0, 49.0, 43.0, 44.0, 47.0, 37.0, 44.0, 35.0, 45.0, 32.0, 36.0, 24.0, 25.0, 23.0, 35.0, 29.0, 25.0, 20.0, 14.0, 11.0, 7.0, 12.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.030059814453125, -0.02916717529296875, -0.0282745361328125, -0.02738189697265625, -0.0264892578125, -0.02559661865234375, -0.0247039794921875, -0.02381134033203125, -0.022918701171875, -0.02202606201171875, -0.0211334228515625, -0.02024078369140625, -0.01934814453125, -0.01845550537109375, -0.0175628662109375, -0.01667022705078125, -0.015777587890625, -0.01488494873046875, -0.0139923095703125, -0.01309967041015625, -0.01220703125, -0.01131439208984375, -0.0104217529296875, -0.00952911376953125, -0.008636474609375, -0.00774383544921875, -0.0068511962890625, -0.00595855712890625, -0.00506591796875, -0.00417327880859375, -0.0032806396484375, -0.00238800048828125, -0.001495361328125, -0.00060272216796875, 0.0002899169921875, 0.00118255615234375, 0.0020751953125, 0.00296783447265625, 0.0038604736328125, 0.00475311279296875, 0.005645751953125, 0.00653839111328125, 0.0074310302734375, 0.00832366943359375, 0.00921630859375, 0.01010894775390625, 0.0110015869140625, 0.01189422607421875, 0.012786865234375, 0.01367950439453125, 0.0145721435546875, 0.01546478271484375, 0.016357421875, 0.01725006103515625, 0.0181427001953125, 0.01903533935546875, 0.019927978515625, 0.02082061767578125, 0.0217132568359375, 0.02260589599609375, 0.02349853515625, 0.02439117431640625, 0.0252838134765625, 0.02617645263671875, 0.027069091796875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 9.0, 25.0, 23.0, 29.0, 49.0, 74.0, 117.0, 176.0, 235.0, 378.0, 576.0, 867.0, 1332.0, 1994.0, 3216.0, 4988.0, 7632.0, 12209.0, 19013.0, 31352.0, 51254.0, 86351.0, 158804.0, 273664.0, 165657.0, 89368.0, 52535.0, 32388.0, 19768.0, 12465.0, 7725.0, 4790.0, 3208.0, 2135.0, 1346.0, 922.0, 596.0, 409.0, 294.0, 193.0, 113.0, 88.0, 62.0, 38.0, 28.0, 17.0, 16.0, 3.0, 7.0, 5.0, 4.0, 1.0, 4.0], "bins": [-0.061676025390625, -0.059889793395996094, -0.05810356140136719, -0.05631732940673828, -0.054531097412109375, -0.05274486541748047, -0.05095863342285156, -0.049172401428222656, -0.04738616943359375, -0.045599937438964844, -0.04381370544433594, -0.04202747344970703, -0.040241241455078125, -0.03845500946044922, -0.03666877746582031, -0.034882545471191406, -0.0330963134765625, -0.031310081481933594, -0.029523849487304688, -0.02773761749267578, -0.025951385498046875, -0.02416515350341797, -0.022378921508789062, -0.020592689514160156, -0.01880645751953125, -0.017020225524902344, -0.015233993530273438, -0.013447761535644531, -0.011661529541015625, -0.009875297546386719, -0.008089065551757812, -0.006302833557128906, -0.0045166015625, -0.0027303695678710938, -0.0009441375732421875, 0.0008420944213867188, 0.002628326416015625, 0.004414558410644531, 0.0062007904052734375, 0.007987022399902344, 0.00977325439453125, 0.011559486389160156, 0.013345718383789062, 0.015131950378417969, 0.016918182373046875, 0.01870441436767578, 0.020490646362304688, 0.022276878356933594, 0.0240631103515625, 0.025849342346191406, 0.027635574340820312, 0.02942180633544922, 0.031208038330078125, 0.03299427032470703, 0.03478050231933594, 0.036566734313964844, 0.03835296630859375, 0.040139198303222656, 0.04192543029785156, 0.04371166229248047, 0.045497894287109375, 0.04728412628173828, 0.04907035827636719, 0.050856590270996094, 0.052642822265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 10.0, 11.0, 14.0, 12.0, 21.0, 12.0, 24.0, 16.0, 31.0, 29.0, 32.0, 30.0, 50.0, 45.0, 43.0, 47.0, 50.0, 40.0, 42.0, 38.0, 37.0, 49.0, 38.0, 43.0, 35.0, 18.0, 30.0, 36.0, 21.0, 21.0, 9.0, 18.0, 11.0, 8.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0163421630859375, -0.015743017196655273, -0.015143871307373047, -0.01454472541809082, -0.013945579528808594, -0.013346433639526367, -0.01274728775024414, -0.012148141860961914, -0.011548995971679688, -0.010949850082397461, -0.010350704193115234, -0.009751558303833008, -0.009152412414550781, -0.008553266525268555, -0.007954120635986328, -0.0073549747467041016, -0.006755828857421875, -0.0061566829681396484, -0.005557537078857422, -0.004958391189575195, -0.004359245300292969, -0.003760099411010742, -0.0031609535217285156, -0.002561807632446289, -0.0019626617431640625, -0.001363515853881836, -0.0007643699645996094, -0.0001652240753173828, 0.00043392181396484375, 0.0010330677032470703, 0.0016322135925292969, 0.0022313594818115234, 0.00283050537109375, 0.0034296512603759766, 0.004028797149658203, 0.00462794303894043, 0.005227088928222656, 0.005826234817504883, 0.006425380706787109, 0.007024526596069336, 0.0076236724853515625, 0.008222818374633789, 0.008821964263916016, 0.009421110153198242, 0.010020256042480469, 0.010619401931762695, 0.011218547821044922, 0.011817693710327148, 0.012416839599609375, 0.013015985488891602, 0.013615131378173828, 0.014214277267456055, 0.014813423156738281, 0.015412569046020508, 0.016011714935302734, 0.01661086082458496, 0.017210006713867188, 0.017809152603149414, 0.01840829849243164, 0.019007444381713867, 0.019606590270996094, 0.02020573616027832, 0.020804882049560547, 0.021404027938842773, 0.022003173828125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 9.0, 21.0, 20.0, 32.0, 54.0, 55.0, 93.0, 109.0, 159.0, 247.0, 316.0, 500.0, 661.0, 1012.0, 1358.0, 2130.0, 3173.0, 5390.0, 9520.0, 20768.0, 62304.0, 663593.0, 203138.0, 38485.0, 14913.0, 7545.0, 4311.0, 2801.0, 1771.0, 1190.0, 788.0, 574.0, 377.0, 314.0, 250.0, 139.0, 115.0, 83.0, 67.0, 44.0, 32.0, 13.0, 23.0, 12.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0047607421875, -0.004611074924468994, -0.004461407661437988, -0.004311740398406982, -0.0041620731353759766, -0.004012405872344971, -0.003862738609313965, -0.003713071346282959, -0.003563404083251953, -0.0034137368202209473, -0.0032640695571899414, -0.0031144022941589355, -0.0029647350311279297, -0.002815067768096924, -0.002665400505065918, -0.002515733242034912, -0.0023660659790039062, -0.0022163987159729004, -0.0020667314529418945, -0.0019170641899108887, -0.0017673969268798828, -0.001617729663848877, -0.001468062400817871, -0.0013183951377868652, -0.0011687278747558594, -0.0010190606117248535, -0.0008693933486938477, -0.0007197260856628418, -0.0005700588226318359, -0.0004203915596008301, -0.0002707242965698242, -0.00012105703353881836, 2.86102294921875e-05, 0.00017827749252319336, 0.0003279447555541992, 0.0004776120185852051, 0.0006272792816162109, 0.0007769465446472168, 0.0009266138076782227, 0.0010762810707092285, 0.0012259483337402344, 0.0013756155967712402, 0.001525282859802246, 0.001674950122833252, 0.0018246173858642578, 0.0019742846488952637, 0.0021239519119262695, 0.0022736191749572754, 0.0024232864379882812, 0.002572953701019287, 0.002722620964050293, 0.002872288227081299, 0.0030219554901123047, 0.0031716227531433105, 0.0033212900161743164, 0.0034709572792053223, 0.003620624542236328, 0.003770291805267334, 0.00391995906829834, 0.004069626331329346, 0.0042192935943603516, 0.004368960857391357, 0.004518628120422363, 0.004668295383453369, 0.004817962646484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 11.0, 12.0, 11.0, 17.0, 30.0, 0.0, 37.0, 66.0, 102.0, 118.0, 138.0, 124.0, 0.0, 113.0, 83.0, 39.0, 30.0, 20.0, 11.0, 0.0, 9.0, 4.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.319684088230133e-06, -1.2684613466262817e-06, -1.2172386050224304e-06, -1.166015863418579e-06, -1.1147931218147278e-06, -1.0635703802108765e-06, -1.0123476386070251e-06, -9.611248970031738e-07, -9.099021553993225e-07, -8.586794137954712e-07, -8.074566721916199e-07, -7.562339305877686e-07, -7.050111889839172e-07, -6.537884473800659e-07, -6.025657057762146e-07, -5.513429641723633e-07, -5.00120222568512e-07, -4.4889748096466064e-07, -3.976747393608093e-07, -3.46451997756958e-07, -2.952292561531067e-07, -2.4400651454925537e-07, -1.9278377294540405e-07, -1.4156103134155273e-07, -9.033828973770142e-08, -3.91155481338501e-08, 1.210719347000122e-08, 6.332993507385254e-08, 1.1455267667770386e-07, 1.6577541828155518e-07, 2.169981598854065e-07, 2.682209014892578e-07, 3.1944364309310913e-07, 3.7066638469696045e-07, 4.2188912630081177e-07, 4.731118679046631e-07, 5.243346095085144e-07, 5.755573511123657e-07, 6.26780092716217e-07, 6.780028343200684e-07, 7.292255759239197e-07, 7.80448317527771e-07, 8.316710591316223e-07, 8.828938007354736e-07, 9.34116542339325e-07, 9.853392839431763e-07, 1.0365620255470276e-06, 1.087784767150879e-06, 1.1390075087547302e-06, 1.1902302503585815e-06, 1.2414529919624329e-06, 1.2926757335662842e-06, 1.3438984751701355e-06, 1.3951212167739868e-06, 1.4463439583778381e-06, 1.4975666999816895e-06, 1.5487894415855408e-06, 1.600012183189392e-06, 1.6512349247932434e-06, 1.7024576663970947e-06, 1.753680408000946e-06, 1.8049031496047974e-06, 1.8561258912086487e-06, 1.9073486328125e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 2.0, 5.0, 8.0, 19.0, 14.0, 20.0, 28.0, 34.0, 49.0, 75.0, 90.0, 125.0, 168.0, 228.0, 339.0, 458.0, 724.0, 977.0, 1574.0, 2351.0, 3867.0, 6430.0, 11634.0, 22921.0, 75072.0, 735411.0, 122635.0, 29720.0, 13381.0, 7560.0, 4490.0, 2744.0, 1722.0, 1091.0, 745.0, 525.0, 365.0, 266.0, 185.0, 145.0, 98.0, 71.0, 49.0, 41.0, 22.0, 14.0, 15.0, 12.0, 12.0, 8.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00493621826171875, -0.004780173301696777, -0.004624128341674805, -0.004468083381652832, -0.004312038421630859, -0.004155993461608887, -0.003999948501586914, -0.0038439035415649414, -0.0036878585815429688, -0.003531813621520996, -0.0033757686614990234, -0.0032197237014770508, -0.003063678741455078, -0.0029076337814331055, -0.002751588821411133, -0.00259554386138916, -0.0024394989013671875, -0.002283453941345215, -0.002127408981323242, -0.0019713640213012695, -0.0018153190612792969, -0.0016592741012573242, -0.0015032291412353516, -0.001347184181213379, -0.0011911392211914062, -0.0010350942611694336, -0.0008790493011474609, -0.0007230043411254883, -0.0005669593811035156, -0.00041091442108154297, -0.0002548694610595703, -9.882450103759766e-05, 5.7220458984375e-05, 0.00021326541900634766, 0.0003693103790283203, 0.000525355339050293, 0.0006814002990722656, 0.0008374452590942383, 0.000993490219116211, 0.0011495351791381836, 0.0013055801391601562, 0.001461625099182129, 0.0016176700592041016, 0.0017737150192260742, 0.0019297599792480469, 0.0020858049392700195, 0.002241849899291992, 0.002397894859313965, 0.0025539398193359375, 0.00270998477935791, 0.002866029739379883, 0.0030220746994018555, 0.003178119659423828, 0.0033341646194458008, 0.0034902095794677734, 0.003646254539489746, 0.0038022994995117188, 0.003958344459533691, 0.004114389419555664, 0.004270434379577637, 0.004426479339599609, 0.004582524299621582, 0.004738569259643555, 0.004894614219665527, 0.0050506591796875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 2.0, 4.0, 7.0, 10.0, 17.0, 13.0, 14.0, 21.0, 59.0, 149.0, 346.0, 148.0, 76.0, 32.0, 15.0, 8.0, 14.0, 5.0, 7.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001644134521484375, -0.0015965253114700317, -0.0015489161014556885, -0.0015013068914413452, -0.001453697681427002, -0.0014060884714126587, -0.0013584792613983154, -0.0013108700513839722, -0.001263260841369629, -0.0012156516313552856, -0.0011680424213409424, -0.0011204332113265991, -0.0010728240013122559, -0.0010252147912979126, -0.0009776055812835693, -0.0009299963712692261, -0.0008823871612548828, -0.0008347779512405396, -0.0007871687412261963, -0.000739559531211853, -0.0006919503211975098, -0.0006443411111831665, -0.0005967319011688232, -0.00054912269115448, -0.0005015134811401367, -0.00045390427112579346, -0.0004062950611114502, -0.00035868585109710693, -0.00031107664108276367, -0.0002634674310684204, -0.00021585822105407715, -0.0001682490110397339, -0.00012063980102539062, -7.303059101104736e-05, -2.54213809967041e-05, 2.218782901763916e-05, 6.979703903198242e-05, 0.00011740624904632568, 0.00016501545906066895, 0.0002126246690750122, 0.00026023387908935547, 0.00030784308910369873, 0.000355452299118042, 0.00040306150913238525, 0.0004506707191467285, 0.0004982799291610718, 0.000545889139175415, 0.0005934983491897583, 0.0006411075592041016, 0.0006887167692184448, 0.0007363259792327881, 0.0007839351892471313, 0.0008315443992614746, 0.0008791536092758179, 0.0009267628192901611, 0.0009743720293045044, 0.0010219812393188477, 0.001069590449333191, 0.0011171996593475342, 0.0011648088693618774, 0.0012124180793762207, 0.001260027289390564, 0.0013076364994049072, 0.0013552457094192505, 0.0014028549194335938]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 12.0, 7.0, 15.0, 17.0, 20.0, 28.0, 23.0, 28.0, 40.0, 50.0, 51.0, 71.0, 97.0, 106.0, 71.0, 53.0, 68.0, 48.0, 37.0, 37.0, 19.0, 21.0, 15.0, 12.0, 10.0, 6.0, 7.0, 8.0, 1.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.03839346393942833, -0.03717665746808052, -0.03595985099673271, -0.034743040800094604, -0.033526234328746796, -0.03230942785739899, -0.031092621386051178, -0.02987581491470337, -0.02865900844335556, -0.02744220197200775, -0.026225393638014793, -0.025008587166666985, -0.023791780695319176, -0.022574972361326218, -0.02135816588997841, -0.0201413594186306, -0.018924551084637642, -0.017707744613289833, -0.016490936279296875, -0.015274129807949066, -0.014057323336601257, -0.012840515933930874, -0.01162370853126049, -0.010406902059912682, -0.009190094657242298, -0.007973287254571915, -0.006756480783224106, -0.005539673380553722, -0.004322866443544626, -0.00310605950653553, -0.0018892521038651466, -0.0006724456325173378, 0.0005443617701530457, 0.0017611688235774636, 0.0029779758770018816, 0.004194783046841621, 0.0054115899838507175, 0.006628396920859814, 0.007845204323530197, 0.009062010794878006, 0.01027881819754839, 0.011495625600218773, 0.012712432071566582, 0.013929239474236965, 0.015146046876907349, 0.016362853348255157, 0.017579659819602966, 0.018796466290950775, 0.020013274624943733, 0.021230081096291542, 0.0224468894302845, 0.02366369590163231, 0.024880502372980118, 0.026097308844327927, 0.027314117178320885, 0.028530923649668694, 0.02974773198366165, 0.03096453845500946, 0.03218134492635727, 0.03339815139770508, 0.034614961594343185, 0.035831768065690994, 0.0370485745370388, 0.03826538100838661, 0.03948218747973442]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 13.0, 9.0, 14.0, 15.0, 19.0, 25.0, 16.0, 33.0, 21.0, 44.0, 27.0, 29.0, 33.0, 39.0, 33.0, 41.0, 35.0, 23.0, 41.0, 31.0, 31.0, 50.0, 30.0, 42.0, 26.0, 27.0, 26.0, 28.0, 24.0, 19.0, 21.0, 19.0, 20.0, 9.0, 11.0, 11.0, 9.0, 12.0, 8.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.02709183655679226, -0.02627384476363659, -0.02545585110783577, -0.0246378593146801, -0.02381986565887928, -0.02300187386572361, -0.02218388020992279, -0.02136588841676712, -0.02054789662361145, -0.01972990483045578, -0.01891191117465496, -0.01809391938149929, -0.01727592572569847, -0.0164579339325428, -0.01563994213938713, -0.014821948483586311, -0.014003954827785492, -0.013185962103307247, -0.012367969378829002, -0.011549977585673332, -0.010731983929872513, -0.009913992136716843, -0.009095999412238598, -0.008278006687760353, -0.007460013963282108, -0.0066420212388038635, -0.005824028514325619, -0.005006036255508661, -0.0041880435310304165, -0.0033700508065521717, -0.0025520585477352142, -0.0017340658232569695, -0.0009160712361335754, -9.807862807065248e-05, 0.0007199139799922705, 0.0015379064716398716, 0.0023558991961181164, 0.003173891920596361, 0.003991884179413319, 0.004809876903891563, 0.005627869628369808, 0.006445862352848053, 0.007263855077326298, 0.008081847801804543, 0.008899839594960213, 0.009717833250761032, 0.010535825043916702, 0.011353817768394947, 0.012171810492873192, 0.012989803217351437, 0.013807795941829681, 0.014625787734985352, 0.015443781390786171, 0.01626177318394184, 0.01707976683974266, 0.01789775863289833, 0.018715750426054, 0.01953374221920967, 0.02035173587501049, 0.02116972766816616, 0.02198772132396698, 0.02280571311712265, 0.02362370491027832, 0.02444169856607914, 0.02525969222187996]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 9.0, 5.0, 24.0, 35.0, 48.0, 57.0, 104.0, 158.0, 215.0, 344.0, 493.0, 750.0, 1039.0, 1605.0, 2314.0, 3395.0, 5005.0, 7300.0, 10926.0, 16372.0, 24844.0, 39798.0, 65058.0, 112142.0, 214753.0, 595188.0, 1624470.0, 863190.0, 272641.0, 132687.0, 74932.0, 44393.0, 27702.0, 17792.0, 11599.0, 7554.0, 4988.0, 3445.0, 2173.0, 1537.0, 1023.0, 685.0, 529.0, 318.0, 222.0, 151.0, 103.0, 64.0, 40.0, 21.0, 21.0, 8.0, 8.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03167724609375, -0.030608654022216797, -0.029540061950683594, -0.02847146987915039, -0.027402877807617188, -0.026334285736083984, -0.02526569366455078, -0.024197101593017578, -0.023128509521484375, -0.022059917449951172, -0.02099132537841797, -0.019922733306884766, -0.018854141235351562, -0.01778554916381836, -0.016716957092285156, -0.015648365020751953, -0.01457977294921875, -0.013511180877685547, -0.012442588806152344, -0.01137399673461914, -0.010305404663085938, -0.009236812591552734, -0.008168220520019531, -0.007099628448486328, -0.006031036376953125, -0.004962444305419922, -0.0038938522338867188, -0.0028252601623535156, -0.0017566680908203125, -0.0006880760192871094, 0.00038051605224609375, 0.0014491081237792969, 0.0025177001953125, 0.003586292266845703, 0.004654884338378906, 0.005723476409912109, 0.0067920684814453125, 0.007860660552978516, 0.008929252624511719, 0.009997844696044922, 0.011066436767578125, 0.012135028839111328, 0.013203620910644531, 0.014272212982177734, 0.015340805053710938, 0.01640939712524414, 0.017477989196777344, 0.018546581268310547, 0.01961517333984375, 0.020683765411376953, 0.021752357482910156, 0.02282094955444336, 0.023889541625976562, 0.024958133697509766, 0.02602672576904297, 0.027095317840576172, 0.028163909912109375, 0.029232501983642578, 0.03030109405517578, 0.031369686126708984, 0.03243827819824219, 0.03350687026977539, 0.034575462341308594, 0.0356440544128418, 0.036712646484375]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 12.0, 10.0, 9.0, 13.0, 16.0, 22.0, 15.0, 23.0, 24.0, 27.0, 46.0, 25.0, 23.0, 31.0, 38.0, 41.0, 35.0, 35.0, 36.0, 38.0, 29.0, 36.0, 44.0, 36.0, 44.0, 39.0, 28.0, 23.0, 25.0, 28.0, 27.0, 18.0, 11.0, 14.0, 14.0, 14.0, 12.0, 13.0, 8.0, 1.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016845703125, -0.01634061336517334, -0.01583552360534668, -0.01533043384552002, -0.01482534408569336, -0.0143202543258667, -0.013815164566040039, -0.013310074806213379, -0.012804985046386719, -0.012299895286560059, -0.011794805526733398, -0.011289715766906738, -0.010784626007080078, -0.010279536247253418, -0.009774446487426758, -0.009269356727600098, -0.008764266967773438, -0.008259177207946777, -0.007754087448120117, -0.007248997688293457, -0.006743907928466797, -0.006238818168640137, -0.0057337284088134766, -0.005228638648986816, -0.004723548889160156, -0.004218459129333496, -0.003713369369506836, -0.0032082796096801758, -0.0027031898498535156, -0.0021981000900268555, -0.0016930103302001953, -0.0011879205703735352, -0.000682830810546875, -0.00017774105072021484, 0.0003273487091064453, 0.0008324384689331055, 0.0013375282287597656, 0.0018426179885864258, 0.002347707748413086, 0.002852797508239746, 0.0033578872680664062, 0.0038629770278930664, 0.0043680667877197266, 0.004873156547546387, 0.005378246307373047, 0.005883336067199707, 0.006388425827026367, 0.006893515586853027, 0.0073986053466796875, 0.007903695106506348, 0.008408784866333008, 0.008913874626159668, 0.009418964385986328, 0.009924054145812988, 0.010429143905639648, 0.010934233665466309, 0.011439323425292969, 0.011944413185119629, 0.012449502944946289, 0.01295459270477295, 0.01345968246459961, 0.01396477222442627, 0.01446986198425293, 0.01497495174407959, 0.01548004150390625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 9.0, 4.0, 12.0, 13.0, 20.0, 42.0, 46.0, 58.0, 126.0, 169.0, 258.0, 459.0, 714.0, 1063.0, 1689.0, 2834.0, 4593.0, 7586.0, 13209.0, 22270.0, 39554.0, 72148.0, 134894.0, 271757.0, 636813.0, 1531573.0, 788006.0, 320987.0, 154990.0, 81578.0, 44903.0, 25431.0, 14513.0, 8572.0, 5096.0, 3052.0, 1946.0, 1172.0, 743.0, 489.0, 331.0, 205.0, 136.0, 84.0, 51.0, 37.0, 26.0, 15.0, 12.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02764892578125, -0.026682376861572266, -0.02571582794189453, -0.024749279022216797, -0.023782730102539062, -0.022816181182861328, -0.021849632263183594, -0.02088308334350586, -0.019916534423828125, -0.01894998550415039, -0.017983436584472656, -0.017016887664794922, -0.016050338745117188, -0.015083789825439453, -0.014117240905761719, -0.013150691986083984, -0.01218414306640625, -0.011217594146728516, -0.010251045227050781, -0.009284496307373047, -0.008317947387695312, -0.007351398468017578, -0.006384849548339844, -0.005418300628662109, -0.004451751708984375, -0.0034852027893066406, -0.0025186538696289062, -0.0015521049499511719, -0.0005855560302734375, 0.0003809928894042969, 0.0013475418090820312, 0.0023140907287597656, 0.0032806396484375, 0.004247188568115234, 0.005213737487792969, 0.006180286407470703, 0.0071468353271484375, 0.008113384246826172, 0.009079933166503906, 0.01004648208618164, 0.011013031005859375, 0.01197957992553711, 0.012946128845214844, 0.013912677764892578, 0.014879226684570312, 0.015845775604248047, 0.01681232452392578, 0.017778873443603516, 0.01874542236328125, 0.019711971282958984, 0.02067852020263672, 0.021645069122314453, 0.022611618041992188, 0.023578166961669922, 0.024544715881347656, 0.02551126480102539, 0.026477813720703125, 0.02744436264038086, 0.028410911560058594, 0.029377460479736328, 0.030344009399414062, 0.0313105583190918, 0.03227710723876953, 0.033243656158447266, 0.034210205078125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 14.0, 17.0, 16.0, 25.0, 31.0, 34.0, 33.0, 36.0, 54.0, 62.0, 81.0, 84.0, 100.0, 98.0, 122.0, 129.0, 161.0, 209.0, 195.0, 209.0, 251.0, 266.0, 232.0, 238.0, 164.0, 156.0, 155.0, 157.0, 108.0, 100.0, 72.0, 77.0, 70.0, 56.0, 53.0, 36.0, 42.0, 29.0, 17.0, 18.0, 11.0, 10.0, 9.0, 3.0, 5.0, 7.0, 0.0, 2.0, 2.0, 4.0, 3.0], "bins": [-0.00852203369140625, -0.008272528648376465, -0.00802302360534668, -0.0077735185623168945, -0.007524013519287109, -0.007274508476257324, -0.007025003433227539, -0.006775498390197754, -0.006525993347167969, -0.006276488304138184, -0.0060269832611083984, -0.005777478218078613, -0.005527973175048828, -0.005278468132019043, -0.005028963088989258, -0.004779458045959473, -0.0045299530029296875, -0.004280447959899902, -0.004030942916870117, -0.003781437873840332, -0.003531932830810547, -0.0032824277877807617, -0.0030329227447509766, -0.0027834177017211914, -0.0025339126586914062, -0.002284407615661621, -0.002034902572631836, -0.0017853975296020508, -0.0015358924865722656, -0.0012863874435424805, -0.0010368824005126953, -0.0007873773574829102, -0.000537872314453125, -0.00028836727142333984, -3.886222839355469e-05, 0.00021064281463623047, 0.0004601478576660156, 0.0007096529006958008, 0.0009591579437255859, 0.001208662986755371, 0.0014581680297851562, 0.0017076730728149414, 0.0019571781158447266, 0.0022066831588745117, 0.002456188201904297, 0.002705693244934082, 0.002955198287963867, 0.0032047033309936523, 0.0034542083740234375, 0.0037037134170532227, 0.003953218460083008, 0.004202723503112793, 0.004452228546142578, 0.004701733589172363, 0.0049512386322021484, 0.005200743675231934, 0.005450248718261719, 0.005699753761291504, 0.005949258804321289, 0.006198763847351074, 0.006448268890380859, 0.0066977739334106445, 0.00694727897644043, 0.007196784019470215, 0.0074462890625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 6.0, 1.0, 10.0, 11.0, 17.0, 16.0, 17.0, 25.0, 37.0, 48.0, 33.0, 58.0, 65.0, 72.0, 84.0, 93.0, 72.0, 63.0, 61.0, 28.0, 50.0, 19.0, 20.0, 17.0, 13.0, 10.0, 8.0, 6.0, 3.0, 6.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022141853347420692, -0.021349061280488968, -0.020556269213557243, -0.01976347528398037, -0.018970683217048645, -0.01817789115011692, -0.017385099083185196, -0.016592305153608322, -0.015799513086676598, -0.015006721019744873, -0.014213928021490574, -0.01342113595455885, -0.01262834295630455, -0.011835550889372826, -0.011042758822441101, -0.010249965824186802, -0.009457173757255077, -0.008664381690323353, -0.007871588692069054, -0.007078796625137329, -0.00628600362688303, -0.005493211559951305, -0.0047004190273582935, -0.003907626494765282, -0.00311483396217227, -0.002322041429579258, -0.001529249013401568, -0.0007364565972238779, 5.633593536913395e-05, 0.0008491282351315022, 0.001641920767724514, 0.002434713300317526, 0.0032275058329105377, 0.00402029836550355, 0.004813090898096561, 0.005605882965028286, 0.006398675963282585, 0.00719146803021431, 0.007984260097146034, 0.008777053095400333, 0.009569846093654633, 0.010362638160586357, 0.011155431158840656, 0.01194822322577238, 0.01274101622402668, 0.013533808290958405, 0.014326600357890129, 0.015119393356144428, 0.015912186354398727, 0.016704978421330452, 0.017497770488262177, 0.01829056441783905, 0.019083356484770775, 0.0198761485517025, 0.020668940618634224, 0.02146173268556595, 0.022254524752497673, 0.023047316819429398, 0.023840108886361122, 0.024632902815937996, 0.02542569488286972, 0.026218486949801445, 0.02701127901673317, 0.027804072946310043, 0.028596865013241768]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 3.0, 7.0, 17.0, 16.0, 14.0, 19.0, 23.0, 19.0, 22.0, 33.0, 25.0, 27.0, 37.0, 29.0, 41.0, 45.0, 44.0, 37.0, 45.0, 35.0, 41.0, 47.0, 49.0, 33.0, 34.0, 29.0, 22.0, 28.0, 31.0, 17.0, 25.0, 20.0, 13.0, 15.0, 10.0, 8.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020570410415530205, -0.01997828297317028, -0.019386157393455505, -0.01879402995109558, -0.018201902508735657, -0.01760977692902088, -0.017017649486660957, -0.016425523906946182, -0.015833396464586258, -0.015241269953548908, -0.014649143442511559, -0.014057016000151634, -0.013464889489114285, -0.012872762978076935, -0.01228063553571701, -0.01168850902467966, -0.011096382513642311, -0.010504256002604961, -0.009912129491567612, -0.009320002049207687, -0.008727875538170338, -0.008135749027132988, -0.007543622050434351, -0.006951495073735714, -0.006359368562698364, -0.0057672420516610146, -0.0051751150749623775, -0.0045829880982637405, -0.003990861587226391, -0.0033987348433583975, -0.002806608099490404, -0.002214481122791767, -0.0016223546117544174, -0.001030227867886424, -0.0004381011240184307, 0.00015402561984956264, 0.000746152363717556, 0.0013382791075855494, 0.0019304058514535427, 0.0025225328281521797, 0.0031146593391895294, 0.0037067860830575228, 0.004298912826925516, 0.004891039803624153, 0.005483166314661503, 0.0060752928256988525, 0.0066674198023974895, 0.0072595467790961266, 0.007851673290133476, 0.008443799801170826, 0.009035926312208176, 0.0096280537545681, 0.01022018026560545, 0.0108123067766428, 0.011404434219002724, 0.011996560730040073, 0.012588687241077423, 0.013180813752114773, 0.013772940263152122, 0.014365067705512047, 0.014957194216549397, 0.015549320727586746, 0.01614144816994667, 0.016733575612306595, 0.01732570119202137]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 8.0, 8.0, 8.0, 11.0, 11.0, 13.0, 36.0, 42.0, 62.0, 84.0, 95.0, 159.0, 226.0, 367.0, 547.0, 773.0, 1272.0, 1894.0, 3028.0, 4852.0, 8103.0, 14042.0, 25602.0, 51585.0, 118837.0, 382632.0, 254507.0, 88499.0, 40318.0, 20731.0, 11756.0, 6936.0, 4118.0, 2612.0, 1642.0, 1014.0, 717.0, 431.0, 297.0, 210.0, 159.0, 97.0, 61.0, 44.0, 25.0, 27.0, 28.0, 20.0, 5.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.017911195755004883, -0.017267704010009766, -0.01662421226501465, -0.01598072052001953, -0.015337228775024414, -0.014693737030029297, -0.01405024528503418, -0.013406753540039062, -0.012763261795043945, -0.012119770050048828, -0.011476278305053711, -0.010832786560058594, -0.010189294815063477, -0.00954580307006836, -0.008902311325073242, -0.008258819580078125, -0.007615327835083008, -0.006971836090087891, -0.0063283443450927734, -0.005684852600097656, -0.005041360855102539, -0.004397869110107422, -0.0037543773651123047, -0.0031108856201171875, -0.0024673938751220703, -0.0018239021301269531, -0.001180410385131836, -0.0005369186401367188, 0.00010657310485839844, 0.0007500648498535156, 0.0013935565948486328, 0.00203704833984375, 0.002680540084838867, 0.0033240318298339844, 0.0039675235748291016, 0.004611015319824219, 0.005254507064819336, 0.005897998809814453, 0.00654149055480957, 0.0071849822998046875, 0.007828474044799805, 0.008471965789794922, 0.009115457534790039, 0.009758949279785156, 0.010402441024780273, 0.01104593276977539, 0.011689424514770508, 0.012332916259765625, 0.012976408004760742, 0.01361989974975586, 0.014263391494750977, 0.014906883239746094, 0.015550374984741211, 0.016193866729736328, 0.016837358474731445, 0.017480850219726562, 0.01812434196472168, 0.018767833709716797, 0.019411325454711914, 0.02005481719970703, 0.02069830894470215, 0.021341800689697266, 0.021985292434692383, 0.0226287841796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 16.0, 16.0, 15.0, 23.0, 16.0, 20.0, 23.0, 33.0, 28.0, 42.0, 37.0, 35.0, 38.0, 40.0, 55.0, 48.0, 46.0, 42.0, 55.0, 39.0, 30.0, 41.0, 28.0, 33.0, 19.0, 21.0, 21.0, 31.0, 12.0, 20.0, 20.0, 8.0, 7.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0224151611328125, -0.021768569946289062, -0.021121978759765625, -0.020475387573242188, -0.01982879638671875, -0.019182205200195312, -0.018535614013671875, -0.017889022827148438, -0.017242431640625, -0.016595840454101562, -0.015949249267578125, -0.015302658081054688, -0.01465606689453125, -0.014009475708007812, -0.013362884521484375, -0.012716293334960938, -0.0120697021484375, -0.011423110961914062, -0.010776519775390625, -0.010129928588867188, -0.00948333740234375, -0.008836746215820312, -0.008190155029296875, -0.0075435638427734375, -0.00689697265625, -0.0062503814697265625, -0.005603790283203125, -0.0049571990966796875, -0.00431060791015625, -0.0036640167236328125, -0.003017425537109375, -0.0023708343505859375, -0.0017242431640625, -0.0010776519775390625, -0.000431060791015625, 0.0002155303955078125, 0.00086212158203125, 0.0015087127685546875, 0.002155303955078125, 0.0028018951416015625, 0.003448486328125, 0.0040950775146484375, 0.004741668701171875, 0.0053882598876953125, 0.00603485107421875, 0.0066814422607421875, 0.007328033447265625, 0.007974624633789062, 0.0086212158203125, 0.009267807006835938, 0.009914398193359375, 0.010560989379882812, 0.01120758056640625, 0.011854171752929688, 0.012500762939453125, 0.013147354125976562, 0.0137939453125, 0.014440536499023438, 0.015087127685546875, 0.015733718872070312, 0.01638031005859375, 0.017026901245117188, 0.017673492431640625, 0.018320083618164062, 0.0189666748046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 1.0, 7.0, 10.0, 21.0, 28.0, 27.0, 42.0, 65.0, 98.0, 160.0, 201.0, 360.0, 521.0, 812.0, 1257.0, 2017.0, 3378.0, 5870.0, 11126.0, 25227.0, 85091.0, 743035.0, 111708.0, 28857.0, 12389.0, 6483.0, 3702.0, 2199.0, 1344.0, 847.0, 527.0, 356.0, 266.0, 144.0, 113.0, 77.0, 69.0, 40.0, 18.0, 15.0, 19.0, 10.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04168701171875, -0.04044532775878906, -0.039203643798828125, -0.03796195983886719, -0.03672027587890625, -0.03547859191894531, -0.034236907958984375, -0.03299522399902344, -0.0317535400390625, -0.030511856079101562, -0.029270172119140625, -0.028028488159179688, -0.02678680419921875, -0.025545120239257812, -0.024303436279296875, -0.023061752319335938, -0.021820068359375, -0.020578384399414062, -0.019336700439453125, -0.018095016479492188, -0.01685333251953125, -0.015611648559570312, -0.014369964599609375, -0.013128280639648438, -0.0118865966796875, -0.010644912719726562, -0.009403228759765625, -0.008161544799804688, -0.00691986083984375, -0.0056781768798828125, -0.004436492919921875, -0.0031948089599609375, -0.001953125, -0.0007114410400390625, 0.000530242919921875, 0.0017719268798828125, 0.00301361083984375, 0.0042552947998046875, 0.005496978759765625, 0.0067386627197265625, 0.0079803466796875, 0.009222030639648438, 0.010463714599609375, 0.011705398559570312, 0.01294708251953125, 0.014188766479492188, 0.015430450439453125, 0.016672134399414062, 0.017913818359375, 0.019155502319335938, 0.020397186279296875, 0.021638870239257812, 0.02288055419921875, 0.024122238159179688, 0.025363922119140625, 0.026605606079101562, 0.0278472900390625, 0.029088973999023438, 0.030330657958984375, 0.03157234191894531, 0.03281402587890625, 0.03405570983886719, 0.035297393798828125, 0.03653907775878906, 0.03778076171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 10.0, 3.0, 7.0, 9.0, 10.0, 10.0, 16.0, 11.0, 17.0, 19.0, 26.0, 22.0, 27.0, 28.0, 31.0, 43.0, 32.0, 32.0, 41.0, 38.0, 38.0, 42.0, 46.0, 38.0, 38.0, 34.0, 42.0, 35.0, 25.0, 27.0, 35.0, 33.0, 24.0, 15.0, 24.0, 16.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01015472412109375, -0.009767413139343262, -0.009380102157592773, -0.008992791175842285, -0.008605480194091797, -0.008218169212341309, -0.00783085823059082, -0.007443547248840332, -0.007056236267089844, -0.0066689252853393555, -0.006281614303588867, -0.005894303321838379, -0.005506992340087891, -0.005119681358337402, -0.004732370376586914, -0.004345059394836426, -0.0039577484130859375, -0.0035704374313354492, -0.003183126449584961, -0.0027958154678344727, -0.0024085044860839844, -0.002021193504333496, -0.0016338825225830078, -0.0012465715408325195, -0.0008592605590820312, -0.00047194957733154297, -8.463859558105469e-05, 0.0003026723861694336, 0.0006899833679199219, 0.0010772943496704102, 0.0014646053314208984, 0.0018519163131713867, 0.002239227294921875, 0.0026265382766723633, 0.0030138492584228516, 0.00340116024017334, 0.003788471221923828, 0.004175782203674316, 0.004563093185424805, 0.004950404167175293, 0.005337715148925781, 0.0057250261306762695, 0.006112337112426758, 0.006499648094177246, 0.006886959075927734, 0.007274270057678223, 0.007661581039428711, 0.0080488920211792, 0.008436203002929688, 0.008823513984680176, 0.009210824966430664, 0.009598135948181152, 0.00998544692993164, 0.010372757911682129, 0.010760068893432617, 0.011147379875183105, 0.011534690856933594, 0.011922001838684082, 0.01230931282043457, 0.012696623802185059, 0.013083934783935547, 0.013471245765686035, 0.013858556747436523, 0.014245867729187012, 0.0146331787109375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 14.0, 15.0, 7.0, 14.0, 19.0, 28.0, 31.0, 46.0, 52.0, 115.0, 121.0, 158.0, 228.0, 395.0, 593.0, 1032.0, 1826.0, 3661.0, 8419.0, 26933.0, 691321.0, 275010.0, 23077.0, 7659.0, 3306.0, 1683.0, 960.0, 598.0, 362.0, 257.0, 159.0, 132.0, 79.0, 80.0, 38.0, 23.0, 16.0, 22.0, 15.0, 17.0, 9.0, 4.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.006374359130859375, -0.006168365478515625, -0.005962371826171875, -0.005756378173828125, -0.005550384521484375, -0.005344390869140625, -0.005138397216796875, -0.004932403564453125, -0.004726409912109375, -0.004520416259765625, -0.004314422607421875, -0.004108428955078125, -0.003902435302734375, -0.003696441650390625, -0.003490447998046875, -0.003284454345703125, -0.003078460693359375, -0.002872467041015625, -0.002666473388671875, -0.002460479736328125, -0.002254486083984375, -0.002048492431640625, -0.001842498779296875, -0.001636505126953125, -0.001430511474609375, -0.001224517822265625, -0.001018524169921875, -0.000812530517578125, -0.000606536865234375, -0.000400543212890625, -0.000194549560546875, 1.1444091796875e-05, 0.000217437744140625, 0.000423431396484375, 0.000629425048828125, 0.000835418701171875, 0.001041412353515625, 0.001247406005859375, 0.001453399658203125, 0.001659393310546875, 0.001865386962890625, 0.002071380615234375, 0.002277374267578125, 0.002483367919921875, 0.002689361572265625, 0.002895355224609375, 0.003101348876953125, 0.003307342529296875, 0.003513336181640625, 0.003719329833984375, 0.003925323486328125, 0.004131317138671875, 0.004337310791015625, 0.004543304443359375, 0.004749298095703125, 0.004955291748046875, 0.005161285400390625, 0.005367279052734375, 0.005573272705078125, 0.005779266357421875, 0.005985260009765625, 0.006191253662109375, 0.006397247314453125, 0.006603240966796875, 0.006809234619140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 12.0, 16.0, 0.0, 22.0, 28.0, 37.0, 0.0, 46.0, 51.0, 70.0, 0.0, 82.0, 90.0, 94.0, 0.0, 93.0, 91.0, 68.0, 0.0, 55.0, 40.0, 30.0, 0.0, 23.0, 13.0, 11.0, 0.0, 10.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5050172805786133e-06, -1.4603137969970703e-06, -1.4156103134155273e-06, -1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06, 1.1771917343139648e-06, 1.2218952178955078e-06, 1.2665987014770508e-06, 1.3113021850585938e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 4.0, 17.0, 19.0, 22.0, 43.0, 45.0, 69.0, 76.0, 153.0, 185.0, 289.0, 430.0, 657.0, 1146.0, 2192.0, 5023.0, 14436.0, 63438.0, 778008.0, 144514.0, 23685.0, 7321.0, 2997.0, 1424.0, 782.0, 478.0, 320.0, 243.0, 141.0, 116.0, 76.0, 55.0, 39.0, 29.0, 21.0, 22.0, 7.0, 6.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007411956787109375, -0.007185220718383789, -0.006958484649658203, -0.006731748580932617, -0.006505012512207031, -0.006278276443481445, -0.006051540374755859, -0.0058248043060302734, -0.0055980682373046875, -0.0053713321685791016, -0.005144596099853516, -0.00491786003112793, -0.004691123962402344, -0.004464387893676758, -0.004237651824951172, -0.004010915756225586, -0.0037841796875, -0.003557443618774414, -0.003330707550048828, -0.003103971481323242, -0.0028772354125976562, -0.0026504993438720703, -0.0024237632751464844, -0.0021970272064208984, -0.0019702911376953125, -0.0017435550689697266, -0.0015168190002441406, -0.0012900829315185547, -0.0010633468627929688, -0.0008366107940673828, -0.0006098747253417969, -0.00038313865661621094, -0.000156402587890625, 7.033348083496094e-05, 0.0002970695495605469, 0.0005238056182861328, 0.0007505416870117188, 0.0009772777557373047, 0.0012040138244628906, 0.0014307498931884766, 0.0016574859619140625, 0.0018842220306396484, 0.0021109580993652344, 0.0023376941680908203, 0.0025644302368164062, 0.002791166305541992, 0.003017902374267578, 0.003244638442993164, 0.00347137451171875, 0.003698110580444336, 0.003924846649169922, 0.004151582717895508, 0.004378318786621094, 0.00460505485534668, 0.004831790924072266, 0.0050585269927978516, 0.0052852630615234375, 0.0055119991302490234, 0.005738735198974609, 0.005965471267700195, 0.006192207336425781, 0.006418943405151367, 0.006645679473876953, 0.006872415542602539, 0.007099151611328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 9.0, 16.0, 22.0, 29.0, 64.0, 115.0, 316.0, 199.0, 88.0, 54.0, 22.0, 13.0, 19.0, 6.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001361846923828125, -0.001320376992225647, -0.001278907060623169, -0.001237437129020691, -0.0011959671974182129, -0.0011544972658157349, -0.0011130273342132568, -0.0010715574026107788, -0.0010300874710083008, -0.0009886175394058228, -0.0009471476078033447, -0.0009056776762008667, -0.0008642077445983887, -0.0008227378129959106, -0.0007812678813934326, -0.0007397979497909546, -0.0006983280181884766, -0.0006568580865859985, -0.0006153881549835205, -0.0005739182233810425, -0.0005324482917785645, -0.0004909783601760864, -0.0004495084285736084, -0.00040803849697113037, -0.00036656856536865234, -0.0003250986337661743, -0.0002836287021636963, -0.00024215877056121826, -0.00020068883895874023, -0.0001592189073562622, -0.00011774897575378418, -7.627904415130615e-05, -3.4809112548828125e-05, 6.660819053649902e-06, 4.813075065612793e-05, 8.960068225860596e-05, 0.00013107061386108398, 0.000172540545463562, 0.00021401047706604004, 0.00025548040866851807, 0.0002969503402709961, 0.0003384202718734741, 0.00037989020347595215, 0.0004213601350784302, 0.0004628300666809082, 0.0005042999982833862, 0.0005457699298858643, 0.0005872398614883423, 0.0006287097930908203, 0.0006701797246932983, 0.0007116496562957764, 0.0007531195878982544, 0.0007945895195007324, 0.0008360594511032104, 0.0008775293827056885, 0.0009189993143081665, 0.0009604692459106445, 0.0010019391775131226, 0.0010434091091156006, 0.0010848790407180786, 0.0011263489723205566, 0.0011678189039230347, 0.0012092888355255127, 0.0012507587671279907, 0.0012922286987304688]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 11.0, 11.0, 13.0, 18.0, 17.0, 23.0, 30.0, 38.0, 42.0, 56.0, 81.0, 58.0, 99.0, 93.0, 77.0, 67.0, 61.0, 41.0, 32.0, 23.0, 16.0, 17.0, 14.0, 12.0, 7.0, 5.0, 2.0, 1.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021865997463464737, -0.02105432003736496, -0.020242640748620033, -0.019430963322520256, -0.01861928403377533, -0.017807606607675552, -0.016995927318930626, -0.01618424989283085, -0.015372570604085922, -0.01456089224666357, -0.013749213889241219, -0.012937535531818867, -0.012125857174396515, -0.011314179748296738, -0.010502500459551811, -0.009690823033452034, -0.008879144676029682, -0.00806746631860733, -0.0072557879611849785, -0.006444109603762627, -0.005632431246340275, -0.00482075335457921, -0.0040090749971568584, -0.0031973966397345066, -0.0023857182823121548, -0.001574039924889803, -0.0007623616838827729, 4.931655712425709e-05, 0.0008609949145466089, 0.001672673039138317, 0.002484351396560669, 0.0032960297539830208, 0.004107708111405373, 0.0049193864688277245, 0.005731064826250076, 0.006542743183672428, 0.00735442154109478, 0.008166098967194557, 0.008977778255939484, 0.00978945568203926, 0.010601134970784187, 0.01141281332820654, 0.012224491685628891, 0.013036170043051243, 0.013847848400473595, 0.014659525826573372, 0.015471205115318298, 0.016282882541418076, 0.017094559967517853, 0.01790623739361763, 0.018717916682362556, 0.019529594108462334, 0.02034127339720726, 0.021152950823307037, 0.021964630112051964, 0.02277630753815174, 0.023587986826896667, 0.024399664252996445, 0.02521134354174137, 0.02602302096784115, 0.026834700256586075, 0.027646377682685852, 0.02845805697143078, 0.029269734397530556, 0.030081413686275482]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 3.0, 9.0, 16.0, 17.0, 15.0, 20.0, 21.0, 18.0, 24.0, 26.0, 31.0, 31.0, 38.0, 23.0, 51.0, 36.0, 47.0, 37.0, 44.0, 36.0, 39.0, 44.0, 54.0, 36.0, 29.0, 31.0, 21.0, 27.0, 32.0, 14.0, 28.0, 18.0, 14.0, 14.0, 10.0, 8.0, 6.0, 9.0, 5.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020207522436976433, -0.019622666761279106, -0.01903780922293663, -0.018452953547239304, -0.017868097871541977, -0.01728324219584465, -0.016698384657502174, -0.016113528981804848, -0.015528672374784946, -0.014943815767765045, -0.014358960092067719, -0.013774103485047817, -0.013189246878027916, -0.01260439120233059, -0.012019534595310688, -0.011434677988290787, -0.01084982231259346, -0.010264965705573559, -0.009680110029876232, -0.009095253422856331, -0.008510397747159004, -0.007925541140139103, -0.007340684533119202, -0.006755828391760588, -0.006170972250401974, -0.00558611610904336, -0.005001259967684746, -0.0044164033606648445, -0.0038315472193062305, -0.0032466910779476166, -0.002661834703758359, -0.0020769783295691013, -0.0014921203255653381, -0.0009072640677914023, -0.00032240781001746655, 0.00026244844775646925, 0.000847304705530405, 0.001432160846889019, 0.0020170172210782766, 0.0026018735952675343, 0.0031867297366261482, 0.003771585877984762, 0.004356442019343376, 0.0049412986263632774, 0.005526154767721891, 0.006111010909080505, 0.006695867516100407, 0.007280723657459021, 0.007865579798817635, 0.008450436405837536, 0.009035292081534863, 0.009620148688554764, 0.01020500436425209, 0.010789860971271992, 0.011374717578291893, 0.01195957325398922, 0.012544429861009121, 0.013129286468029022, 0.013714142143726349, 0.01429899875074625, 0.014883855357766151, 0.015468711033463478, 0.016053566709160805, 0.01663842424750328, 0.017223279923200607]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 13.0, 23.0, 43.0, 54.0, 82.0, 118.0, 188.0, 267.0, 348.0, 504.0, 738.0, 1079.0, 1496.0, 2219.0, 3176.0, 4705.0, 6735.0, 9973.0, 14559.0, 22243.0, 33891.0, 53773.0, 87582.0, 150481.0, 238004.0, 159927.0, 92567.0, 56654.0, 35796.0, 22933.0, 15440.0, 10201.0, 7072.0, 4761.0, 3336.0, 2260.0, 1636.0, 1193.0, 820.0, 515.0, 353.0, 263.0, 193.0, 121.0, 58.0, 45.0, 35.0, 19.0, 15.0, 13.0, 9.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.0291290283203125, -0.02817559242248535, -0.027222156524658203, -0.026268720626831055, -0.025315284729003906, -0.024361848831176758, -0.02340841293334961, -0.02245497703552246, -0.021501541137695312, -0.020548105239868164, -0.019594669342041016, -0.018641233444213867, -0.01768779754638672, -0.01673436164855957, -0.015780925750732422, -0.014827489852905273, -0.013874053955078125, -0.012920618057250977, -0.011967182159423828, -0.01101374626159668, -0.010060310363769531, -0.009106874465942383, -0.008153438568115234, -0.007200002670288086, -0.0062465667724609375, -0.005293130874633789, -0.004339694976806641, -0.003386259078979492, -0.0024328231811523438, -0.0014793872833251953, -0.0005259513854980469, 0.00042748451232910156, 0.00138092041015625, 0.0023343563079833984, 0.003287792205810547, 0.004241228103637695, 0.005194664001464844, 0.006148099899291992, 0.007101535797119141, 0.008054971694946289, 0.009008407592773438, 0.009961843490600586, 0.010915279388427734, 0.011868715286254883, 0.012822151184082031, 0.01377558708190918, 0.014729022979736328, 0.015682458877563477, 0.016635894775390625, 0.017589330673217773, 0.018542766571044922, 0.01949620246887207, 0.02044963836669922, 0.021403074264526367, 0.022356510162353516, 0.023309946060180664, 0.024263381958007812, 0.02521681785583496, 0.02617025375366211, 0.027123689651489258, 0.028077125549316406, 0.029030561447143555, 0.029983997344970703, 0.03093743324279785, 0.031890869140625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 9.0, 5.0, 9.0, 11.0, 17.0, 21.0, 11.0, 16.0, 25.0, 28.0, 26.0, 29.0, 31.0, 40.0, 34.0, 39.0, 37.0, 49.0, 35.0, 51.0, 47.0, 55.0, 42.0, 34.0, 37.0, 41.0, 28.0, 25.0, 25.0, 22.0, 20.0, 25.0, 8.0, 12.0, 9.0, 11.0, 6.0, 8.0, 9.0, 4.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0179595947265625, -0.017437219619750977, -0.016914844512939453, -0.01639246940612793, -0.015870094299316406, -0.015347719192504883, -0.01482534408569336, -0.014302968978881836, -0.013780593872070312, -0.013258218765258789, -0.012735843658447266, -0.012213468551635742, -0.011691093444824219, -0.011168718338012695, -0.010646343231201172, -0.010123968124389648, -0.009601593017578125, -0.009079217910766602, -0.008556842803955078, -0.008034467697143555, -0.007512092590332031, -0.006989717483520508, -0.006467342376708984, -0.005944967269897461, -0.0054225921630859375, -0.004900217056274414, -0.004377841949462891, -0.003855466842651367, -0.0033330917358398438, -0.0028107166290283203, -0.002288341522216797, -0.0017659664154052734, -0.00124359130859375, -0.0007212162017822266, -0.00019884109497070312, 0.0003235340118408203, 0.0008459091186523438, 0.0013682842254638672, 0.0018906593322753906, 0.002413034439086914, 0.0029354095458984375, 0.003457784652709961, 0.003980159759521484, 0.004502534866333008, 0.005024909973144531, 0.005547285079956055, 0.006069660186767578, 0.0065920352935791016, 0.007114410400390625, 0.0076367855072021484, 0.008159160614013672, 0.008681535720825195, 0.009203910827636719, 0.009726285934448242, 0.010248661041259766, 0.010771036148071289, 0.011293411254882812, 0.011815786361694336, 0.01233816146850586, 0.012860536575317383, 0.013382911682128906, 0.01390528678894043, 0.014427661895751953, 0.014950037002563477, 0.015472412109375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 7.0, 6.0, 10.0, 6.0, 25.0, 26.0, 47.0, 53.0, 84.0, 124.0, 194.0, 290.0, 399.0, 590.0, 931.0, 1271.0, 2127.0, 3150.0, 4905.0, 7694.0, 12217.0, 19848.0, 32565.0, 55039.0, 93205.0, 171914.0, 271082.0, 154048.0, 85780.0, 50650.0, 29966.0, 18526.0, 11306.0, 7313.0, 4621.0, 2868.0, 1908.0, 1245.0, 842.0, 528.0, 353.0, 254.0, 183.0, 117.0, 74.0, 52.0, 29.0, 25.0, 24.0, 8.0, 18.0, 4.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.035369873046875, -0.03427886962890625, -0.0331878662109375, -0.03209686279296875, -0.031005859375, -0.02991485595703125, -0.0288238525390625, -0.02773284912109375, -0.026641845703125, -0.02555084228515625, -0.0244598388671875, -0.02336883544921875, -0.02227783203125, -0.02118682861328125, -0.0200958251953125, -0.01900482177734375, -0.017913818359375, -0.01682281494140625, -0.0157318115234375, -0.01464080810546875, -0.0135498046875, -0.01245880126953125, -0.0113677978515625, -0.01027679443359375, -0.009185791015625, -0.00809478759765625, -0.0070037841796875, -0.00591278076171875, -0.00482177734375, -0.00373077392578125, -0.0026397705078125, -0.00154876708984375, -0.000457763671875, 0.00063323974609375, 0.0017242431640625, 0.00281524658203125, 0.00390625, 0.00499725341796875, 0.0060882568359375, 0.00717926025390625, 0.008270263671875, 0.00936126708984375, 0.0104522705078125, 0.01154327392578125, 0.01263427734375, 0.01372528076171875, 0.0148162841796875, 0.01590728759765625, 0.016998291015625, 0.01808929443359375, 0.0191802978515625, 0.02027130126953125, 0.0213623046875, 0.02245330810546875, 0.0235443115234375, 0.02463531494140625, 0.025726318359375, 0.02681732177734375, 0.0279083251953125, 0.02899932861328125, 0.03009033203125, 0.03118133544921875, 0.0322723388671875, 0.03336334228515625, 0.034454345703125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 0.0, 0.0, 6.0, 5.0, 6.0, 5.0, 11.0, 11.0, 15.0, 11.0, 20.0, 20.0, 21.0, 17.0, 28.0, 21.0, 32.0, 46.0, 31.0, 34.0, 35.0, 42.0, 45.0, 38.0, 33.0, 34.0, 44.0, 26.0, 31.0, 37.0, 44.0, 36.0, 18.0, 23.0, 28.0, 21.0, 22.0, 15.0, 10.0, 13.0, 14.0, 6.0, 10.0, 7.0, 13.0, 5.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.01025390625, -0.009952306747436523, -0.009650707244873047, -0.00934910774230957, -0.009047508239746094, -0.008745908737182617, -0.00844430923461914, -0.008142709732055664, -0.007841110229492188, -0.007539510726928711, -0.007237911224365234, -0.006936311721801758, -0.006634712219238281, -0.006333112716674805, -0.006031513214111328, -0.0057299137115478516, -0.005428314208984375, -0.0051267147064208984, -0.004825115203857422, -0.004523515701293945, -0.004221916198730469, -0.003920316696166992, -0.0036187171936035156, -0.003317117691040039, -0.0030155181884765625, -0.002713918685913086, -0.0024123191833496094, -0.002110719680786133, -0.0018091201782226562, -0.0015075206756591797, -0.0012059211730957031, -0.0009043216705322266, -0.00060272216796875, -0.00030112266540527344, 4.76837158203125e-07, 0.0003020763397216797, 0.0006036758422851562, 0.0009052753448486328, 0.0012068748474121094, 0.001508474349975586, 0.0018100738525390625, 0.002111673355102539, 0.0024132728576660156, 0.002714872360229492, 0.0030164718627929688, 0.0033180713653564453, 0.003619670867919922, 0.0039212703704833984, 0.004222869873046875, 0.0045244693756103516, 0.004826068878173828, 0.005127668380737305, 0.005429267883300781, 0.005730867385864258, 0.006032466888427734, 0.006334066390991211, 0.0066356658935546875, 0.006937265396118164, 0.007238864898681641, 0.007540464401245117, 0.007842063903808594, 0.00814366340637207, 0.008445262908935547, 0.008746862411499023, 0.0090484619140625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 17.0, 21.0, 12.0, 25.0, 47.0, 86.0, 104.0, 136.0, 170.0, 295.0, 385.0, 502.0, 710.0, 1052.0, 1524.0, 2326.0, 3524.0, 5437.0, 8889.0, 16142.0, 31441.0, 94911.0, 646754.0, 147859.0, 38726.0, 18671.0, 10512.0, 6264.0, 3878.0, 2552.0, 1669.0, 1243.0, 736.0, 513.0, 397.0, 288.0, 198.0, 136.0, 114.0, 87.0, 77.0, 40.0, 22.0, 19.0, 16.0, 13.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0016117095947265625, -0.0015607476234436035, -0.0015097856521606445, -0.0014588236808776855, -0.0014078617095947266, -0.0013568997383117676, -0.0013059377670288086, -0.0012549757957458496, -0.0012040138244628906, -0.0011530518531799316, -0.0011020898818969727, -0.0010511279106140137, -0.0010001659393310547, -0.0009492039680480957, -0.0008982419967651367, -0.0008472800254821777, -0.0007963180541992188, -0.0007453560829162598, -0.0006943941116333008, -0.0006434321403503418, -0.0005924701690673828, -0.0005415081977844238, -0.0004905462265014648, -0.00043958425521850586, -0.0003886222839355469, -0.0003376603126525879, -0.0002866983413696289, -0.00023573637008666992, -0.00018477439880371094, -0.00013381242752075195, -8.285045623779297e-05, -3.1888484954833984e-05, 1.9073486328125e-05, 7.003545761108398e-05, 0.00012099742889404297, 0.00017195940017700195, 0.00022292137145996094, 0.0002738833427429199, 0.0003248453140258789, 0.0003758072853088379, 0.0004267692565917969, 0.00047773122787475586, 0.0005286931991577148, 0.0005796551704406738, 0.0006306171417236328, 0.0006815791130065918, 0.0007325410842895508, 0.0007835030555725098, 0.0008344650268554688, 0.0008854269981384277, 0.0009363889694213867, 0.0009873509407043457, 0.0010383129119873047, 0.0010892748832702637, 0.0011402368545532227, 0.0011911988258361816, 0.0012421607971191406, 0.0012931227684020996, 0.0013440847396850586, 0.0013950467109680176, 0.0014460086822509766, 0.0014969706535339355, 0.0015479326248168945, 0.0015988945960998535, 0.0016498565673828125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 4.0, 7.0, 8.0, 9.0, 0.0, 16.0, 19.0, 44.0, 44.0, 81.0, 0.0, 87.0, 113.0, 101.0, 109.0, 82.0, 86.0, 0.0, 53.0, 47.0, 29.0, 26.0, 9.0, 0.0, 8.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6782432794570923e-06, -1.6279518604278564e-06, -1.5776604413986206e-06, -1.5273690223693848e-06, -1.477077603340149e-06, -1.426786184310913e-06, -1.3764947652816772e-06, -1.3262033462524414e-06, -1.2759119272232056e-06, -1.2256205081939697e-06, -1.1753290891647339e-06, -1.125037670135498e-06, -1.0747462511062622e-06, -1.0244548320770264e-06, -9.741634130477905e-07, -9.238719940185547e-07, -8.735805749893188e-07, -8.23289155960083e-07, -7.729977369308472e-07, -7.227063179016113e-07, -6.724148988723755e-07, -6.221234798431396e-07, -5.718320608139038e-07, -5.21540641784668e-07, -4.7124922275543213e-07, -4.209578037261963e-07, -3.7066638469696045e-07, -3.203749656677246e-07, -2.7008354663848877e-07, -2.1979212760925293e-07, -1.695007085800171e-07, -1.1920928955078125e-07, -6.891787052154541e-08, -1.862645149230957e-08, 3.166496753692627e-08, 8.195638656616211e-08, 1.3224780559539795e-07, 1.825392246246338e-07, 2.3283064365386963e-07, 2.8312206268310547e-07, 3.334134817123413e-07, 3.8370490074157715e-07, 4.33996319770813e-07, 4.842877388000488e-07, 5.345791578292847e-07, 5.848705768585205e-07, 6.351619958877563e-07, 6.854534149169922e-07, 7.35744833946228e-07, 7.860362529754639e-07, 8.363276720046997e-07, 8.866190910339355e-07, 9.369105100631714e-07, 9.872019290924072e-07, 1.037493348121643e-06, 1.087784767150879e-06, 1.1380761861801147e-06, 1.1883676052093506e-06, 1.2386590242385864e-06, 1.2889504432678223e-06, 1.339241862297058e-06, 1.389533281326294e-06, 1.4398247003555298e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 5.0, 8.0, 19.0, 20.0, 28.0, 36.0, 49.0, 61.0, 65.0, 126.0, 176.0, 256.0, 427.0, 815.0, 1523.0, 3033.0, 6672.0, 15951.0, 47077.0, 560020.0, 343535.0, 41588.0, 14705.0, 6197.0, 2785.0, 1397.0, 721.0, 397.0, 249.0, 154.0, 136.0, 63.0, 67.0, 48.0, 32.0, 25.0, 23.0, 21.0, 6.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0024852752685546875, -0.0024074912071228027, -0.002329707145690918, -0.002251923084259033, -0.0021741390228271484, -0.0020963549613952637, -0.002018570899963379, -0.0019407868385314941, -0.0018630027770996094, -0.0017852187156677246, -0.0017074346542358398, -0.001629650592803955, -0.0015518665313720703, -0.0014740824699401855, -0.0013962984085083008, -0.001318514347076416, -0.0012407302856445312, -0.0011629462242126465, -0.0010851621627807617, -0.001007378101348877, -0.0009295940399169922, -0.0008518099784851074, -0.0007740259170532227, -0.0006962418556213379, -0.0006184577941894531, -0.0005406737327575684, -0.0004628896713256836, -0.00038510560989379883, -0.00030732154846191406, -0.0002295374870300293, -0.00015175342559814453, -7.396936416625977e-05, 3.814697265625e-06, 8.159875869750977e-05, 0.00015938282012939453, 0.0002371668815612793, 0.00031495094299316406, 0.00039273500442504883, 0.0004705190658569336, 0.0005483031272888184, 0.0006260871887207031, 0.0007038712501525879, 0.0007816553115844727, 0.0008594393730163574, 0.0009372234344482422, 0.001015007495880127, 0.0010927915573120117, 0.0011705756187438965, 0.0012483596801757812, 0.001326143741607666, 0.0014039278030395508, 0.0014817118644714355, 0.0015594959259033203, 0.001637279987335205, 0.0017150640487670898, 0.0017928481101989746, 0.0018706321716308594, 0.0019484162330627441, 0.002026200294494629, 0.0021039843559265137, 0.0021817684173583984, 0.002259552478790283, 0.002337336540222168, 0.0024151206016540527, 0.0024929046630859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 7.0, 6.0, 9.0, 16.0, 10.0, 28.0, 38.0, 39.0, 92.0, 210.0, 312.0, 99.0, 39.0, 23.0, 23.0, 17.0, 13.0, 6.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00070953369140625, -0.000687427818775177, -0.000665321946144104, -0.000643216073513031, -0.000621110200881958, -0.000599004328250885, -0.000576898455619812, -0.000554792582988739, -0.000532686710357666, -0.000510580837726593, -0.00048847496509552, -0.000466369092464447, -0.000444263219833374, -0.000422157347202301, -0.00040005147457122803, -0.00037794560194015503, -0.00035583972930908203, -0.00033373385667800903, -0.00031162798404693604, -0.00028952211141586304, -0.00026741623878479004, -0.00024531036615371704, -0.00022320449352264404, -0.00020109862089157104, -0.00017899274826049805, -0.00015688687562942505, -0.00013478100299835205, -0.00011267513036727905, -9.056925773620605e-05, -6.846338510513306e-05, -4.635751247406006e-05, -2.425163984298706e-05, -2.1457672119140625e-06, 1.9960105419158936e-05, 4.2065978050231934e-05, 6.417185068130493e-05, 8.627772331237793e-05, 0.00010838359594345093, 0.00013048946857452393, 0.00015259534120559692, 0.00017470121383666992, 0.00019680708646774292, 0.00021891295909881592, 0.00024101883172988892, 0.0002631247043609619, 0.0002852305769920349, 0.0003073364496231079, 0.0003294423222541809, 0.0003515481948852539, 0.0003736540675163269, 0.0003957599401473999, 0.0004178658127784729, 0.0004399716854095459, 0.0004620775580406189, 0.0004841834306716919, 0.0005062893033027649, 0.0005283951759338379, 0.0005505010485649109, 0.0005726069211959839, 0.0005947127938270569, 0.0006168186664581299, 0.0006389245390892029, 0.0006610304117202759, 0.0006831362843513489, 0.0007052421569824219]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 17.0, 14.0, 30.0, 19.0, 35.0, 40.0, 53.0, 64.0, 56.0, 93.0, 107.0, 84.0, 77.0, 59.0, 54.0, 35.0, 31.0, 16.0, 18.0, 9.0, 6.0, 10.0, 8.0, 5.0, 5.0, 6.0, 0.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.01990484818816185, -0.019156500697135925, -0.01840815506875515, -0.017659807577729225, -0.01691146194934845, -0.016163114458322525, -0.01541476882994175, -0.014666421338915825, -0.01391807571053505, -0.0131697291508317, -0.01242138259112835, -0.011673036031425, -0.01092468947172165, -0.010176342912018299, -0.009427996352314949, -0.008679648861289024, -0.007931302301585674, -0.007182955741882324, -0.006434609182178974, -0.005686262622475624, -0.004937916062772274, -0.004189569503068924, -0.0034412224777042866, -0.0026928759180009365, -0.0019445293582975864, -0.0011961827985942364, -0.0004478361224755645, 0.0003005105536431074, 0.0010488571133464575, 0.0017972036730498075, 0.0025455504655838013, 0.0032938970252871513, 0.004042243584990501, 0.0047905901446938515, 0.0055389367043972015, 0.006287283264100552, 0.007035629823803902, 0.007783976383507252, 0.008532322943210602, 0.009280670434236526, 0.010029016062617302, 0.010777362622320652, 0.011525709182024002, 0.012274055741727352, 0.013022402301430702, 0.013770748861134052, 0.014519095420837402, 0.015267442911863327, 0.01601579040288925, 0.016764137893915176, 0.017512483522295952, 0.018260831013321877, 0.019009176641702652, 0.019757524132728577, 0.020505869761109352, 0.021254217252135277, 0.022002562880516052, 0.022750910371541977, 0.023499255999922752, 0.024247603490948677, 0.024995949119329453, 0.025744296610355377, 0.026492642238736153, 0.027240989729762077, 0.027989335358142853]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 5.0, 9.0, 16.0, 9.0, 9.0, 16.0, 13.0, 20.0, 22.0, 23.0, 25.0, 21.0, 32.0, 36.0, 32.0, 35.0, 37.0, 44.0, 50.0, 45.0, 41.0, 45.0, 46.0, 39.0, 30.0, 34.0, 29.0, 32.0, 18.0, 20.0, 31.0, 21.0, 20.0, 17.0, 16.0, 8.0, 10.0, 7.0, 11.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01770825870335102, -0.01717531494796276, -0.01664237305521965, -0.01610942929983139, -0.01557648554444313, -0.015043542720377445, -0.01451059989631176, -0.0139776561409235, -0.013444713316857815, -0.01291177049279213, -0.01237882673740387, -0.011845883913338184, -0.011312941089272499, -0.01077999733388424, -0.010247054509818554, -0.009714111685752869, -0.009181167930364609, -0.008648225106298923, -0.008115281350910664, -0.007582338526844978, -0.007049395237118006, -0.006516451947391033, -0.005983509123325348, -0.005450565833598375, -0.004917622543871403, -0.00438467925414443, -0.0038517361972481012, -0.0033187931403517723, -0.0027858498506247997, -0.002252906560897827, -0.0017199635040014982, -0.0011870204471051693, -0.000654079020023346, -0.0001211358467116952, 0.00041180732659995556, 0.0009447504999116063, 0.001477693673223257, 0.0020106369629502296, 0.0025435800198465586, 0.0030765230767428875, 0.00360946636646986, 0.004142409656196833, 0.004675352945923805, 0.0052082957699894905, 0.005741239059716463, 0.006274182349443436, 0.006807125173509121, 0.0073400684632360935, 0.007873011752963066, 0.008405954577028751, 0.008938898332417011, 0.009471841156482697, 0.010004784911870956, 0.010537727735936642, 0.011070670560002327, 0.011603614315390587, 0.012136557139456272, 0.012669499963521957, 0.013202443718910217, 0.013735386542975903, 0.014268329367041588, 0.014801273122429848, 0.015334215946495533, 0.015867158770561218, 0.016400102525949478]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 13.0, 7.0, 17.0, 41.0, 54.0, 80.0, 127.0, 155.0, 237.0, 339.0, 532.0, 808.0, 1094.0, 1585.0, 2230.0, 3312.0, 4899.0, 6978.0, 10625.0, 16311.0, 25687.0, 41479.0, 70077.0, 127631.0, 268566.0, 859368.0, 1671560.0, 597862.0, 214078.0, 108291.0, 61075.0, 36440.0, 22393.0, 13990.0, 8919.0, 5773.0, 3846.0, 2512.0, 1661.0, 1103.0, 791.0, 518.0, 372.0, 235.0, 206.0, 124.0, 78.0, 72.0, 44.0, 31.0, 23.0, 18.0, 8.0, 7.0, 4.0, 4.0, 2.0], "bins": [-0.0218658447265625, -0.021210432052612305, -0.02055501937866211, -0.019899606704711914, -0.01924419403076172, -0.018588781356811523, -0.017933368682861328, -0.017277956008911133, -0.016622543334960938, -0.015967130661010742, -0.015311717987060547, -0.014656305313110352, -0.014000892639160156, -0.013345479965209961, -0.012690067291259766, -0.01203465461730957, -0.011379241943359375, -0.01072382926940918, -0.010068416595458984, -0.009413003921508789, -0.008757591247558594, -0.008102178573608398, -0.007446765899658203, -0.006791353225708008, -0.0061359405517578125, -0.005480527877807617, -0.004825115203857422, -0.0041697025299072266, -0.0035142898559570312, -0.002858877182006836, -0.0022034645080566406, -0.0015480518341064453, -0.00089263916015625, -0.0002372264862060547, 0.0004181861877441406, 0.001073598861694336, 0.0017290115356445312, 0.0023844242095947266, 0.003039836883544922, 0.003695249557495117, 0.0043506622314453125, 0.005006074905395508, 0.005661487579345703, 0.0063169002532958984, 0.006972312927246094, 0.007627725601196289, 0.008283138275146484, 0.00893855094909668, 0.009593963623046875, 0.01024937629699707, 0.010904788970947266, 0.011560201644897461, 0.012215614318847656, 0.012871026992797852, 0.013526439666748047, 0.014181852340698242, 0.014837265014648438, 0.015492677688598633, 0.016148090362548828, 0.016803503036499023, 0.01745891571044922, 0.018114328384399414, 0.01876974105834961, 0.019425153732299805, 0.02008056640625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 4.0, 10.0, 9.0, 24.0, 15.0, 19.0, 25.0, 24.0, 27.0, 28.0, 31.0, 35.0, 23.0, 48.0, 46.0, 56.0, 43.0, 47.0, 45.0, 46.0, 44.0, 35.0, 29.0, 37.0, 32.0, 29.0, 22.0, 32.0, 18.0, 15.0, 15.0, 14.0, 12.0, 14.0, 10.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01117706298828125, -0.01085364818572998, -0.010530233383178711, -0.010206818580627441, -0.009883403778076172, -0.009559988975524902, -0.009236574172973633, -0.008913159370422363, -0.008589744567871094, -0.008266329765319824, -0.007942914962768555, -0.007619500160217285, -0.007296085357666016, -0.006972670555114746, -0.0066492557525634766, -0.006325840950012207, -0.0060024261474609375, -0.005679011344909668, -0.0053555965423583984, -0.005032181739807129, -0.004708766937255859, -0.00438535213470459, -0.00406193733215332, -0.0037385225296020508, -0.0034151077270507812, -0.0030916929244995117, -0.002768278121948242, -0.0024448633193969727, -0.002121448516845703, -0.0017980337142944336, -0.001474618911743164, -0.0011512041091918945, -0.000827789306640625, -0.0005043745040893555, -0.00018095970153808594, 0.0001424551010131836, 0.0004658699035644531, 0.0007892847061157227, 0.0011126995086669922, 0.0014361143112182617, 0.0017595291137695312, 0.0020829439163208008, 0.0024063587188720703, 0.00272977352142334, 0.0030531883239746094, 0.003376603126525879, 0.0037000179290771484, 0.004023432731628418, 0.0043468475341796875, 0.004670262336730957, 0.0049936771392822266, 0.005317091941833496, 0.005640506744384766, 0.005963921546936035, 0.006287336349487305, 0.006610751152038574, 0.006934165954589844, 0.007257580757141113, 0.007580995559692383, 0.007904410362243652, 0.008227825164794922, 0.008551239967346191, 0.008874654769897461, 0.00919806957244873, 0.009521484375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 12.0, 14.0, 38.0, 41.0, 88.0, 97.0, 172.0, 283.0, 434.0, 677.0, 1118.0, 1755.0, 2672.0, 4523.0, 7521.0, 12302.0, 21185.0, 37481.0, 68298.0, 132644.0, 274632.0, 657691.0, 1602754.0, 749693.0, 302980.0, 144227.0, 74246.0, 40376.0, 22698.0, 12954.0, 7941.0, 4764.0, 2989.0, 1825.0, 1129.0, 729.0, 471.0, 296.0, 208.0, 102.0, 76.0, 56.0, 25.0, 19.0, 16.0, 12.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0173492431640625, -0.01678156852722168, -0.01621389389038086, -0.01564621925354004, -0.015078544616699219, -0.014510869979858398, -0.013943195343017578, -0.013375520706176758, -0.012807846069335938, -0.012240171432495117, -0.011672496795654297, -0.011104822158813477, -0.010537147521972656, -0.009969472885131836, -0.009401798248291016, -0.008834123611450195, -0.008266448974609375, -0.007698774337768555, -0.007131099700927734, -0.006563425064086914, -0.005995750427246094, -0.0054280757904052734, -0.004860401153564453, -0.004292726516723633, -0.0037250518798828125, -0.003157377243041992, -0.002589702606201172, -0.0020220279693603516, -0.0014543533325195312, -0.0008866786956787109, -0.0003190040588378906, 0.0002486705780029297, 0.00081634521484375, 0.0013840198516845703, 0.0019516944885253906, 0.002519369125366211, 0.0030870437622070312, 0.0036547183990478516, 0.004222393035888672, 0.004790067672729492, 0.0053577423095703125, 0.005925416946411133, 0.006493091583251953, 0.0070607662200927734, 0.007628440856933594, 0.008196115493774414, 0.008763790130615234, 0.009331464767456055, 0.009899139404296875, 0.010466814041137695, 0.011034488677978516, 0.011602163314819336, 0.012169837951660156, 0.012737512588500977, 0.013305187225341797, 0.013872861862182617, 0.014440536499023438, 0.015008211135864258, 0.015575885772705078, 0.0161435604095459, 0.01671123504638672, 0.01727890968322754, 0.01784658432006836, 0.01841425895690918, 0.01898193359375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 5.0, 6.0, 13.0, 12.0, 17.0, 17.0, 22.0, 21.0, 34.0, 40.0, 47.0, 54.0, 79.0, 92.0, 95.0, 135.0, 149.0, 181.0, 212.0, 221.0, 273.0, 304.0, 319.0, 276.0, 218.0, 189.0, 177.0, 152.0, 131.0, 119.0, 79.0, 65.0, 61.0, 47.0, 44.0, 39.0, 31.0, 23.0, 11.0, 19.0, 12.0, 9.0, 4.0, 8.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00568389892578125, -0.005521237850189209, -0.005358576774597168, -0.005195915699005127, -0.005033254623413086, -0.004870593547821045, -0.004707932472229004, -0.004545271396636963, -0.004382610321044922, -0.004219949245452881, -0.00405728816986084, -0.003894627094268799, -0.003731966018676758, -0.003569304943084717, -0.0034066438674926758, -0.0032439827919006348, -0.0030813217163085938, -0.0029186606407165527, -0.0027559995651245117, -0.0025933384895324707, -0.0024306774139404297, -0.0022680163383483887, -0.0021053552627563477, -0.0019426941871643066, -0.0017800331115722656, -0.0016173720359802246, -0.0014547109603881836, -0.0012920498847961426, -0.0011293888092041016, -0.0009667277336120605, -0.0008040666580200195, -0.0006414055824279785, -0.0004787445068359375, -0.0003160834312438965, -0.00015342235565185547, 9.238719940185547e-06, 0.00017189979553222656, 0.0003345608711242676, 0.0004972219467163086, 0.0006598830223083496, 0.0008225440979003906, 0.0009852051734924316, 0.0011478662490844727, 0.0013105273246765137, 0.0014731884002685547, 0.0016358494758605957, 0.0017985105514526367, 0.0019611716270446777, 0.0021238327026367188, 0.0022864937782287598, 0.0024491548538208008, 0.002611815929412842, 0.002774477005004883, 0.002937138080596924, 0.003099799156188965, 0.003262460231781006, 0.003425121307373047, 0.003587782382965088, 0.003750443458557129, 0.00391310453414917, 0.004075765609741211, 0.004238426685333252, 0.004401087760925293, 0.004563748836517334, 0.004726409912109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 7.0, 4.0, 7.0, 19.0, 19.0, 26.0, 30.0, 36.0, 39.0, 53.0, 67.0, 71.0, 93.0, 81.0, 98.0, 58.0, 66.0, 36.0, 43.0, 19.0, 25.0, 23.0, 10.0, 10.0, 11.0, 9.0, 7.0, 7.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.011549476534128189, -0.011093901470303535, -0.010638326406478882, -0.010182751342654228, -0.009727176278829575, -0.009271601215004921, -0.008816026151180267, -0.008360451087355614, -0.00790487602353096, -0.0074493009597063065, -0.006993725895881653, -0.006538150832056999, -0.006082575768232346, -0.005627000704407692, -0.005171425640583038, -0.004715850576758385, -0.004260275512933731, -0.0038047004491090775, -0.003349125385284424, -0.00289355032145977, -0.0024379752576351166, -0.001982400193810463, -0.0015268251299858093, -0.0010712500661611557, -0.0006156750023365021, -0.00016009993851184845, 0.0002954751253128052, 0.0007510501891374588, 0.0012066252529621124, 0.001662200316786766, 0.0021177753806114197, 0.0025733504444360733, 0.003028925508260727, 0.0034845005720853806, 0.003940075635910034, 0.004395650699734688, 0.004851225763559341, 0.005306800827383995, 0.005762375891208649, 0.006217950955033302, 0.006673526018857956, 0.0071291010826826096, 0.007584676146507263, 0.008040251210331917, 0.00849582627415657, 0.008951401337981224, 0.009406976401805878, 0.009862551465630531, 0.010318126529455185, 0.010773701593279839, 0.011229276657104492, 0.011684851720929146, 0.0121404267847538, 0.012596001848578453, 0.013051576912403107, 0.01350715197622776, 0.013962727040052414, 0.014418302103877068, 0.014873877167701721, 0.015329452231526375, 0.01578502729535103, 0.016240602359175682, 0.016696177423000336, 0.01715175248682499, 0.017607327550649643]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 9.0, 9.0, 14.0, 14.0, 20.0, 21.0, 29.0, 36.0, 20.0, 29.0, 30.0, 41.0, 43.0, 40.0, 39.0, 40.0, 40.0, 41.0, 42.0, 42.0, 47.0, 44.0, 37.0, 34.0, 31.0, 24.0, 26.0, 26.0, 18.0, 14.0, 9.0, 17.0, 7.0, 7.0, 4.0, 5.0, 11.0, 5.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.011295566335320473, -0.010952138341963291, -0.01060871034860611, -0.010265281423926353, -0.009921853430569172, -0.00957842543721199, -0.009234997443854809, -0.008891569450497627, -0.008548140525817871, -0.00820471253246069, -0.007861284539103508, -0.007517856080085039, -0.00717442762106657, -0.006830999627709389, -0.006487571634352207, -0.006144143640995026, -0.005800715647637844, -0.0054572876542806625, -0.005113859195262194, -0.004770431201905012, -0.004427002742886543, -0.004083574749529362, -0.00374014675617218, -0.003396718529984355, -0.0030532903037965298, -0.0027098620776087046, -0.0023664338514208794, -0.002023005858063698, -0.0016795776318758726, -0.0013361494056880474, -0.0009927214123308659, -0.0006492931861430407, -0.00030586402863264084, 3.756413934752345e-05, 0.00038099230732768774, 0.0007244204171001911, 0.0010678486432880163, 0.0014112768694758415, 0.001754704862833023, 0.0020981330890208483, 0.0024415613152086735, 0.0027849895413964987, 0.003128417767584324, 0.0034718457609415054, 0.0038152739871293306, 0.004158702213317156, 0.004502130206674337, 0.004845558665692806, 0.005188986659049988, 0.005532414652407169, 0.005875843111425638, 0.00621927110478282, 0.006562699563801289, 0.00690612755715847, 0.007249555550515652, 0.007592983543872833, 0.00793641246855259, 0.008279840461909771, 0.008623268455266953, 0.008966697379946709, 0.00931012537330389, 0.009653553366661072, 0.009996981360018253, 0.010340409353375435, 0.010683837346732616]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 9.0, 12.0, 21.0, 39.0, 30.0, 55.0, 91.0, 157.0, 203.0, 328.0, 506.0, 850.0, 1223.0, 2197.0, 3529.0, 6041.0, 10532.0, 19522.0, 36925.0, 75365.0, 190286.0, 426244.0, 142630.0, 61724.0, 30884.0, 16574.0, 9119.0, 5373.0, 3080.0, 1873.0, 1100.0, 729.0, 437.0, 287.0, 192.0, 132.0, 75.0, 52.0, 29.0, 29.0, 15.0, 10.0, 17.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01313018798828125, -0.012697815895080566, -0.012265443801879883, -0.0118330717086792, -0.011400699615478516, -0.010968327522277832, -0.010535955429077148, -0.010103583335876465, -0.009671211242675781, -0.009238839149475098, -0.008806467056274414, -0.00837409496307373, -0.007941722869873047, -0.007509350776672363, -0.00707697868347168, -0.006644606590270996, -0.0062122344970703125, -0.005779862403869629, -0.005347490310668945, -0.004915118217468262, -0.004482746124267578, -0.0040503740310668945, -0.003618001937866211, -0.0031856298446655273, -0.0027532577514648438, -0.00232088565826416, -0.0018885135650634766, -0.001456141471862793, -0.0010237693786621094, -0.0005913972854614258, -0.0001590251922607422, 0.0002733469009399414, 0.000705718994140625, 0.0011380910873413086, 0.0015704631805419922, 0.0020028352737426758, 0.0024352073669433594, 0.002867579460144043, 0.0032999515533447266, 0.00373232364654541, 0.004164695739746094, 0.004597067832946777, 0.005029439926147461, 0.0054618120193481445, 0.005894184112548828, 0.006326556205749512, 0.006758928298950195, 0.007191300392150879, 0.0076236724853515625, 0.008056044578552246, 0.00848841667175293, 0.008920788764953613, 0.009353160858154297, 0.00978553295135498, 0.010217905044555664, 0.010650277137756348, 0.011082649230957031, 0.011515021324157715, 0.011947393417358398, 0.012379765510559082, 0.012812137603759766, 0.01324450969696045, 0.013676881790161133, 0.014109253883361816, 0.0145416259765625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 7.0, 7.0, 6.0, 12.0, 14.0, 12.0, 16.0, 19.0, 32.0, 29.0, 28.0, 23.0, 33.0, 47.0, 38.0, 41.0, 49.0, 35.0, 33.0, 45.0, 60.0, 42.0, 51.0, 48.0, 30.0, 29.0, 35.0, 33.0, 26.0, 13.0, 17.0, 20.0, 18.0, 6.0, 3.0, 9.0, 9.0, 3.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01242828369140625, -0.012061476707458496, -0.011694669723510742, -0.011327862739562988, -0.010961055755615234, -0.01059424877166748, -0.010227441787719727, -0.009860634803771973, -0.009493827819824219, -0.009127020835876465, -0.008760213851928711, -0.008393406867980957, -0.008026599884033203, -0.007659792900085449, -0.007292985916137695, -0.006926178932189941, -0.0065593719482421875, -0.006192564964294434, -0.00582575798034668, -0.005458950996398926, -0.005092144012451172, -0.004725337028503418, -0.004358530044555664, -0.00399172306060791, -0.0036249160766601562, -0.0032581090927124023, -0.0028913021087646484, -0.0025244951248168945, -0.0021576881408691406, -0.0017908811569213867, -0.0014240741729736328, -0.001057267189025879, -0.000690460205078125, -0.0003236532211303711, 4.315376281738281e-05, 0.0004099607467651367, 0.0007767677307128906, 0.0011435747146606445, 0.0015103816986083984, 0.0018771886825561523, 0.0022439956665039062, 0.00261080265045166, 0.002977609634399414, 0.003344416618347168, 0.003711223602294922, 0.004078030586242676, 0.00444483757019043, 0.004811644554138184, 0.0051784515380859375, 0.005545258522033691, 0.005912065505981445, 0.006278872489929199, 0.006645679473876953, 0.007012486457824707, 0.007379293441772461, 0.007746100425720215, 0.008112907409667969, 0.008479714393615723, 0.008846521377563477, 0.00921332836151123, 0.009580135345458984, 0.009946942329406738, 0.010313749313354492, 0.010680556297302246, 0.01104736328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 20.0, 24.0, 22.0, 41.0, 52.0, 82.0, 119.0, 165.0, 220.0, 336.0, 499.0, 693.0, 875.0, 1292.0, 1834.0, 2600.0, 3986.0, 6360.0, 10547.0, 19907.0, 44047.0, 198491.0, 617155.0, 74113.0, 27684.0, 14096.0, 7996.0, 4960.0, 3126.0, 2121.0, 1469.0, 1032.0, 770.0, 518.0, 372.0, 257.0, 212.0, 134.0, 98.0, 53.0, 61.0, 43.0, 23.0, 16.0, 4.0, 8.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0189666748046875, -0.01839590072631836, -0.01782512664794922, -0.017254352569580078, -0.016683578491210938, -0.016112804412841797, -0.015542030334472656, -0.014971256256103516, -0.014400482177734375, -0.013829708099365234, -0.013258934020996094, -0.012688159942626953, -0.012117385864257812, -0.011546611785888672, -0.010975837707519531, -0.01040506362915039, -0.00983428955078125, -0.00926351547241211, -0.008692741394042969, -0.008121967315673828, -0.0075511932373046875, -0.006980419158935547, -0.006409645080566406, -0.005838871002197266, -0.005268096923828125, -0.004697322845458984, -0.004126548767089844, -0.003555774688720703, -0.0029850006103515625, -0.002414226531982422, -0.0018434524536132812, -0.0012726783752441406, -0.000701904296875, -0.00013113021850585938, 0.00043964385986328125, 0.0010104179382324219, 0.0015811920166015625, 0.002151966094970703, 0.0027227401733398438, 0.0032935142517089844, 0.003864288330078125, 0.004435062408447266, 0.005005836486816406, 0.005576610565185547, 0.0061473846435546875, 0.006718158721923828, 0.007288932800292969, 0.00785970687866211, 0.00843048095703125, 0.00900125503540039, 0.009572029113769531, 0.010142803192138672, 0.010713577270507812, 0.011284351348876953, 0.011855125427246094, 0.012425899505615234, 0.012996673583984375, 0.013567447662353516, 0.014138221740722656, 0.014708995819091797, 0.015279769897460938, 0.015850543975830078, 0.01642131805419922, 0.01699209213256836, 0.0175628662109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 3.0, 7.0, 12.0, 11.0, 10.0, 22.0, 20.0, 18.0, 24.0, 31.0, 28.0, 35.0, 29.0, 33.0, 30.0, 49.0, 49.0, 54.0, 46.0, 37.0, 44.0, 46.0, 42.0, 45.0, 32.0, 45.0, 35.0, 24.0, 27.0, 21.0, 20.0, 13.0, 7.0, 11.0, 7.0, 10.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00865936279296875, -0.008424758911132812, -0.008190155029296875, -0.007955551147460938, -0.007720947265625, -0.0074863433837890625, -0.007251739501953125, -0.0070171356201171875, -0.00678253173828125, -0.0065479278564453125, -0.006313323974609375, -0.0060787200927734375, -0.0058441162109375, -0.0056095123291015625, -0.005374908447265625, -0.0051403045654296875, -0.00490570068359375, -0.0046710968017578125, -0.004436492919921875, -0.0042018890380859375, -0.00396728515625, -0.0037326812744140625, -0.003498077392578125, -0.0032634735107421875, -0.00302886962890625, -0.0027942657470703125, -0.002559661865234375, -0.0023250579833984375, -0.0020904541015625, -0.0018558502197265625, -0.001621246337890625, -0.0013866424560546875, -0.00115203857421875, -0.0009174346923828125, -0.000682830810546875, -0.0004482269287109375, -0.000213623046875, 2.09808349609375e-05, 0.000255584716796875, 0.0004901885986328125, 0.00072479248046875, 0.0009593963623046875, 0.001194000244140625, 0.0014286041259765625, 0.0016632080078125, 0.0018978118896484375, 0.002132415771484375, 0.0023670196533203125, 0.00260162353515625, 0.0028362274169921875, 0.003070831298828125, 0.0033054351806640625, 0.0035400390625, 0.0037746429443359375, 0.004009246826171875, 0.0042438507080078125, 0.00447845458984375, 0.0047130584716796875, 0.004947662353515625, 0.0051822662353515625, 0.0054168701171875, 0.0056514739990234375, 0.005886077880859375, 0.0061206817626953125, 0.00635528564453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 13.0, 21.0, 25.0, 26.0, 40.0, 51.0, 66.0, 116.0, 180.0, 202.0, 325.0, 432.0, 704.0, 947.0, 1538.0, 2317.0, 3660.0, 6328.0, 11555.0, 24607.0, 73559.0, 709557.0, 142382.0, 34571.0, 15142.0, 7754.0, 4383.0, 2717.0, 1733.0, 1112.0, 809.0, 476.0, 357.0, 258.0, 180.0, 132.0, 79.0, 48.0, 50.0, 26.0, 17.0, 16.0, 16.0, 11.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0021533966064453125, -0.00208321213722229, -0.0020130276679992676, -0.0019428431987762451, -0.0018726587295532227, -0.0018024742603302002, -0.0017322897911071777, -0.0016621053218841553, -0.0015919208526611328, -0.0015217363834381104, -0.0014515519142150879, -0.0013813674449920654, -0.001311182975769043, -0.0012409985065460205, -0.001170814037322998, -0.0011006295680999756, -0.0010304450988769531, -0.0009602606296539307, -0.0008900761604309082, -0.0008198916912078857, -0.0007497072219848633, -0.0006795227527618408, -0.0006093382835388184, -0.0005391538143157959, -0.00046896934509277344, -0.000398784875869751, -0.0003286004066467285, -0.00025841593742370605, -0.0001882314682006836, -0.00011804699897766113, -4.786252975463867e-05, 2.232193946838379e-05, 9.250640869140625e-05, 0.0001626908779144287, 0.00023287534713745117, 0.00030305981636047363, 0.0003732442855834961, 0.00044342875480651855, 0.000513613224029541, 0.0005837976932525635, 0.0006539821624755859, 0.0007241666316986084, 0.0007943511009216309, 0.0008645355701446533, 0.0009347200393676758, 0.0010049045085906982, 0.0010750889778137207, 0.0011452734470367432, 0.0012154579162597656, 0.001285642385482788, 0.0013558268547058105, 0.001426011323928833, 0.0014961957931518555, 0.001566380262374878, 0.0016365647315979004, 0.0017067492008209229, 0.0017769336700439453, 0.0018471181392669678, 0.0019173026084899902, 0.0019874870777130127, 0.002057671546936035, 0.0021278560161590576, 0.00219804048538208, 0.0022682249546051025, 0.002338409423828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 8.0, 6.0, 6.0, 18.0, 14.0, 14.0, 30.0, 26.0, 38.0, 58.0, 0.0, 60.0, 81.0, 74.0, 80.0, 74.0, 70.0, 72.0, 51.0, 47.0, 44.0, 23.0, 24.0, 15.0, 8.0, 13.0, 0.0, 8.0, 8.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.911073923110962e-06, -1.8551945686340332e-06, -1.7993152141571045e-06, -1.7434358596801758e-06, -1.687556505203247e-06, -1.6316771507263184e-06, -1.5757977962493896e-06, -1.519918441772461e-06, -1.4640390872955322e-06, -1.4081597328186035e-06, -1.3522803783416748e-06, -1.296401023864746e-06, -1.2405216693878174e-06, -1.1846423149108887e-06, -1.12876296043396e-06, -1.0728836059570312e-06, -1.0170042514801025e-06, -9.611248970031738e-07, -9.052455425262451e-07, -8.493661880493164e-07, -7.934868335723877e-07, -7.37607479095459e-07, -6.817281246185303e-07, -6.258487701416016e-07, -5.699694156646729e-07, -5.140900611877441e-07, -4.5821070671081543e-07, -4.023313522338867e-07, -3.46451997756958e-07, -2.905726432800293e-07, -2.3469328880310059e-07, -1.7881393432617188e-07, -1.2293457984924316e-07, -6.705522537231445e-08, -1.1175870895385742e-08, 4.470348358154297e-08, 1.0058283805847168e-07, 1.564621925354004e-07, 2.123415470123291e-07, 2.682209014892578e-07, 3.241002559661865e-07, 3.7997961044311523e-07, 4.3585896492004395e-07, 4.917383193969727e-07, 5.476176738739014e-07, 6.034970283508301e-07, 6.593763828277588e-07, 7.152557373046875e-07, 7.711350917816162e-07, 8.270144462585449e-07, 8.828938007354736e-07, 9.387731552124023e-07, 9.94652509689331e-07, 1.0505318641662598e-06, 1.1064112186431885e-06, 1.1622905731201172e-06, 1.218169927597046e-06, 1.2740492820739746e-06, 1.3299286365509033e-06, 1.385807991027832e-06, 1.4416873455047607e-06, 1.4975666999816895e-06, 1.5534460544586182e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 13.0, 11.0, 15.0, 31.0, 60.0, 76.0, 114.0, 184.0, 266.0, 463.0, 766.0, 1361.0, 2384.0, 4498.0, 9019.0, 19659.0, 45809.0, 123637.0, 523632.0, 199403.0, 65425.0, 26528.0, 12188.0, 5869.0, 3044.0, 1750.0, 920.0, 526.0, 322.0, 208.0, 125.0, 61.0, 59.0, 38.0, 24.0, 24.0, 11.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00283050537109375, -0.0027512013912200928, -0.0026718974113464355, -0.0025925934314727783, -0.002513289451599121, -0.002433985471725464, -0.0023546814918518066, -0.0022753775119781494, -0.002196073532104492, -0.002116769552230835, -0.0020374655723571777, -0.0019581615924835205, -0.0018788576126098633, -0.001799553632736206, -0.0017202496528625488, -0.0016409456729888916, -0.0015616416931152344, -0.0014823377132415771, -0.00140303373336792, -0.0013237297534942627, -0.0012444257736206055, -0.0011651217937469482, -0.001085817813873291, -0.0010065138339996338, -0.0009272098541259766, -0.0008479058742523193, -0.0007686018943786621, -0.0006892979145050049, -0.0006099939346313477, -0.0005306899547576904, -0.0004513859748840332, -0.000372081995010376, -0.00029277801513671875, -0.00021347403526306152, -0.0001341700553894043, -5.486607551574707e-05, 2.4437904357910156e-05, 0.00010374188423156738, 0.0001830458641052246, 0.00026234984397888184, 0.00034165382385253906, 0.0004209578037261963, 0.0005002617835998535, 0.0005795657634735107, 0.000658869743347168, 0.0007381737232208252, 0.0008174777030944824, 0.0008967816829681396, 0.0009760856628417969, 0.001055389642715454, 0.0011346936225891113, 0.0012139976024627686, 0.0012933015823364258, 0.001372605562210083, 0.0014519095420837402, 0.0015312135219573975, 0.0016105175018310547, 0.001689821481704712, 0.0017691254615783691, 0.0018484294414520264, 0.0019277334213256836, 0.002007037401199341, 0.002086341381072998, 0.0021656453609466553, 0.0022449493408203125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 7.0, 4.0, 8.0, 7.0, 18.0, 23.0, 18.0, 33.0, 27.0, 38.0, 42.0, 47.0, 69.0, 107.0, 111.0, 68.0, 75.0, 57.0, 32.0, 30.0, 26.0, 36.0, 17.0, 15.0, 16.0, 7.0, 8.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.00069427490234375, -0.0006765797734260559, -0.0006588846445083618, -0.0006411895155906677, -0.0006234943866729736, -0.0006057992577552795, -0.0005881041288375854, -0.0005704089999198914, -0.0005527138710021973, -0.0005350187420845032, -0.0005173236131668091, -0.000499628484249115, -0.0004819333553314209, -0.0004642382264137268, -0.0004465430974960327, -0.0004288479685783386, -0.00041115283966064453, -0.00039345771074295044, -0.00037576258182525635, -0.00035806745290756226, -0.00034037232398986816, -0.00032267719507217407, -0.00030498206615448, -0.0002872869372367859, -0.0002695918083190918, -0.0002518966794013977, -0.0002342015504837036, -0.00021650642156600952, -0.00019881129264831543, -0.00018111616373062134, -0.00016342103481292725, -0.00014572590589523315, -0.00012803077697753906, -0.00011033564805984497, -9.264051914215088e-05, -7.494539022445679e-05, -5.7250261306762695e-05, -3.9555132389068604e-05, -2.1860003471374512e-05, -4.16487455368042e-06, 1.3530254364013672e-05, 3.1225383281707764e-05, 4.8920512199401855e-05, 6.661564111709595e-05, 8.431077003479004e-05, 0.00010200589895248413, 0.00011970102787017822, 0.00013739615678787231, 0.0001550912857055664, 0.0001727864146232605, 0.0001904815435409546, 0.00020817667245864868, 0.00022587180137634277, 0.00024356693029403687, 0.00026126205921173096, 0.00027895718812942505, 0.00029665231704711914, 0.00031434744596481323, 0.0003320425748825073, 0.0003497377038002014, 0.0003674328327178955, 0.0003851279616355896, 0.0004028230905532837, 0.0004205182194709778, 0.0004382133483886719]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 0.0, 4.0, 6.0, 6.0, 8.0, 9.0, 19.0, 30.0, 24.0, 36.0, 39.0, 59.0, 77.0, 91.0, 107.0, 109.0, 70.0, 69.0, 55.0, 42.0, 32.0, 22.0, 16.0, 13.0, 13.0, 18.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014816348440945148, -0.01430505234748125, -0.013793757185339928, -0.01328246109187603, -0.012771164998412132, -0.012259868904948235, -0.011748573742806911, -0.011237277649343014, -0.01072598248720169, -0.010214686393737793, -0.00970339123159647, -0.009192095138132572, -0.008680799044668674, -0.008169503882527351, -0.007658207789063454, -0.007146911695599556, -0.006635615602135658, -0.006124319974333048, -0.00561302388086915, -0.00510172825306654, -0.004590432159602642, -0.004079136531800032, -0.0035678409039974213, -0.003056545043364167, -0.002545249182730913, -0.002033953322097659, -0.0015226575778797269, -0.0010113618336617947, -0.0005000659730285406, 1.122988760471344e-05, 0.0005225255154073238, 0.0010338213760405779, 0.0015451163053512573, 0.0020564121659845114, 0.0025677080266177654, 0.003079003654420376, 0.00359029951505363, 0.004101595375686884, 0.004612891003489494, 0.005124187096953392, 0.005635482724756002, 0.006146778352558613, 0.0066580744460225105, 0.007169370073825121, 0.007680665701627731, 0.008191961795091629, 0.008703257888555527, 0.00921455305069685, 0.009725849144160748, 0.010237145237624645, 0.010748440399765968, 0.011259736493229866, 0.011771032586693764, 0.012282328680157661, 0.012793623842298985, 0.013304919935762882, 0.013816215097904205, 0.014327511191368103, 0.014838806353509426, 0.015350102446973324, 0.015861397609114647, 0.016372693702578545, 0.016883989796042442, 0.01739528588950634, 0.017906581982970238]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 12.0, 7.0, 8.0, 12.0, 15.0, 14.0, 19.0, 23.0, 38.0, 30.0, 23.0, 30.0, 34.0, 46.0, 32.0, 46.0, 43.0, 36.0, 44.0, 37.0, 46.0, 48.0, 39.0, 42.0, 38.0, 33.0, 26.0, 26.0, 28.0, 23.0, 13.0, 14.0, 11.0, 11.0, 8.0, 6.0, 2.0, 12.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01140633039176464, -0.011064806953072548, -0.01072328444570303, -0.010381761007010937, -0.010040238499641418, -0.009698715060949326, -0.009357191622257233, -0.009015669114887714, -0.008674146607518196, -0.008332623168826103, -0.007991100661456585, -0.007649577222764492, -0.007308054715394974, -0.006966531276702881, -0.006625008303672075, -0.00628348533064127, -0.005941961891949177, -0.005600438918918371, -0.005258915945887566, -0.004917392507195473, -0.0045758699998259544, -0.0042343465611338615, -0.003892823588103056, -0.0035513006150722504, -0.0032097776420414448, -0.002868254669010639, -0.0025267316959798336, -0.0021852084901183844, -0.0018436855170875788, -0.0015021625440567732, -0.001160639338195324, -0.0008191163651645184, -0.0004775943234562874, -0.00013607129221782088, 0.00020545173902064562, 0.000546974828466773, 0.0008884978014975786, 0.0012300207745283842, 0.0015715439803898335, 0.001913066953420639, 0.0022545899264514446, 0.00259611289948225, 0.002937635872513056, 0.003279159078374505, 0.0036206820514053106, 0.0039622047916054726, 0.0043037282302975655, 0.004645251203328371, 0.004986774176359177, 0.005328297149389982, 0.005669820122420788, 0.006011343561112881, 0.006352866068482399, 0.006694389507174492, 0.0070359124802052975, 0.007377435453236103, 0.007718958426266909, 0.008060481399297714, 0.008402004837989807, 0.008743527345359325, 0.009085050784051418, 0.009426573291420937, 0.00976809673011303, 0.010109620168805122, 0.01045114267617464]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 15.0, 15.0, 19.0, 22.0, 40.0, 68.0, 105.0, 138.0, 195.0, 285.0, 418.0, 577.0, 893.0, 1250.0, 1858.0, 2684.0, 4006.0, 6106.0, 9063.0, 14045.0, 21549.0, 34937.0, 56694.0, 98869.0, 198730.0, 263755.0, 136389.0, 73275.0, 44126.0, 27226.0, 17480.0, 11192.0, 7426.0, 4945.0, 3210.0, 2214.0, 1492.0, 1002.0, 685.0, 474.0, 334.0, 236.0, 156.0, 105.0, 90.0, 44.0, 47.0, 22.0, 19.0, 16.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01922607421875, -0.018610715866088867, -0.017995357513427734, -0.0173799991607666, -0.01676464080810547, -0.016149282455444336, -0.015533924102783203, -0.01491856575012207, -0.014303207397460938, -0.013687849044799805, -0.013072490692138672, -0.012457132339477539, -0.011841773986816406, -0.011226415634155273, -0.01061105728149414, -0.009995698928833008, -0.009380340576171875, -0.008764982223510742, -0.00814962387084961, -0.0075342655181884766, -0.006918907165527344, -0.006303548812866211, -0.005688190460205078, -0.005072832107543945, -0.0044574737548828125, -0.0038421154022216797, -0.003226757049560547, -0.002611398696899414, -0.0019960403442382812, -0.0013806819915771484, -0.0007653236389160156, -0.0001499652862548828, 0.00046539306640625, 0.0010807514190673828, 0.0016961097717285156, 0.0023114681243896484, 0.0029268264770507812, 0.003542184829711914, 0.004157543182373047, 0.00477290153503418, 0.0053882598876953125, 0.006003618240356445, 0.006618976593017578, 0.007234334945678711, 0.007849693298339844, 0.008465051651000977, 0.00908041000366211, 0.009695768356323242, 0.010311126708984375, 0.010926485061645508, 0.01154184341430664, 0.012157201766967773, 0.012772560119628906, 0.013387918472290039, 0.014003276824951172, 0.014618635177612305, 0.015233993530273438, 0.01584935188293457, 0.016464710235595703, 0.017080068588256836, 0.01769542694091797, 0.0183107852935791, 0.018926143646240234, 0.019541501998901367, 0.0201568603515625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 11.0, 21.0, 19.0, 25.0, 23.0, 28.0, 22.0, 30.0, 32.0, 42.0, 44.0, 30.0, 44.0, 47.0, 40.0, 39.0, 64.0, 37.0, 41.0, 46.0, 34.0, 40.0, 30.0, 25.0, 23.0, 22.0, 20.0, 13.0, 12.0, 10.0, 7.0, 12.0, 5.0, 3.0, 10.0, 1.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0102691650390625, -0.009965658187866211, -0.009662151336669922, -0.009358644485473633, -0.009055137634277344, -0.008751630783081055, -0.008448123931884766, -0.008144617080688477, -0.007841110229492188, -0.0075376033782958984, -0.007234096527099609, -0.00693058967590332, -0.006627082824707031, -0.006323575973510742, -0.006020069122314453, -0.005716562271118164, -0.005413055419921875, -0.005109548568725586, -0.004806041717529297, -0.004502534866333008, -0.004199028015136719, -0.0038955211639404297, -0.0035920143127441406, -0.0032885074615478516, -0.0029850006103515625, -0.0026814937591552734, -0.0023779869079589844, -0.0020744800567626953, -0.0017709732055664062, -0.0014674663543701172, -0.0011639595031738281, -0.0008604526519775391, -0.00055694580078125, -0.00025343894958496094, 5.0067901611328125e-05, 0.0003535747528076172, 0.0006570816040039062, 0.0009605884552001953, 0.0012640953063964844, 0.0015676021575927734, 0.0018711090087890625, 0.0021746158599853516, 0.0024781227111816406, 0.0027816295623779297, 0.0030851364135742188, 0.003388643264770508, 0.003692150115966797, 0.003995656967163086, 0.004299163818359375, 0.004602670669555664, 0.004906177520751953, 0.005209684371948242, 0.005513191223144531, 0.00581669807434082, 0.006120204925537109, 0.0064237117767333984, 0.0067272186279296875, 0.0070307254791259766, 0.007334232330322266, 0.007637739181518555, 0.007941246032714844, 0.008244752883911133, 0.008548259735107422, 0.008851766586303711, 0.0091552734375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 7.0, 6.0, 18.0, 30.0, 37.0, 77.0, 121.0, 167.0, 280.0, 470.0, 792.0, 1335.0, 2176.0, 3761.0, 6645.0, 11426.0, 20612.0, 37906.0, 71979.0, 151648.0, 324427.0, 210492.0, 96084.0, 47872.0, 26094.0, 14398.0, 8322.0, 4645.0, 2741.0, 1614.0, 921.0, 558.0, 330.0, 223.0, 128.0, 86.0, 38.0, 31.0, 20.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023895263671875, -0.0231168270111084, -0.022338390350341797, -0.021559953689575195, -0.020781517028808594, -0.020003080368041992, -0.01922464370727539, -0.01844620704650879, -0.017667770385742188, -0.016889333724975586, -0.016110897064208984, -0.015332460403442383, -0.014554023742675781, -0.01377558708190918, -0.012997150421142578, -0.012218713760375977, -0.011440277099609375, -0.010661840438842773, -0.009883403778076172, -0.00910496711730957, -0.008326530456542969, -0.007548093795776367, -0.006769657135009766, -0.005991220474243164, -0.0052127838134765625, -0.004434347152709961, -0.0036559104919433594, -0.002877473831176758, -0.0020990371704101562, -0.0013206005096435547, -0.0005421638488769531, 0.00023627281188964844, 0.00101470947265625, 0.0017931461334228516, 0.002571582794189453, 0.0033500194549560547, 0.004128456115722656, 0.004906892776489258, 0.005685329437255859, 0.006463766098022461, 0.0072422027587890625, 0.008020639419555664, 0.008799076080322266, 0.009577512741088867, 0.010355949401855469, 0.01113438606262207, 0.011912822723388672, 0.012691259384155273, 0.013469696044921875, 0.014248132705688477, 0.015026569366455078, 0.01580500602722168, 0.01658344268798828, 0.017361879348754883, 0.018140316009521484, 0.018918752670288086, 0.019697189331054688, 0.02047562599182129, 0.02125406265258789, 0.022032499313354492, 0.022810935974121094, 0.023589372634887695, 0.024367809295654297, 0.0251462459564209, 0.0259246826171875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 7.0, 13.0, 12.0, 14.0, 19.0, 19.0, 22.0, 25.0, 32.0, 34.0, 42.0, 42.0, 43.0, 41.0, 36.0, 39.0, 36.0, 43.0, 38.0, 37.0, 43.0, 46.0, 43.0, 37.0, 22.0, 23.0, 22.0, 28.0, 23.0, 19.0, 18.0, 10.0, 12.0, 13.0, 7.0, 5.0, 8.0, 1.0, 7.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004962921142578125, -0.004770994186401367, -0.004579067230224609, -0.0043871402740478516, -0.004195213317871094, -0.004003286361694336, -0.003811359405517578, -0.0036194324493408203, -0.0034275054931640625, -0.0032355785369873047, -0.003043651580810547, -0.002851724624633789, -0.0026597976684570312, -0.0024678707122802734, -0.0022759437561035156, -0.002084016799926758, -0.00189208984375, -0.0017001628875732422, -0.0015082359313964844, -0.0013163089752197266, -0.0011243820190429688, -0.0009324550628662109, -0.0007405281066894531, -0.0005486011505126953, -0.0003566741943359375, -0.0001647472381591797, 2.7179718017578125e-05, 0.00021910667419433594, 0.00041103363037109375, 0.0006029605865478516, 0.0007948875427246094, 0.0009868144989013672, 0.001178741455078125, 0.0013706684112548828, 0.0015625953674316406, 0.0017545223236083984, 0.0019464492797851562, 0.002138376235961914, 0.002330303192138672, 0.0025222301483154297, 0.0027141571044921875, 0.0029060840606689453, 0.003098011016845703, 0.003289937973022461, 0.0034818649291992188, 0.0036737918853759766, 0.0038657188415527344, 0.004057645797729492, 0.00424957275390625, 0.004441499710083008, 0.004633426666259766, 0.0048253536224365234, 0.005017280578613281, 0.005209207534790039, 0.005401134490966797, 0.005593061447143555, 0.0057849884033203125, 0.00597691535949707, 0.006168842315673828, 0.006360769271850586, 0.006552696228027344, 0.0067446231842041016, 0.006936550140380859, 0.007128477096557617, 0.007320404052734375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 5.0, 17.0, 17.0, 26.0, 38.0, 68.0, 70.0, 114.0, 208.0, 240.0, 387.0, 595.0, 833.0, 1225.0, 1743.0, 2481.0, 3645.0, 5190.0, 8388.0, 14625.0, 38063.0, 673711.0, 230577.0, 30084.0, 12939.0, 7653.0, 4678.0, 3347.0, 2338.0, 1590.0, 1123.0, 788.0, 576.0, 337.0, 278.0, 177.0, 125.0, 87.0, 51.0, 43.0, 19.0, 13.0, 16.0, 10.0, 4.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.0020465850830078125, -0.001987949013710022, -0.0019293129444122314, -0.001870676875114441, -0.0018120408058166504, -0.0017534047365188599, -0.0016947686672210693, -0.0016361325979232788, -0.0015774965286254883, -0.0015188604593276978, -0.0014602243900299072, -0.0014015883207321167, -0.0013429522514343262, -0.0012843161821365356, -0.0012256801128387451, -0.0011670440435409546, -0.001108407974243164, -0.0010497719049453735, -0.000991135835647583, -0.0009324997663497925, -0.000873863697052002, -0.0008152276277542114, -0.0007565915584564209, -0.0006979554891586304, -0.0006393194198608398, -0.0005806833505630493, -0.0005220472812652588, -0.00046341121196746826, -0.00040477514266967773, -0.0003461390733718872, -0.0002875030040740967, -0.00022886693477630615, -0.00017023086547851562, -0.0001115947961807251, -5.295872688293457e-05, 5.677342414855957e-06, 6.431341171264648e-05, 0.000122949481010437, 0.00018158555030822754, 0.00024022161960601807, 0.0002988576889038086, 0.0003574937582015991, 0.00041612982749938965, 0.0004747658967971802, 0.0005334019660949707, 0.0005920380353927612, 0.0006506741046905518, 0.0007093101739883423, 0.0007679462432861328, 0.0008265823125839233, 0.0008852183818817139, 0.0009438544511795044, 0.001002490520477295, 0.0010611265897750854, 0.001119762659072876, 0.0011783987283706665, 0.001237034797668457, 0.0012956708669662476, 0.001354306936264038, 0.0014129430055618286, 0.0014715790748596191, 0.0015302151441574097, 0.0015888512134552002, 0.0016474872827529907, 0.0017061233520507812]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 0.0, 1.0, 8.0, 7.0, 0.0, 21.0, 23.0, 0.0, 35.0, 60.0, 0.0, 89.0, 125.0, 222.0, 0.0, 138.0, 67.0, 0.0, 49.0, 53.0, 27.0, 0.0, 25.0, 18.0, 0.0, 9.0, 5.0, 0.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2097880244255066e-06, -1.16787850856781e-06, -1.1259689927101135e-06, -1.084059476852417e-06, -1.0421499609947205e-06, -1.000240445137024e-06, -9.583309292793274e-07, -9.164214134216309e-07, -8.745118975639343e-07, -8.326023817062378e-07, -7.906928658485413e-07, -7.487833499908447e-07, -7.068738341331482e-07, -6.649643182754517e-07, -6.230548024177551e-07, -5.811452865600586e-07, -5.392357707023621e-07, -4.973262548446655e-07, -4.55416738986969e-07, -4.1350722312927246e-07, -3.7159770727157593e-07, -3.296881914138794e-07, -2.8777867555618286e-07, -2.4586915969848633e-07, -2.039596438407898e-07, -1.6205012798309326e-07, -1.2014061212539673e-07, -7.82310962677002e-08, -3.632158041000366e-08, 5.587935447692871e-09, 4.7497451305389404e-08, 8.940696716308594e-08, 1.3131648302078247e-07, 1.73225998878479e-07, 2.1513551473617554e-07, 2.5704503059387207e-07, 2.989545464515686e-07, 3.4086406230926514e-07, 3.8277357816696167e-07, 4.246830940246582e-07, 4.6659260988235474e-07, 5.085021257400513e-07, 5.504116415977478e-07, 5.923211574554443e-07, 6.342306733131409e-07, 6.761401891708374e-07, 7.180497050285339e-07, 7.599592208862305e-07, 8.01868736743927e-07, 8.437782526016235e-07, 8.856877684593201e-07, 9.275972843170166e-07, 9.695068001747131e-07, 1.0114163160324097e-06, 1.0533258318901062e-06, 1.0952353477478027e-06, 1.1371448636054993e-06, 1.1790543794631958e-06, 1.2209638953208923e-06, 1.2628734111785889e-06, 1.3047829270362854e-06, 1.346692442893982e-06, 1.3886019587516785e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 7.0, 9.0, 8.0, 18.0, 23.0, 33.0, 54.0, 69.0, 95.0, 154.0, 253.0, 290.0, 476.0, 755.0, 1085.0, 1550.0, 2516.0, 3836.0, 6283.0, 10567.0, 20367.0, 69699.0, 810939.0, 70697.0, 20573.0, 10630.0, 6236.0, 3922.0, 2497.0, 1622.0, 1107.0, 697.0, 425.0, 311.0, 249.0, 165.0, 92.0, 70.0, 50.0, 45.0, 26.0, 20.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0024433135986328125, -0.002370387315750122, -0.0022974610328674316, -0.002224534749984741, -0.0021516084671020508, -0.0020786821842193604, -0.00200575590133667, -0.0019328296184539795, -0.001859903335571289, -0.0017869770526885986, -0.0017140507698059082, -0.0016411244869232178, -0.0015681982040405273, -0.001495271921157837, -0.0014223456382751465, -0.001349419355392456, -0.0012764930725097656, -0.0012035667896270752, -0.0011306405067443848, -0.0010577142238616943, -0.000984787940979004, -0.0009118616580963135, -0.000838935375213623, -0.0007660090923309326, -0.0006930828094482422, -0.0006201565265655518, -0.0005472302436828613, -0.0004743039608001709, -0.00040137767791748047, -0.00032845139503479004, -0.0002555251121520996, -0.00018259882926940918, -0.00010967254638671875, -3.674626350402832e-05, 3.618001937866211e-05, 0.00010910630226135254, 0.00018203258514404297, 0.0002549588680267334, 0.00032788515090942383, 0.00040081143379211426, 0.0004737377166748047, 0.0005466639995574951, 0.0006195902824401855, 0.000692516565322876, 0.0007654428482055664, 0.0008383691310882568, 0.0009112954139709473, 0.0009842216968536377, 0.0010571479797363281, 0.0011300742626190186, 0.001203000545501709, 0.0012759268283843994, 0.0013488531112670898, 0.0014217793941497803, 0.0014947056770324707, 0.0015676319599151611, 0.0016405582427978516, 0.001713484525680542, 0.0017864108085632324, 0.0018593370914459229, 0.0019322633743286133, 0.0020051896572113037, 0.002078115940093994, 0.0021510422229766846, 0.002223968505859375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 8.0, 8.0, 8.0, 9.0, 18.0, 37.0, 93.0, 257.0, 306.0, 90.0, 30.0, 21.0, 16.0, 9.0, 11.0, 2.0, 4.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006771087646484375, -0.0006572306156158447, -0.000637352466583252, -0.0006174743175506592, -0.0005975961685180664, -0.0005777180194854736, -0.0005578398704528809, -0.0005379617214202881, -0.0005180835723876953, -0.0004982054233551025, -0.00047832727432250977, -0.000458449125289917, -0.0004385709762573242, -0.00041869282722473145, -0.00039881467819213867, -0.0003789365291595459, -0.0003590583801269531, -0.00033918023109436035, -0.0003193020820617676, -0.0002994239330291748, -0.00027954578399658203, -0.00025966763496398926, -0.00023978948593139648, -0.0002199113368988037, -0.00020003318786621094, -0.00018015503883361816, -0.0001602768898010254, -0.00014039874076843262, -0.00012052059173583984, -0.00010064244270324707, -8.07642936706543e-05, -6.0886144638061523e-05, -4.100799560546875e-05, -2.1129846572875977e-05, -1.2516975402832031e-06, 1.862645149230957e-05, 3.8504600524902344e-05, 5.838274955749512e-05, 7.826089859008789e-05, 9.813904762268066e-05, 0.00011801719665527344, 0.0001378953456878662, 0.00015777349472045898, 0.00017765164375305176, 0.00019752979278564453, 0.0002174079418182373, 0.00023728609085083008, 0.00025716423988342285, 0.0002770423889160156, 0.0002969205379486084, 0.00031679868698120117, 0.00033667683601379395, 0.0003565549850463867, 0.0003764331340789795, 0.00039631128311157227, 0.00041618943214416504, 0.0004360675811767578, 0.0004559457302093506, 0.00047582387924194336, 0.0004957020282745361, 0.0005155801773071289, 0.0005354583263397217, 0.0005553364753723145, 0.0005752146244049072, 0.0005950927734375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 8.0, 3.0, 5.0, 1.0, 8.0, 16.0, 17.0, 13.0, 29.0, 36.0, 36.0, 46.0, 52.0, 57.0, 86.0, 100.0, 83.0, 81.0, 61.0, 61.0, 36.0, 29.0, 26.0, 15.0, 24.0, 12.0, 13.0, 14.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01078855898231268, -0.010390453971922398, -0.00999234989285469, -0.009594244882464409, -0.009196140803396702, -0.00879803579300642, -0.008399931713938713, -0.008001826703548431, -0.007603722158819437, -0.007205617614090443, -0.006807513069361448, -0.006409408524632454, -0.006011303514242172, -0.005613199435174465, -0.0052150944247841835, -0.004816989880055189, -0.004418885335326195, -0.0040207807905972, -0.003622676245868206, -0.003224571468308568, -0.0028264669235795736, -0.0024283623788505793, -0.0020302576012909412, -0.0016321530565619469, -0.0012340485118329525, -0.0008359439088962972, -0.00043783930595964193, -3.973464481532574e-05, 0.00035836989991366863, 0.000756474444642663, 0.001154579222202301, 0.0015526837669312954, 0.0019507883116602898, 0.002348892856389284, 0.0027469974011182785, 0.0031451021786779165, 0.003543206723406911, 0.003941311500966549, 0.004339416045695543, 0.004737520590424538, 0.005135625135153532, 0.005533729679882526, 0.005931834224611521, 0.006329938769340515, 0.006728043779730797, 0.007126147858798504, 0.0075242528691887856, 0.007922356948256493, 0.008320461958646774, 0.008718566969037056, 0.009116671048104763, 0.009514776058495045, 0.009912880137562752, 0.010310985147953033, 0.010709090158343315, 0.011107194237411022, 0.01150529831647873, 0.011903403326869011, 0.012301507405936718, 0.012699612416327, 0.013097716495394707, 0.013495821505784988, 0.01389392651617527, 0.014292030595242977, 0.014690135605633259]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 6.0, 11.0, 15.0, 17.0, 14.0, 17.0, 18.0, 14.0, 30.0, 32.0, 32.0, 27.0, 25.0, 45.0, 27.0, 35.0, 37.0, 34.0, 42.0, 32.0, 36.0, 44.0, 30.0, 33.0, 45.0, 34.0, 28.0, 36.0, 18.0, 20.0, 26.0, 14.0, 16.0, 16.0, 11.0, 6.0, 12.0, 4.0, 6.0, 6.0, 6.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00871752854436636, -0.008444925770163536, -0.008172322064638138, -0.00789971835911274, -0.007627115584909916, -0.007354512345045805, -0.007081909105181694, -0.006809305865317583, -0.006536702625453472, -0.006264099385589361, -0.00599149614572525, -0.005718892905861139, -0.005446289665997028, -0.005173686426132917, -0.0049010831862688065, -0.0046284799464046955, -0.0043558767065405846, -0.004083273466676474, -0.0038106702268123627, -0.0035380669869482517, -0.0032654637470841408, -0.00299286050722003, -0.002720257267355919, -0.002447654027491808, -0.002175050787627697, -0.001902447547763586, -0.001629844307899475, -0.0013572410680353642, -0.0010846378281712532, -0.0008120345883071423, -0.0005394313484430313, -0.00026682810857892036, 5.775131285190582e-06, 0.00027837837114930153, 0.0005509816110134125, 0.0008235848508775234, 0.0010961880907416344, 0.0013687913306057453, 0.0016413945704698563, 0.0019139978103339672, 0.002186601050198078, 0.002459204290062189, 0.0027318075299263, 0.003004410769790411, 0.003277014009654522, 0.003549617249518633, 0.003822220489382744, 0.004094823729246855, 0.004367426969110966, 0.004640030208975077, 0.004912633448839188, 0.005185236688703299, 0.0054578399285674095, 0.0057304431684315205, 0.006003046408295631, 0.006275649648159742, 0.006548252888023853, 0.006820856127887964, 0.007093459367752075, 0.007366062607616186, 0.007638665847480297, 0.00791126862168312, 0.008183872327208519, 0.008456476032733917, 0.008729078806936741]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 1.0, 6.0, 10.0, 9.0, 18.0, 35.0, 27.0, 44.0, 81.0, 125.0, 198.0, 266.0, 370.0, 517.0, 747.0, 1168.0, 1666.0, 2617.0, 3941.0, 5973.0, 9267.0, 14705.0, 23683.0, 38881.0, 66130.0, 120734.0, 254220.0, 785081.0, 1744858.0, 630325.0, 221102.0, 109650.0, 60845.0, 35824.0, 21632.0, 13605.0, 8835.0, 5767.0, 3750.0, 2461.0, 1641.0, 1150.0, 731.0, 529.0, 362.0, 248.0, 144.0, 114.0, 72.0, 50.0, 34.0, 18.0, 11.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01318359375, -0.01280057430267334, -0.01241755485534668, -0.01203453540802002, -0.01165151596069336, -0.0112684965133667, -0.010885477066040039, -0.010502457618713379, -0.010119438171386719, -0.009736418724060059, -0.009353399276733398, -0.008970379829406738, -0.008587360382080078, -0.008204340934753418, -0.007821321487426758, -0.007438302040100098, -0.0070552825927734375, -0.006672263145446777, -0.006289243698120117, -0.005906224250793457, -0.005523204803466797, -0.005140185356140137, -0.0047571659088134766, -0.004374146461486816, -0.003991127014160156, -0.003608107566833496, -0.003225088119506836, -0.0028420686721801758, -0.0024590492248535156, -0.0020760297775268555, -0.0016930103302001953, -0.0013099908828735352, -0.000926971435546875, -0.0005439519882202148, -0.0001609325408935547, 0.00022208690643310547, 0.0006051063537597656, 0.0009881258010864258, 0.001371145248413086, 0.001754164695739746, 0.0021371841430664062, 0.0025202035903930664, 0.0029032230377197266, 0.0032862424850463867, 0.003669261932373047, 0.004052281379699707, 0.004435300827026367, 0.004818320274353027, 0.0052013397216796875, 0.005584359169006348, 0.005967378616333008, 0.006350398063659668, 0.006733417510986328, 0.007116436958312988, 0.0074994564056396484, 0.007882475852966309, 0.008265495300292969, 0.008648514747619629, 0.009031534194946289, 0.00941455364227295, 0.00979757308959961, 0.01018059253692627, 0.01056361198425293, 0.01094663143157959, 0.01132965087890625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 8.0, 9.0, 9.0, 17.0, 10.0, 15.0, 16.0, 22.0, 24.0, 24.0, 17.0, 27.0, 29.0, 35.0, 33.0, 39.0, 34.0, 38.0, 43.0, 34.0, 44.0, 37.0, 33.0, 48.0, 45.0, 36.0, 34.0, 26.0, 25.0, 23.0, 20.0, 17.0, 23.0, 15.0, 17.0, 10.0, 6.0, 10.0, 5.0, 6.0, 6.0, 6.0, 4.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.005268096923828125, -0.005112767219543457, -0.004957437515258789, -0.004802107810974121, -0.004646778106689453, -0.004491448402404785, -0.004336118698120117, -0.004180788993835449, -0.004025459289550781, -0.0038701295852661133, -0.0037147998809814453, -0.0035594701766967773, -0.0034041404724121094, -0.0032488107681274414, -0.0030934810638427734, -0.0029381513595581055, -0.0027828216552734375, -0.0026274919509887695, -0.0024721622467041016, -0.0023168325424194336, -0.0021615028381347656, -0.0020061731338500977, -0.0018508434295654297, -0.0016955137252807617, -0.0015401840209960938, -0.0013848543167114258, -0.0012295246124267578, -0.0010741949081420898, -0.0009188652038574219, -0.0007635354995727539, -0.0006082057952880859, -0.00045287609100341797, -0.00029754638671875, -0.00014221668243408203, 1.3113021850585938e-05, 0.0001684427261352539, 0.0003237724304199219, 0.00047910213470458984, 0.0006344318389892578, 0.0007897615432739258, 0.0009450912475585938, 0.0011004209518432617, 0.0012557506561279297, 0.0014110803604125977, 0.0015664100646972656, 0.0017217397689819336, 0.0018770694732666016, 0.0020323991775512695, 0.0021877288818359375, 0.0023430585861206055, 0.0024983882904052734, 0.0026537179946899414, 0.0028090476989746094, 0.0029643774032592773, 0.0031197071075439453, 0.0032750368118286133, 0.0034303665161132812, 0.0035856962203979492, 0.003741025924682617, 0.003896355628967285, 0.004051685333251953, 0.004207015037536621, 0.004362344741821289, 0.004517674446105957, 0.004673004150390625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 14.0, 10.0, 18.0, 28.0, 42.0, 54.0, 81.0, 146.0, 222.0, 393.0, 570.0, 820.0, 1437.0, 2353.0, 3786.0, 6063.0, 9959.0, 16423.0, 27837.0, 49017.0, 87622.0, 165948.0, 337297.0, 820615.0, 1457866.0, 619645.0, 273110.0, 137711.0, 73529.0, 41313.0, 23945.0, 13905.0, 8590.0, 5211.0, 3264.0, 2086.0, 1272.0, 813.0, 499.0, 263.0, 188.0, 106.0, 84.0, 39.0, 39.0, 21.0, 16.0, 5.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00928497314453125, -0.00898885726928711, -0.008692741394042969, -0.008396625518798828, -0.008100509643554688, -0.007804393768310547, -0.007508277893066406, -0.007212162017822266, -0.006916046142578125, -0.006619930267333984, -0.006323814392089844, -0.006027698516845703, -0.0057315826416015625, -0.005435466766357422, -0.005139350891113281, -0.004843235015869141, -0.004547119140625, -0.004251003265380859, -0.003954887390136719, -0.003658771514892578, -0.0033626556396484375, -0.003066539764404297, -0.0027704238891601562, -0.0024743080139160156, -0.002178192138671875, -0.0018820762634277344, -0.0015859603881835938, -0.0012898445129394531, -0.0009937286376953125, -0.0006976127624511719, -0.00040149688720703125, -0.00010538101196289062, 0.00019073486328125, 0.0004868507385253906, 0.0007829666137695312, 0.0010790824890136719, 0.0013751983642578125, 0.0016713142395019531, 0.0019674301147460938, 0.0022635459899902344, 0.002559661865234375, 0.0028557777404785156, 0.0031518936157226562, 0.003448009490966797, 0.0037441253662109375, 0.004040241241455078, 0.004336357116699219, 0.004632472991943359, 0.0049285888671875, 0.005224704742431641, 0.005520820617675781, 0.005816936492919922, 0.0061130523681640625, 0.006409168243408203, 0.006705284118652344, 0.007001399993896484, 0.007297515869140625, 0.007593631744384766, 0.007889747619628906, 0.008185863494873047, 0.008481979370117188, 0.008778095245361328, 0.009074211120605469, 0.00937032699584961, 0.00966644287109375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 11.0, 14.0, 20.0, 27.0, 31.0, 29.0, 35.0, 37.0, 49.0, 69.0, 82.0, 89.0, 118.0, 131.0, 160.0, 162.0, 157.0, 199.0, 238.0, 287.0, 311.0, 258.0, 234.0, 198.0, 188.0, 139.0, 128.0, 117.0, 112.0, 87.0, 73.0, 48.0, 42.0, 46.0, 31.0, 25.0, 19.0, 11.0, 18.0, 13.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028018951416015625, -0.0027147531509399414, -0.0026276111602783203, -0.0025404691696166992, -0.002453327178955078, -0.002366185188293457, -0.002279043197631836, -0.002191901206970215, -0.0021047592163085938, -0.0020176172256469727, -0.0019304752349853516, -0.0018433332443237305, -0.0017561912536621094, -0.0016690492630004883, -0.0015819072723388672, -0.001494765281677246, -0.001407623291015625, -0.001320481300354004, -0.0012333393096923828, -0.0011461973190307617, -0.0010590553283691406, -0.0009719133377075195, -0.0008847713470458984, -0.0007976293563842773, -0.0007104873657226562, -0.0006233453750610352, -0.0005362033843994141, -0.00044906139373779297, -0.0003619194030761719, -0.0002747774124145508, -0.0001876354217529297, -0.0001004934310913086, -1.33514404296875e-05, 7.37905502319336e-05, 0.0001609325408935547, 0.0002480745315551758, 0.0003352165222167969, 0.00042235851287841797, 0.0005095005035400391, 0.0005966424942016602, 0.0006837844848632812, 0.0007709264755249023, 0.0008580684661865234, 0.0009452104568481445, 0.0010323524475097656, 0.0011194944381713867, 0.0012066364288330078, 0.001293778419494629, 0.00138092041015625, 0.001468062400817871, 0.0015552043914794922, 0.0016423463821411133, 0.0017294883728027344, 0.0018166303634643555, 0.0019037723541259766, 0.0019909143447875977, 0.0020780563354492188, 0.00216519832611084, 0.002252340316772461, 0.002339482307434082, 0.002426624298095703, 0.0025137662887573242, 0.0026009082794189453, 0.0026880502700805664, 0.0027751922607421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 5.0, 13.0, 24.0, 25.0, 24.0, 49.0, 44.0, 59.0, 83.0, 82.0, 88.0, 104.0, 85.0, 68.0, 46.0, 34.0, 23.0, 33.0, 22.0, 14.0, 16.0, 7.0, 9.0, 8.0, 5.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007800758816301823, -0.007521199062466621, -0.00724163930863142, -0.006962079554796219, -0.006682519800961018, -0.006402960047125816, -0.006123400758951902, -0.005843841005116701, -0.0055642812512815, -0.005284721497446299, -0.005005161743611097, -0.004725601989775896, -0.004446042701601982, -0.004166482947766781, -0.0038869231939315796, -0.0036073634400963783, -0.003327803686261177, -0.003048243932425976, -0.0027686841785907745, -0.002489124657586217, -0.0022095649037510157, -0.0019300051499158144, -0.001650445512495935, -0.0013708858750760555, -0.0010913261212408543, -0.0008117664256133139, -0.0005322067299857736, -0.0002526470343582332, 2.6912661269307137e-05, 0.0003064724151045084, 0.0005860320525243878, 0.0008655916899442673, 0.0011451514437794685, 0.0014247111976146698, 0.0017042708350345492, 0.0019838304724544287, 0.00226339022628963, 0.002542949980124831, 0.002822509501129389, 0.00310206925496459, 0.0033816290087997913, 0.0036611887626349926, 0.003940748516470194, 0.004220308270305395, 0.004499867558479309, 0.00477942731231451, 0.005058987066149712, 0.005338546819984913, 0.005618106573820114, 0.005897666327655315, 0.006177226081490517, 0.006456785835325718, 0.006736345589160919, 0.0070159053429961205, 0.007295464631170034, 0.007575024385005236, 0.007854584604501724, 0.008134144358336926, 0.008413704112172127, 0.008693263866007328, 0.00897282361984253, 0.00925238337367773, 0.009531943127512932, 0.009811501950025558, 0.01009106170386076]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 2.0, 13.0, 20.0, 17.0, 15.0, 22.0, 24.0, 19.0, 32.0, 34.0, 39.0, 39.0, 58.0, 48.0, 39.0, 44.0, 39.0, 46.0, 47.0, 46.0, 34.0, 38.0, 37.0, 39.0, 37.0, 17.0, 22.0, 18.0, 22.0, 21.0, 10.0, 8.0, 6.0, 10.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.006916028913110495, -0.006715869065374136, -0.00651570875197649, -0.006315548904240131, -0.006115389056503773, -0.005915229208767414, -0.005715068895369768, -0.0055149090476334095, -0.0053147487342357635, -0.005114588886499405, -0.004914428573101759, -0.0047142687253654, -0.004514108877629042, -0.004313948564231396, -0.004113788716495037, -0.0039136288687586784, -0.00371346902102232, -0.0035133089404553175, -0.003313149092718959, -0.0031129890121519566, -0.002912829164415598, -0.0027126690838485956, -0.0025125090032815933, -0.0023123491555452347, -0.0021121890749782324, -0.001912029110826552, -0.0017118691466748714, -0.0015117090661078691, -0.0013115491019561887, -0.0011113891378045082, -0.0009112290572375059, -0.0007110690930858254, -0.0005109095945954323, -0.00031074960133992136, -0.00011058960808441043, 8.957041427493095e-05, 0.0002897303784266114, 0.0004898903425782919, 0.0006900504231452942, 0.0008902103872969747, 0.0010903703514486551, 0.0012905303156003356, 0.001490690279752016, 0.0016908503603190184, 0.0018910103244706988, 0.0020911702886223793, 0.0022913303691893816, 0.002491490449756384, 0.0026916502974927425, 0.002891810378059745, 0.0030919702257961035, 0.0032921303063631058, 0.0034922901540994644, 0.0036924502346664667, 0.003892610315233469, 0.004092770162969828, 0.004292930476367474, 0.004493090324103832, 0.004693250637501478, 0.004893410485237837, 0.0050935703329741955, 0.005293730646371841, 0.0054938904941082, 0.005694050341844559, 0.005894210189580917]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 12.0, 11.0, 20.0, 18.0, 35.0, 43.0, 78.0, 92.0, 145.0, 241.0, 353.0, 507.0, 762.0, 1092.0, 1781.0, 2733.0, 4290.0, 7012.0, 11877.0, 20090.0, 36440.0, 71485.0, 160057.0, 369713.0, 183969.0, 80021.0, 40366.0, 22126.0, 12467.0, 7501.0, 4698.0, 3012.0, 1838.0, 1207.0, 796.0, 566.0, 370.0, 232.0, 165.0, 100.0, 78.0, 42.0, 34.0, 20.0, 24.0, 14.0, 9.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.0064239501953125, -0.006232619285583496, -0.006041288375854492, -0.005849957466125488, -0.005658626556396484, -0.0054672956466674805, -0.0052759647369384766, -0.005084633827209473, -0.004893302917480469, -0.004701972007751465, -0.004510641098022461, -0.004319310188293457, -0.004127979278564453, -0.003936648368835449, -0.0037453174591064453, -0.0035539865493774414, -0.0033626556396484375, -0.0031713247299194336, -0.0029799938201904297, -0.0027886629104614258, -0.002597332000732422, -0.002406001091003418, -0.002214670181274414, -0.00202333927154541, -0.0018320083618164062, -0.0016406774520874023, -0.0014493465423583984, -0.0012580156326293945, -0.0010666847229003906, -0.0008753538131713867, -0.0006840229034423828, -0.0004926919937133789, -0.000301361083984375, -0.0001100301742553711, 8.130073547363281e-05, 0.0002726316452026367, 0.0004639625549316406, 0.0006552934646606445, 0.0008466243743896484, 0.0010379552841186523, 0.0012292861938476562, 0.0014206171035766602, 0.001611948013305664, 0.001803278923034668, 0.001994609832763672, 0.0021859407424926758, 0.0023772716522216797, 0.0025686025619506836, 0.0027599334716796875, 0.0029512643814086914, 0.0031425952911376953, 0.0033339262008666992, 0.003525257110595703, 0.003716588020324707, 0.003907918930053711, 0.004099249839782715, 0.004290580749511719, 0.004481911659240723, 0.0046732425689697266, 0.0048645734786987305, 0.005055904388427734, 0.005247235298156738, 0.005438566207885742, 0.005629897117614746, 0.00582122802734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 5.0, 11.0, 18.0, 18.0, 17.0, 20.0, 23.0, 32.0, 30.0, 45.0, 51.0, 49.0, 39.0, 44.0, 42.0, 39.0, 50.0, 49.0, 42.0, 44.0, 40.0, 41.0, 44.0, 24.0, 24.0, 21.0, 23.0, 19.0, 20.0, 16.0, 10.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00696563720703125, -0.006754755973815918, -0.006543874740600586, -0.006332993507385254, -0.006122112274169922, -0.00591123104095459, -0.005700349807739258, -0.005489468574523926, -0.005278587341308594, -0.005067706108093262, -0.00485682487487793, -0.004645943641662598, -0.004435062408447266, -0.004224181175231934, -0.0040132999420166016, -0.0038024187088012695, -0.0035915374755859375, -0.0033806562423706055, -0.0031697750091552734, -0.0029588937759399414, -0.0027480125427246094, -0.0025371313095092773, -0.0023262500762939453, -0.0021153688430786133, -0.0019044876098632812, -0.0016936063766479492, -0.0014827251434326172, -0.0012718439102172852, -0.0010609626770019531, -0.0008500814437866211, -0.0006392002105712891, -0.00042831897735595703, -0.000217437744140625, -6.556510925292969e-06, 0.00020432472229003906, 0.0004152059555053711, 0.0006260871887207031, 0.0008369684219360352, 0.0010478496551513672, 0.0012587308883666992, 0.0014696121215820312, 0.0016804933547973633, 0.0018913745880126953, 0.0021022558212280273, 0.0023131370544433594, 0.0025240182876586914, 0.0027348995208740234, 0.0029457807540893555, 0.0031566619873046875, 0.0033675432205200195, 0.0035784244537353516, 0.0037893056869506836, 0.004000186920166016, 0.004211068153381348, 0.00442194938659668, 0.004632830619812012, 0.004843711853027344, 0.005054593086242676, 0.005265474319458008, 0.00547635555267334, 0.005687236785888672, 0.005898118019104004, 0.006108999252319336, 0.006319880485534668, 0.00653076171875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 9.0, 9.0, 24.0, 33.0, 39.0, 49.0, 79.0, 112.0, 158.0, 185.0, 339.0, 466.0, 634.0, 981.0, 1414.0, 2120.0, 3319.0, 5549.0, 9746.0, 19692.0, 51643.0, 467072.0, 392183.0, 48703.0, 19472.0, 9648.0, 5369.0, 3131.0, 1987.0, 1348.0, 935.0, 621.0, 445.0, 299.0, 210.0, 158.0, 114.0, 79.0, 46.0, 38.0, 26.0, 13.0, 19.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.01119232177734375, -0.010852932929992676, -0.010513544082641602, -0.010174155235290527, -0.009834766387939453, -0.009495377540588379, -0.009155988693237305, -0.00881659984588623, -0.008477210998535156, -0.008137822151184082, -0.007798433303833008, -0.007459044456481934, -0.007119655609130859, -0.006780266761779785, -0.006440877914428711, -0.006101489067077637, -0.0057621002197265625, -0.005422711372375488, -0.005083322525024414, -0.00474393367767334, -0.004404544830322266, -0.004065155982971191, -0.003725767135620117, -0.003386378288269043, -0.0030469894409179688, -0.0027076005935668945, -0.0023682117462158203, -0.002028822898864746, -0.0016894340515136719, -0.0013500452041625977, -0.0010106563568115234, -0.0006712675094604492, -0.000331878662109375, 7.510185241699219e-06, 0.00034689903259277344, 0.0006862878799438477, 0.0010256767272949219, 0.001365065574645996, 0.0017044544219970703, 0.0020438432693481445, 0.0023832321166992188, 0.002722620964050293, 0.003062009811401367, 0.0034013986587524414, 0.0037407875061035156, 0.00408017635345459, 0.004419565200805664, 0.004758954048156738, 0.0050983428955078125, 0.005437731742858887, 0.005777120590209961, 0.006116509437561035, 0.006455898284912109, 0.006795287132263184, 0.007134675979614258, 0.007474064826965332, 0.007813453674316406, 0.00815284252166748, 0.008492231369018555, 0.008831620216369629, 0.009171009063720703, 0.009510397911071777, 0.009849786758422852, 0.010189175605773926, 0.010528564453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 2.0, 13.0, 10.0, 12.0, 12.0, 8.0, 11.0, 15.0, 30.0, 22.0, 30.0, 31.0, 28.0, 39.0, 33.0, 33.0, 40.0, 34.0, 42.0, 40.0, 37.0, 34.0, 40.0, 39.0, 29.0, 35.0, 35.0, 34.0, 32.0, 23.0, 28.0, 22.0, 18.0, 13.0, 18.0, 13.0, 12.0, 8.0, 9.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.003879547119140625, -0.0037613511085510254, -0.0036431550979614258, -0.003524959087371826, -0.0034067630767822266, -0.003288567066192627, -0.0031703710556030273, -0.0030521750450134277, -0.002933979034423828, -0.0028157830238342285, -0.002697587013244629, -0.0025793910026550293, -0.0024611949920654297, -0.00234299898147583, -0.0022248029708862305, -0.002106606960296631, -0.0019884109497070312, -0.0018702149391174316, -0.001752018928527832, -0.0016338229179382324, -0.0015156269073486328, -0.0013974308967590332, -0.0012792348861694336, -0.001161038875579834, -0.0010428428649902344, -0.0009246468544006348, -0.0008064508438110352, -0.0006882548332214355, -0.0005700588226318359, -0.00045186281204223633, -0.0003336668014526367, -0.0002154707908630371, -9.72747802734375e-05, 2.092123031616211e-05, 0.00013911724090576172, 0.00025731325149536133, 0.00037550926208496094, 0.0004937052726745605, 0.0006119012832641602, 0.0007300972938537598, 0.0008482933044433594, 0.000966489315032959, 0.0010846853256225586, 0.0012028813362121582, 0.0013210773468017578, 0.0014392733573913574, 0.001557469367980957, 0.0016756653785705566, 0.0017938613891601562, 0.0019120573997497559, 0.0020302534103393555, 0.002148449420928955, 0.0022666454315185547, 0.0023848414421081543, 0.002503037452697754, 0.0026212334632873535, 0.002739429473876953, 0.0028576254844665527, 0.0029758214950561523, 0.003094017505645752, 0.0032122135162353516, 0.003330409526824951, 0.0034486055374145508, 0.0035668015480041504, 0.00368499755859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 9.0, 12.0, 12.0, 21.0, 19.0, 25.0, 32.0, 47.0, 75.0, 95.0, 79.0, 162.0, 251.0, 264.0, 441.0, 659.0, 1042.0, 1688.0, 3027.0, 5825.0, 13849.0, 51580.0, 792293.0, 136107.0, 22622.0, 8167.0, 4078.0, 2211.0, 1296.0, 816.0, 475.0, 335.0, 247.0, 152.0, 134.0, 98.0, 70.0, 57.0, 43.0, 46.0, 29.0, 13.0, 11.0, 14.0, 9.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0012445449829101562, -0.0012040287256240845, -0.0011635124683380127, -0.001122996211051941, -0.0010824799537658691, -0.0010419636964797974, -0.0010014474391937256, -0.0009609311819076538, -0.000920414924621582, -0.0008798986673355103, -0.0008393824100494385, -0.0007988661527633667, -0.0007583498954772949, -0.0007178336381912231, -0.0006773173809051514, -0.0006368011236190796, -0.0005962848663330078, -0.000555768609046936, -0.0005152523517608643, -0.0004747360944747925, -0.0004342198371887207, -0.0003937035799026489, -0.00035318732261657715, -0.00031267106533050537, -0.0002721548080444336, -0.00023163855075836182, -0.00019112229347229004, -0.00015060603618621826, -0.00011008977890014648, -6.957352161407471e-05, -2.905726432800293e-05, 1.1458992958068848e-05, 5.1975250244140625e-05, 9.24915075302124e-05, 0.00013300776481628418, 0.00017352402210235596, 0.00021404027938842773, 0.0002545565366744995, 0.0002950727939605713, 0.00033558905124664307, 0.00037610530853271484, 0.0004166215658187866, 0.0004571378231048584, 0.0004976540803909302, 0.000538170337677002, 0.0005786865949630737, 0.0006192028522491455, 0.0006597191095352173, 0.0007002353668212891, 0.0007407516241073608, 0.0007812678813934326, 0.0008217841386795044, 0.0008623003959655762, 0.000902816653251648, 0.0009433329105377197, 0.0009838491678237915, 0.0010243654251098633, 0.001064881682395935, 0.0011053979396820068, 0.0011459141969680786, 0.0011864304542541504, 0.0012269467115402222, 0.001267462968826294, 0.0013079792261123657, 0.0013484954833984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 4.0, 16.0, 7.0, 14.0, 11.0, 19.0, 25.0, 19.0, 36.0, 33.0, 76.0, 59.0, 46.0, 53.0, 60.0, 58.0, 46.0, 71.0, 52.0, 44.0, 37.0, 32.0, 30.0, 17.0, 26.0, 20.0, 18.0, 14.0, 7.0, 10.0, 8.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6065314412117004e-06, -1.5441328287124634e-06, -1.4817342162132263e-06, -1.4193356037139893e-06, -1.3569369912147522e-06, -1.2945383787155151e-06, -1.232139766216278e-06, -1.169741153717041e-06, -1.107342541217804e-06, -1.044943928718567e-06, -9.825453162193298e-07, -9.201467037200928e-07, -8.577480912208557e-07, -7.953494787216187e-07, -7.329508662223816e-07, -6.705522537231445e-07, -6.081536412239075e-07, -5.457550287246704e-07, -4.833564162254333e-07, -4.209578037261963e-07, -3.5855919122695923e-07, -2.9616057872772217e-07, -2.337619662284851e-07, -1.7136335372924805e-07, -1.0896474123001099e-07, -4.6566128730773926e-08, 1.5832483768463135e-08, 7.82310962677002e-08, 1.4062970876693726e-07, 2.0302832126617432e-07, 2.654269337654114e-07, 3.2782554626464844e-07, 3.902241587638855e-07, 4.5262277126312256e-07, 5.150213837623596e-07, 5.774199962615967e-07, 6.398186087608337e-07, 7.022172212600708e-07, 7.646158337593079e-07, 8.270144462585449e-07, 8.89413058757782e-07, 9.51811671257019e-07, 1.014210283756256e-06, 1.0766088962554932e-06, 1.1390075087547302e-06, 1.2014061212539673e-06, 1.2638047337532043e-06, 1.3262033462524414e-06, 1.3886019587516785e-06, 1.4510005712509155e-06, 1.5133991837501526e-06, 1.5757977962493896e-06, 1.6381964087486267e-06, 1.7005950212478638e-06, 1.7629936337471008e-06, 1.8253922462463379e-06, 1.887790858745575e-06, 1.950189471244812e-06, 2.012588083744049e-06, 2.074986696243286e-06, 2.137385308742523e-06, 2.1997839212417603e-06, 2.2621825337409973e-06, 2.3245811462402344e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 11.0, 13.0, 11.0, 12.0, 26.0, 27.0, 34.0, 59.0, 83.0, 101.0, 122.0, 175.0, 284.0, 348.0, 443.0, 654.0, 915.0, 1245.0, 1828.0, 2619.0, 3898.0, 6246.0, 9838.0, 16631.0, 31439.0, 72071.0, 266181.0, 448170.0, 94198.0, 38785.0, 19503.0, 11112.0, 6951.0, 4433.0, 2968.0, 2010.0, 1415.0, 969.0, 738.0, 496.0, 412.0, 292.0, 215.0, 175.0, 109.0, 85.0, 57.0, 46.0, 31.0, 32.0, 17.0, 10.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0009622573852539062, -0.0009313523769378662, -0.0009004473686218262, -0.0008695423603057861, -0.0008386373519897461, -0.0008077323436737061, -0.000776827335357666, -0.000745922327041626, -0.0007150173187255859, -0.0006841123104095459, -0.0006532073020935059, -0.0006223022937774658, -0.0005913972854614258, -0.0005604922771453857, -0.0005295872688293457, -0.0004986822605133057, -0.0004677772521972656, -0.0004368722438812256, -0.00040596723556518555, -0.0003750622272491455, -0.00034415721893310547, -0.00031325221061706543, -0.0002823472023010254, -0.00025144219398498535, -0.0002205371856689453, -0.00018963217735290527, -0.00015872716903686523, -0.0001278221607208252, -9.691715240478516e-05, -6.601214408874512e-05, -3.510713577270508e-05, -4.202127456665039e-06, 2.6702880859375e-05, 5.760788917541504e-05, 8.851289749145508e-05, 0.00011941790580749512, 0.00015032291412353516, 0.0001812279224395752, 0.00021213293075561523, 0.00024303793907165527, 0.0002739429473876953, 0.00030484795570373535, 0.0003357529640197754, 0.00036665797233581543, 0.00039756298065185547, 0.0004284679889678955, 0.00045937299728393555, 0.0004902780055999756, 0.0005211830139160156, 0.0005520880222320557, 0.0005829930305480957, 0.0006138980388641357, 0.0006448030471801758, 0.0006757080554962158, 0.0007066130638122559, 0.0007375180721282959, 0.0007684230804443359, 0.000799328088760376, 0.000830233097076416, 0.0008611381053924561, 0.0008920431137084961, 0.0009229481220245361, 0.0009538531303405762, 0.0009847581386566162, 0.0010156631469726562]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 11.0, 17.0, 22.0, 17.0, 36.0, 40.0, 55.0, 71.0, 212.0, 188.0, 74.0, 64.0, 40.0, 35.0, 20.0, 16.0, 16.0, 11.0, 13.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0005512237548828125, -0.0005344897508621216, -0.0005177557468414307, -0.0005010217428207397, -0.00048428773880004883, -0.0004675537347793579, -0.000450819730758667, -0.0004340857267379761, -0.00041735172271728516, -0.00040061771869659424, -0.0003838837146759033, -0.0003671497106552124, -0.0003504157066345215, -0.00033368170261383057, -0.00031694769859313965, -0.00030021369457244873, -0.0002834796905517578, -0.0002667456865310669, -0.000250011682510376, -0.00023327767848968506, -0.00021654367446899414, -0.00019980967044830322, -0.0001830756664276123, -0.0001663416624069214, -0.00014960765838623047, -0.00013287365436553955, -0.00011613965034484863, -9.940564632415771e-05, -8.26716423034668e-05, -6.593763828277588e-05, -4.920363426208496e-05, -3.246963024139404e-05, -1.5735626220703125e-05, 9.98377799987793e-07, 1.773238182067871e-05, 3.446638584136963e-05, 5.120038986206055e-05, 6.793439388275146e-05, 8.466839790344238e-05, 0.0001014024019241333, 0.00011813640594482422, 0.00013487040996551514, 0.00015160441398620605, 0.00016833841800689697, 0.0001850724220275879, 0.0002018064260482788, 0.00021854043006896973, 0.00023527443408966064, 0.00025200843811035156, 0.0002687424421310425, 0.0002854764461517334, 0.0003022104501724243, 0.00031894445419311523, 0.00033567845821380615, 0.00035241246223449707, 0.000369146466255188, 0.0003858804702758789, 0.0004026144742965698, 0.00041934847831726074, 0.00043608248233795166, 0.0004528164863586426, 0.0004695504903793335, 0.0004862844944000244, 0.0005030184984207153, 0.0005197525024414062]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 16.0, 21.0, 18.0, 42.0, 39.0, 53.0, 51.0, 70.0, 88.0, 115.0, 92.0, 96.0, 49.0, 43.0, 47.0, 36.0, 16.0, 24.0, 17.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008176167495548725, -0.00789280142635107, -0.00760943628847599, -0.007326070219278336, -0.007042704615741968, -0.006759339012205601, -0.006475972943007946, -0.006192607339471579, -0.005909241735935211, -0.005625876132398844, -0.005342510528862476, -0.005059144459664822, -0.004775778856128454, -0.004492413252592087, -0.004209047183394432, -0.003925681579858065, -0.0036423159763216972, -0.00335895037278533, -0.0030755845364183187, -0.0027922187000513077, -0.0025088530965149403, -0.002225487492978573, -0.0019421216566115618, -0.0016587558202445507, -0.0013753902167081833, -0.001092024496756494, -0.0008086587768048048, -0.0005252930568531156, -0.00024192733690142632, 4.143838305026293e-05, 0.00032480410300195217, 0.0006081699393689632, 0.0008915364742279053, 0.0011749021941795945, 0.0014582679141312838, 0.001741633634082973, 0.0020249993540346622, 0.0023083649575710297, 0.0025917307939380407, 0.002875096630305052, 0.0031584622338414192, 0.0034418278373777866, 0.0037251936737447977, 0.004008559510111809, 0.004291925113648176, 0.004575290717184544, 0.004858656786382198, 0.005142022389918566, 0.005425387993454933, 0.005708753596991301, 0.005992119200527668, 0.006275485269725323, 0.00655885087326169, 0.0068422164767980576, 0.007125582545995712, 0.00740894814953208, 0.007692313753068447, 0.007975679822266102, 0.008259044960141182, 0.008542411029338837, 0.008825777098536491, 0.009109142236411572, 0.009392508305609226, 0.009675873443484306, 0.009959239512681961]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 3.0, 3.0, 16.0, 21.0, 14.0, 15.0, 22.0, 29.0, 18.0, 29.0, 34.0, 42.0, 36.0, 54.0, 50.0, 34.0, 47.0, 39.0, 46.0, 46.0, 49.0, 32.0, 35.0, 39.0, 37.0, 34.0, 22.0, 22.0, 17.0, 21.0, 17.0, 15.0, 8.0, 8.0, 10.0, 2.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0067710233852267265, -0.0065748724155128, -0.006378721445798874, -0.00618257001042366, -0.005986419040709734, -0.005790268070995808, -0.005594117101281881, -0.005397966131567955, -0.005201814696192741, -0.005005663726478815, -0.004809512756764889, -0.004613361321389675, -0.004417210351675749, -0.0042210593819618225, -0.004024908412247896, -0.00382875744253397, -0.0036326064728200436, -0.0034364555031061172, -0.0032403043005615473, -0.003044153330847621, -0.002848002128303051, -0.0026518511585891247, -0.0024557001888751984, -0.002259549219161272, -0.002063398016616702, -0.001867246930487454, -0.0016710958443582058, -0.0014749448746442795, -0.0012787937885150313, -0.0010826427023857832, -0.0008864917326718569, -0.0006903406465426087, -0.0004941900260746479, -0.0002980389690492302, -0.00010188791202381253, 9.42631158977747e-05, 0.00029041420202702284, 0.000486565288156271, 0.0006827162578701973, 0.0008788673439994454, 0.0010750184301286936, 0.0012711695162579417, 0.0014673206023871899, 0.0016634715721011162, 0.0018596226582303643, 0.0020557737443596125, 0.0022519247140735388, 0.0024480759166181087, 0.002644226886332035, 0.0028403778560459614, 0.0030365290585905313, 0.0032326800283044577, 0.0034288312308490276, 0.003624982200562954, 0.0038211331702768803, 0.004017284139990807, 0.00421343557536602, 0.0044095865450799465, 0.004605737514793873, 0.0048018889501690865, 0.004998039919883013, 0.005194190889596939, 0.005390341859310865, 0.005586492829024792, 0.005782643798738718]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 17.0, 29.0, 30.0, 63.0, 83.0, 110.0, 181.0, 230.0, 317.0, 484.0, 686.0, 1009.0, 1512.0, 2203.0, 3277.0, 4904.0, 7056.0, 10848.0, 16508.0, 25501.0, 41302.0, 68425.0, 121142.0, 225003.0, 219367.0, 117272.0, 67054.0, 40197.0, 25202.0, 16090.0, 10632.0, 7084.0, 4698.0, 3172.0, 2188.0, 1462.0, 988.0, 711.0, 488.0, 329.0, 214.0, 145.0, 103.0, 66.0, 53.0, 39.0, 23.0, 19.0, 11.0, 11.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0101470947265625, -0.00982975959777832, -0.00951242446899414, -0.009195089340209961, -0.008877754211425781, -0.008560419082641602, -0.008243083953857422, -0.007925748825073242, -0.0076084136962890625, -0.007291078567504883, -0.006973743438720703, -0.0066564083099365234, -0.006339073181152344, -0.006021738052368164, -0.005704402923583984, -0.005387067794799805, -0.005069732666015625, -0.004752397537231445, -0.004435062408447266, -0.004117727279663086, -0.0038003921508789062, -0.0034830570220947266, -0.003165721893310547, -0.002848386764526367, -0.0025310516357421875, -0.002213716506958008, -0.0018963813781738281, -0.0015790462493896484, -0.0012617111206054688, -0.0009443759918212891, -0.0006270408630371094, -0.0003097057342529297, 7.62939453125e-06, 0.0003249645233154297, 0.0006422996520996094, 0.0009596347808837891, 0.0012769699096679688, 0.0015943050384521484, 0.0019116401672363281, 0.002228975296020508, 0.0025463104248046875, 0.002863645553588867, 0.003180980682373047, 0.0034983158111572266, 0.0038156509399414062, 0.004132986068725586, 0.004450321197509766, 0.004767656326293945, 0.005084991455078125, 0.005402326583862305, 0.005719661712646484, 0.006036996841430664, 0.006354331970214844, 0.0066716670989990234, 0.006989002227783203, 0.007306337356567383, 0.0076236724853515625, 0.007941007614135742, 0.008258342742919922, 0.008575677871704102, 0.008893013000488281, 0.009210348129272461, 0.00952768325805664, 0.00984501838684082, 0.010162353515625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 4.0, 11.0, 17.0, 11.0, 13.0, 23.0, 19.0, 30.0, 28.0, 30.0, 28.0, 32.0, 44.0, 44.0, 39.0, 46.0, 43.0, 42.0, 32.0, 52.0, 42.0, 37.0, 33.0, 35.0, 32.0, 32.0, 26.0, 26.0, 17.0, 19.0, 26.0, 11.0, 12.0, 10.0, 12.0, 3.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004833221435546875, -0.004675149917602539, -0.004517078399658203, -0.004359006881713867, -0.004200935363769531, -0.004042863845825195, -0.0038847923278808594, -0.0037267208099365234, -0.0035686492919921875, -0.0034105777740478516, -0.0032525062561035156, -0.0030944347381591797, -0.0029363632202148438, -0.002778291702270508, -0.002620220184326172, -0.002462148666381836, -0.0023040771484375, -0.002146005630493164, -0.001987934112548828, -0.0018298625946044922, -0.0016717910766601562, -0.0015137195587158203, -0.0013556480407714844, -0.0011975765228271484, -0.0010395050048828125, -0.0008814334869384766, -0.0007233619689941406, -0.0005652904510498047, -0.00040721893310546875, -0.0002491474151611328, -9.107589721679688e-05, 6.699562072753906e-05, 0.000225067138671875, 0.00038313865661621094, 0.0005412101745605469, 0.0006992816925048828, 0.0008573532104492188, 0.0010154247283935547, 0.0011734962463378906, 0.0013315677642822266, 0.0014896392822265625, 0.0016477108001708984, 0.0018057823181152344, 0.0019638538360595703, 0.0021219253540039062, 0.002279996871948242, 0.002438068389892578, 0.002596139907836914, 0.00275421142578125, 0.002912282943725586, 0.003070354461669922, 0.003228425979614258, 0.0033864974975585938, 0.0035445690155029297, 0.0037026405334472656, 0.0038607120513916016, 0.0040187835693359375, 0.0041768550872802734, 0.004334926605224609, 0.004492998123168945, 0.004651069641113281, 0.004809141159057617, 0.004967212677001953, 0.005125284194946289, 0.005283355712890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 16.0, 18.0, 25.0, 41.0, 57.0, 84.0, 129.0, 148.0, 260.0, 368.0, 532.0, 768.0, 1093.0, 1653.0, 2407.0, 3531.0, 5091.0, 7847.0, 11900.0, 18042.0, 28503.0, 44586.0, 73320.0, 125196.0, 222056.0, 202869.0, 113317.0, 67101.0, 41307.0, 26287.0, 16689.0, 10979.0, 7136.0, 4786.0, 3237.0, 2300.0, 1517.0, 1040.0, 751.0, 474.0, 354.0, 242.0, 166.0, 118.0, 69.0, 60.0, 27.0, 14.0, 17.0, 8.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0095672607421875, -0.009267449378967285, -0.00896763801574707, -0.008667826652526855, -0.00836801528930664, -0.008068203926086426, -0.007768392562866211, -0.007468581199645996, -0.007168769836425781, -0.006868958473205566, -0.0065691471099853516, -0.006269335746765137, -0.005969524383544922, -0.005669713020324707, -0.005369901657104492, -0.005070090293884277, -0.0047702789306640625, -0.004470467567443848, -0.004170656204223633, -0.003870844841003418, -0.003571033477783203, -0.0032712221145629883, -0.0029714107513427734, -0.0026715993881225586, -0.0023717880249023438, -0.002071976661682129, -0.001772165298461914, -0.0014723539352416992, -0.0011725425720214844, -0.0008727312088012695, -0.0005729198455810547, -0.00027310848236083984, 2.6702880859375e-05, 0.00032651424407958984, 0.0006263256072998047, 0.0009261369705200195, 0.0012259483337402344, 0.0015257596969604492, 0.001825571060180664, 0.002125382423400879, 0.0024251937866210938, 0.0027250051498413086, 0.0030248165130615234, 0.0033246278762817383, 0.003624439239501953, 0.003924250602722168, 0.004224061965942383, 0.004523873329162598, 0.0048236846923828125, 0.005123496055603027, 0.005423307418823242, 0.005723118782043457, 0.006022930145263672, 0.006322741508483887, 0.0066225528717041016, 0.006922364234924316, 0.007222175598144531, 0.007521986961364746, 0.007821798324584961, 0.008121609687805176, 0.00842142105102539, 0.008721232414245605, 0.00902104377746582, 0.009320855140686035, 0.00962066650390625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 12.0, 14.0, 15.0, 23.0, 16.0, 30.0, 28.0, 28.0, 32.0, 36.0, 31.0, 37.0, 45.0, 38.0, 43.0, 40.0, 44.0, 52.0, 34.0, 37.0, 36.0, 40.0, 26.0, 22.0, 28.0, 21.0, 26.0, 17.0, 21.0, 16.0, 14.0, 11.0, 10.0, 14.0, 8.0, 6.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034656524658203125, -0.0033653974533081055, -0.0032651424407958984, -0.0031648874282836914, -0.0030646324157714844, -0.0029643774032592773, -0.0028641223907470703, -0.0027638673782348633, -0.0026636123657226562, -0.0025633573532104492, -0.002463102340698242, -0.002362847328186035, -0.002262592315673828, -0.002162337303161621, -0.002062082290649414, -0.001961827278137207, -0.001861572265625, -0.001761317253112793, -0.001661062240600586, -0.001560807228088379, -0.0014605522155761719, -0.0013602972030639648, -0.0012600421905517578, -0.0011597871780395508, -0.0010595321655273438, -0.0009592771530151367, -0.0008590221405029297, -0.0007587671279907227, -0.0006585121154785156, -0.0005582571029663086, -0.00045800209045410156, -0.00035774707794189453, -0.0002574920654296875, -0.00015723705291748047, -5.698204040527344e-05, 4.3272972106933594e-05, 0.00014352798461914062, 0.00024378299713134766, 0.0003440380096435547, 0.0004442930221557617, 0.0005445480346679688, 0.0006448030471801758, 0.0007450580596923828, 0.0008453130722045898, 0.0009455680847167969, 0.001045823097229004, 0.001146078109741211, 0.001246333122253418, 0.001346588134765625, 0.001446843147277832, 0.001547098159790039, 0.001647353172302246, 0.0017476081848144531, 0.0018478631973266602, 0.0019481182098388672, 0.0020483732223510742, 0.0021486282348632812, 0.0022488832473754883, 0.0023491382598876953, 0.0024493932723999023, 0.0025496482849121094, 0.0026499032974243164, 0.0027501583099365234, 0.0028504133224487305, 0.0029506683349609375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 13.0, 9.0, 10.0, 19.0, 22.0, 36.0, 27.0, 53.0, 54.0, 77.0, 120.0, 130.0, 181.0, 196.0, 320.0, 456.0, 594.0, 872.0, 1407.0, 2409.0, 5161.0, 13980.0, 64290.0, 834016.0, 93817.0, 16841.0, 5833.0, 2744.0, 1466.0, 961.0, 620.0, 483.0, 360.0, 208.0, 173.0, 152.0, 115.0, 79.0, 48.0, 46.0, 46.0, 39.0, 17.0, 15.0, 10.0, 8.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0015897750854492188, -0.0015409737825393677, -0.0014921724796295166, -0.0014433711767196655, -0.0013945698738098145, -0.0013457685708999634, -0.0012969672679901123, -0.0012481659650802612, -0.0011993646621704102, -0.001150563359260559, -0.001101762056350708, -0.001052960753440857, -0.0010041594505310059, -0.0009553581476211548, -0.0009065568447113037, -0.0008577555418014526, -0.0008089542388916016, -0.0007601529359817505, -0.0007113516330718994, -0.0006625503301620483, -0.0006137490272521973, -0.0005649477243423462, -0.0005161464214324951, -0.00046734511852264404, -0.00041854381561279297, -0.0003697425127029419, -0.0003209412097930908, -0.00027213990688323975, -0.00022333860397338867, -0.0001745373010635376, -0.00012573599815368652, -7.693469524383545e-05, -2.8133392333984375e-05, 2.06679105758667e-05, 6.946921348571777e-05, 0.00011827051639556885, 0.00016707181930541992, 0.000215873122215271, 0.00026467442512512207, 0.00031347572803497314, 0.0003622770309448242, 0.0004110783338546753, 0.00045987963676452637, 0.0005086809396743774, 0.0005574822425842285, 0.0006062835454940796, 0.0006550848484039307, 0.0007038861513137817, 0.0007526874542236328, 0.0008014887571334839, 0.000850290060043335, 0.000899091362953186, 0.0009478926658630371, 0.0009966939687728882, 0.0010454952716827393, 0.0010942965745925903, 0.0011430978775024414, 0.0011918991804122925, 0.0012407004833221436, 0.0012895017862319946, 0.0013383030891418457, 0.0013871043920516968, 0.0014359056949615479, 0.001484706997871399, 0.00153350830078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 2.0, 6.0, 8.0, 7.0, 7.0, 11.0, 10.0, 23.0, 27.0, 37.0, 50.0, 92.0, 120.0, 177.0, 116.0, 85.0, 55.0, 36.0, 23.0, 14.0, 20.0, 13.0, 11.0, 5.0, 9.0, 8.0, 7.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5506520867347717e-06, -1.4919787645339966e-06, -1.4333054423332214e-06, -1.3746321201324463e-06, -1.3159587979316711e-06, -1.257285475730896e-06, -1.1986121535301208e-06, -1.1399388313293457e-06, -1.0812655091285706e-06, -1.0225921869277954e-06, -9.639188647270203e-07, -9.052455425262451e-07, -8.4657222032547e-07, -7.878988981246948e-07, -7.292255759239197e-07, -6.705522537231445e-07, -6.118789315223694e-07, -5.532056093215942e-07, -4.945322871208191e-07, -4.3585896492004395e-07, -3.771856427192688e-07, -3.1851232051849365e-07, -2.598389983177185e-07, -2.0116567611694336e-07, -1.424923539161682e-07, -8.381903171539307e-08, -2.514570951461792e-08, 3.3527612686157227e-08, 9.220093488693237e-08, 1.5087425708770752e-07, 2.0954757928848267e-07, 2.682209014892578e-07, 3.2689422369003296e-07, 3.855675458908081e-07, 4.4424086809158325e-07, 5.029141902923584e-07, 5.615875124931335e-07, 6.202608346939087e-07, 6.789341568946838e-07, 7.37607479095459e-07, 7.962808012962341e-07, 8.549541234970093e-07, 9.136274456977844e-07, 9.723007678985596e-07, 1.0309740900993347e-06, 1.0896474123001099e-06, 1.148320734500885e-06, 1.2069940567016602e-06, 1.2656673789024353e-06, 1.3243407011032104e-06, 1.3830140233039856e-06, 1.4416873455047607e-06, 1.5003606677055359e-06, 1.559033989906311e-06, 1.6177073121070862e-06, 1.6763806343078613e-06, 1.7350539565086365e-06, 1.7937272787094116e-06, 1.8524006009101868e-06, 1.911073923110962e-06, 1.969747245311737e-06, 2.028420567512512e-06, 2.0870938897132874e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 4.0, 8.0, 10.0, 11.0, 14.0, 20.0, 26.0, 34.0, 53.0, 70.0, 68.0, 112.0, 141.0, 231.0, 308.0, 384.0, 558.0, 776.0, 1183.0, 1755.0, 2825.0, 4395.0, 8174.0, 17251.0, 50416.0, 677859.0, 216669.0, 33953.0, 13158.0, 6687.0, 3800.0, 2397.0, 1556.0, 1100.0, 733.0, 471.0, 356.0, 277.0, 183.0, 128.0, 92.0, 82.0, 64.0, 56.0, 25.0, 23.0, 21.0, 14.0, 11.0, 5.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014543533325195312, -0.0014113783836364746, -0.001368403434753418, -0.0013254284858703613, -0.0012824535369873047, -0.001239478588104248, -0.0011965036392211914, -0.0011535286903381348, -0.0011105537414550781, -0.0010675787925720215, -0.0010246038436889648, -0.0009816288948059082, -0.0009386539459228516, -0.0008956789970397949, -0.0008527040481567383, -0.0008097290992736816, -0.000766754150390625, -0.0007237792015075684, -0.0006808042526245117, -0.0006378293037414551, -0.0005948543548583984, -0.0005518794059753418, -0.0005089044570922852, -0.0004659295082092285, -0.0004229545593261719, -0.00037997961044311523, -0.0003370046615600586, -0.00029402971267700195, -0.0002510547637939453, -0.00020807981491088867, -0.00016510486602783203, -0.0001221299171447754, -7.915496826171875e-05, -3.618001937866211e-05, 6.794929504394531e-06, 4.976987838745117e-05, 9.274482727050781e-05, 0.00013571977615356445, 0.0001786947250366211, 0.00022166967391967773, 0.0002646446228027344, 0.000307619571685791, 0.00035059452056884766, 0.0003935694694519043, 0.00043654441833496094, 0.0004795193672180176, 0.0005224943161010742, 0.0005654692649841309, 0.0006084442138671875, 0.0006514191627502441, 0.0006943941116333008, 0.0007373690605163574, 0.0007803440093994141, 0.0008233189582824707, 0.0008662939071655273, 0.000909268856048584, 0.0009522438049316406, 0.0009952187538146973, 0.001038193702697754, 0.0010811686515808105, 0.0011241436004638672, 0.0011671185493469238, 0.0012100934982299805, 0.0012530684471130371, 0.0012960433959960938]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 5.0, 2.0, 9.0, 3.0, 11.0, 16.0, 26.0, 29.0, 51.0, 145.0, 330.0, 158.0, 65.0, 40.0, 30.0, 15.0, 9.0, 14.0, 8.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004658699035644531, -0.0004534870386123657, -0.0004411041736602783, -0.0004287213087081909, -0.0004163384437561035, -0.0004039555788040161, -0.0003915727138519287, -0.0003791898488998413, -0.0003668069839477539, -0.0003544241189956665, -0.0003420412540435791, -0.0003296583890914917, -0.0003172755241394043, -0.0003048926591873169, -0.0002925097942352295, -0.0002801269292831421, -0.0002677440643310547, -0.0002553611993789673, -0.00024297833442687988, -0.00023059546947479248, -0.00021821260452270508, -0.00020582973957061768, -0.00019344687461853027, -0.00018106400966644287, -0.00016868114471435547, -0.00015629827976226807, -0.00014391541481018066, -0.00013153254985809326, -0.00011914968490600586, -0.00010676681995391846, -9.438395500183105e-05, -8.200109004974365e-05, -6.961822509765625e-05, -5.723536014556885e-05, -4.4852495193481445e-05, -3.246963024139404e-05, -2.008676528930664e-05, -7.703900337219238e-06, 4.678964614868164e-06, 1.7061829566955566e-05, 2.944469451904297e-05, 4.182755947113037e-05, 5.4210424423217773e-05, 6.659328937530518e-05, 7.897615432739258e-05, 9.135901927947998e-05, 0.00010374188423156738, 0.00011612474918365479, 0.0001285076141357422, 0.0001408904790878296, 0.000153273344039917, 0.0001656562089920044, 0.0001780390739440918, 0.0001904219388961792, 0.0002028048038482666, 0.000215187668800354, 0.0002275705337524414, 0.0002399533987045288, 0.0002523362636566162, 0.0002647191286087036, 0.000277101993560791, 0.0002894848585128784, 0.0003018677234649658, 0.0003142505884170532, 0.0003266334533691406]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 16.0, 17.0, 21.0, 27.0, 35.0, 57.0, 66.0, 83.0, 118.0, 108.0, 104.0, 77.0, 81.0, 46.0, 37.0, 28.0, 21.0, 11.0, 9.0, 4.0, 10.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007812042720615864, -0.0075183832086622715, -0.0072247241623699665, -0.006931064650416374, -0.006637405604124069, -0.006343746092170477, -0.006050086580216885, -0.00575642753392458, -0.005462768021970987, -0.005169108510017395, -0.00487544946372509, -0.004581789951771498, -0.004288130439817905, -0.0039944713935256, -0.003700811881572008, -0.0034071526024490595, -0.003113493323326111, -0.002819834044203162, -0.0025261747650802135, -0.0022325152531266212, -0.0019388559740036726, -0.001645196694880724, -0.0013515372993424535, -0.001057877903804183, -0.0007642186246812344, -0.0004705592873506248, -0.00017689995002001524, 0.00011675938731059432, 0.0004104187246412039, 0.0007040780037641525, 0.000997737399302423, 0.0012913967948406935, 0.0015850551426410675, 0.0018787144217640162, 0.002172373700886965, 0.002466033212840557, 0.0027596924919635057, 0.0030533517710864544, 0.0033470112830400467, 0.0036406705621629953, 0.003934329841285944, 0.004227989353239536, 0.004521648399531841, 0.004815307911485434, 0.005108967423439026, 0.005402626469731331, 0.005696285981684923, 0.0059899454936385155, 0.0062836045399308205, 0.006577264051884413, 0.006870923098176718, 0.00716458261013031, 0.007458241656422615, 0.007751901168376207, 0.0080455606803298, 0.008339219726622105, 0.008632879704236984, 0.00892653875052929, 0.009220198728144169, 0.009513857774436474, 0.009807516820728779, 0.010101176798343658, 0.010394835844635963, 0.010688494890928268, 0.010982153937220573]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 8.0, 14.0, 16.0, 15.0, 18.0, 26.0, 26.0, 21.0, 31.0, 34.0, 33.0, 48.0, 46.0, 46.0, 48.0, 43.0, 36.0, 49.0, 43.0, 34.0, 37.0, 41.0, 39.0, 27.0, 25.0, 31.0, 26.0, 17.0, 9.0, 18.0, 11.0, 11.0, 13.0, 6.0, 2.0, 8.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00555018987506628, -0.0053834738209843636, -0.005216758232563734, -0.005050042178481817, -0.004883326590061188, -0.004716610535979271, -0.004549894481897354, -0.004383178427815437, -0.004216462839394808, -0.004049746785312891, -0.0038830311968922615, -0.0037163151428103447, -0.0035495993215590715, -0.0033828835003077984, -0.0032161674462258816, -0.0030494516249746084, -0.0028827358037233353, -0.002716019982472062, -0.002549304161220789, -0.002382588107138872, -0.002215872285887599, -0.002049156464636326, -0.0018824405269697309, -0.0017157245893031359, -0.0015490087680518627, -0.0013822929468005896, -0.0012155770091339946, -0.0010488610714673996, -0.0008821452502161264, -0.0007154293707571924, -0.0005487134912982583, -0.0003819975536316633, -0.00021528219804167747, -4.8566318582743406e-05, 0.00011814956087619066, 0.00028486544033512473, 0.0004515813197940588, 0.0006182971992529929, 0.0007850130787119269, 0.0009517290163785219, 0.001118444837629795, 0.0012851606588810682, 0.0014518765965476632, 0.0016185925342142582, 0.0017853083554655313, 0.0019520241767168045, 0.0021187402307987213, 0.0022854560520499945, 0.0024521718733012676, 0.0026188876945525408, 0.002785603515803814, 0.0029523195698857307, 0.003119035391137004, 0.003285751212388277, 0.003452467266470194, 0.003619183087721467, 0.00378589890897274, 0.003952614963054657, 0.0041193305514752865, 0.004286046605557203, 0.004452762193977833, 0.00461947824805975, 0.004786194302141666, 0.004952910356223583, 0.005119625944644213]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 11.0, 19.0, 30.0, 43.0, 63.0, 94.0, 145.0, 182.0, 255.0, 362.0, 481.0, 694.0, 1013.0, 1483.0, 2120.0, 3261.0, 4783.0, 7446.0, 12005.0, 19582.0, 32803.0, 56856.0, 106084.0, 224396.0, 678569.0, 1700998.0, 814604.0, 251211.0, 115040.0, 61908.0, 36351.0, 21671.0, 13681.0, 8521.0, 5743.0, 3681.0, 2509.0, 1631.0, 1146.0, 840.0, 604.0, 410.0, 289.0, 187.0, 126.0, 116.0, 57.0, 50.0, 32.0, 26.0, 23.0, 23.0, 3.0, 11.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.00630950927734375, -0.0060961246490478516, -0.005882740020751953, -0.005669355392456055, -0.005455970764160156, -0.005242586135864258, -0.005029201507568359, -0.004815816879272461, -0.0046024322509765625, -0.004389047622680664, -0.004175662994384766, -0.003962278366088867, -0.0037488937377929688, -0.0035355091094970703, -0.003322124481201172, -0.0031087398529052734, -0.002895355224609375, -0.0026819705963134766, -0.002468585968017578, -0.0022552013397216797, -0.0020418167114257812, -0.0018284320831298828, -0.0016150474548339844, -0.001401662826538086, -0.0011882781982421875, -0.0009748935699462891, -0.0007615089416503906, -0.0005481243133544922, -0.00033473968505859375, -0.00012135505676269531, 9.202957153320312e-05, 0.00030541419982910156, 0.000518798828125, 0.0007321834564208984, 0.0009455680847167969, 0.0011589527130126953, 0.0013723373413085938, 0.0015857219696044922, 0.0017991065979003906, 0.002012491226196289, 0.0022258758544921875, 0.002439260482788086, 0.0026526451110839844, 0.002866029739379883, 0.0030794143676757812, 0.0032927989959716797, 0.003506183624267578, 0.0037195682525634766, 0.003932952880859375, 0.0041463375091552734, 0.004359722137451172, 0.00457310676574707, 0.004786491394042969, 0.004999876022338867, 0.005213260650634766, 0.005426645278930664, 0.0056400299072265625, 0.005853414535522461, 0.006066799163818359, 0.006280183792114258, 0.006493568420410156, 0.006706953048706055, 0.006920337677001953, 0.0071337223052978516, 0.00734710693359375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 8.0, 5.0, 6.0, 11.0, 18.0, 19.0, 17.0, 22.0, 29.0, 28.0, 26.0, 28.0, 41.0, 41.0, 57.0, 55.0, 47.0, 45.0, 46.0, 31.0, 28.0, 48.0, 50.0, 34.0, 52.0, 35.0, 27.0, 21.0, 17.0, 18.0, 18.0, 14.0, 12.0, 9.0, 8.0, 8.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00362396240234375, -0.0035137832164764404, -0.003403604030609131, -0.0032934248447418213, -0.0031832456588745117, -0.003073066473007202, -0.0029628872871398926, -0.002852708101272583, -0.0027425289154052734, -0.002632349729537964, -0.0025221705436706543, -0.0024119913578033447, -0.002301812171936035, -0.0021916329860687256, -0.002081453800201416, -0.0019712746143341064, -0.0018610954284667969, -0.0017509162425994873, -0.0016407370567321777, -0.0015305578708648682, -0.0014203786849975586, -0.001310199499130249, -0.0012000203132629395, -0.0010898411273956299, -0.0009796619415283203, -0.0008694827556610107, -0.0007593035697937012, -0.0006491243839263916, -0.000538945198059082, -0.00042876601219177246, -0.0003185868263244629, -0.00020840764045715332, -9.822845458984375e-05, 1.195073127746582e-05, 0.0001221299171447754, 0.00023230910301208496, 0.00034248828887939453, 0.0004526674747467041, 0.0005628466606140137, 0.0006730258464813232, 0.0007832050323486328, 0.0008933842182159424, 0.001003563404083252, 0.0011137425899505615, 0.001223921775817871, 0.0013341009616851807, 0.0014442801475524902, 0.0015544593334197998, 0.0016646385192871094, 0.001774817705154419, 0.0018849968910217285, 0.001995176076889038, 0.0021053552627563477, 0.0022155344486236572, 0.002325713634490967, 0.0024358928203582764, 0.002546072006225586, 0.0026562511920928955, 0.002766430377960205, 0.0028766095638275146, 0.0029867887496948242, 0.003096967935562134, 0.0032071471214294434, 0.003317326307296753, 0.0034275054931640625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 16.0, 29.0, 33.0, 46.0, 103.0, 132.0, 230.0, 365.0, 635.0, 1122.0, 2028.0, 3806.0, 7163.0, 15163.0, 33260.0, 84485.0, 253701.0, 1014393.0, 2021932.0, 507536.0, 148302.0, 53994.0, 23242.0, 10743.0, 5305.0, 2849.0, 1557.0, 847.0, 510.0, 261.0, 181.0, 107.0, 66.0, 51.0, 30.0, 15.0, 8.0, 6.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0091705322265625, -0.008886337280273438, -0.008602142333984375, -0.008317947387695312, -0.00803375244140625, -0.0077495574951171875, -0.007465362548828125, -0.0071811676025390625, -0.00689697265625, -0.0066127777099609375, -0.006328582763671875, -0.0060443878173828125, -0.00576019287109375, -0.0054759979248046875, -0.005191802978515625, -0.0049076080322265625, -0.0046234130859375, -0.0043392181396484375, -0.004055023193359375, -0.0037708282470703125, -0.00348663330078125, -0.0032024383544921875, -0.002918243408203125, -0.0026340484619140625, -0.002349853515625, -0.0020656585693359375, -0.001781463623046875, -0.0014972686767578125, -0.00121307373046875, -0.0009288787841796875, -0.000644683837890625, -0.0003604888916015625, -7.62939453125e-05, 0.0002079010009765625, 0.000492095947265625, 0.0007762908935546875, 0.00106048583984375, 0.0013446807861328125, 0.001628875732421875, 0.0019130706787109375, 0.002197265625, 0.0024814605712890625, 0.002765655517578125, 0.0030498504638671875, 0.00333404541015625, 0.0036182403564453125, 0.003902435302734375, 0.0041866302490234375, 0.0044708251953125, 0.0047550201416015625, 0.005039215087890625, 0.0053234100341796875, 0.00560760498046875, 0.0058917999267578125, 0.006175994873046875, 0.0064601898193359375, 0.006744384765625, 0.0070285797119140625, 0.007312774658203125, 0.0075969696044921875, 0.00788116455078125, 0.008165359497070312, 0.008449554443359375, 0.008733749389648438, 0.0090179443359375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 12.0, 12.0, 13.0, 21.0, 20.0, 21.0, 44.0, 65.0, 66.0, 91.0, 108.0, 132.0, 156.0, 189.0, 234.0, 282.0, 363.0, 385.0, 372.0, 260.0, 260.0, 181.0, 149.0, 138.0, 106.0, 71.0, 71.0, 57.0, 46.0, 19.0, 25.0, 30.0, 12.0, 12.0, 8.0, 5.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016937255859375, -0.00163191556930542, -0.0015701055526733398, -0.0015082955360412598, -0.0014464855194091797, -0.0013846755027770996, -0.0013228654861450195, -0.0012610554695129395, -0.0011992454528808594, -0.0011374354362487793, -0.0010756254196166992, -0.0010138154029846191, -0.0009520053863525391, -0.000890195369720459, -0.0008283853530883789, -0.0007665753364562988, -0.0007047653198242188, -0.0006429553031921387, -0.0005811452865600586, -0.0005193352699279785, -0.00045752525329589844, -0.00039571523666381836, -0.0003339052200317383, -0.0002720952033996582, -0.00021028518676757812, -0.00014847517013549805, -8.666515350341797e-05, -2.485513687133789e-05, 3.695487976074219e-05, 9.876489639282227e-05, 0.00016057491302490234, 0.00022238492965698242, 0.0002841949462890625, 0.0003460049629211426, 0.00040781497955322266, 0.00046962499618530273, 0.0005314350128173828, 0.0005932450294494629, 0.000655055046081543, 0.000716865062713623, 0.0007786750793457031, 0.0008404850959777832, 0.0009022951126098633, 0.0009641051292419434, 0.0010259151458740234, 0.0010877251625061035, 0.0011495351791381836, 0.0012113451957702637, 0.0012731552124023438, 0.0013349652290344238, 0.001396775245666504, 0.001458585262298584, 0.001520395278930664, 0.0015822052955627441, 0.0016440153121948242, 0.0017058253288269043, 0.0017676353454589844, 0.0018294453620910645, 0.0018912553787231445, 0.0019530653953552246, 0.0020148754119873047, 0.0020766854286193848, 0.002138495445251465, 0.002200305461883545, 0.002262115478515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 18.0, 6.0, 12.0, 14.0, 21.0, 21.0, 30.0, 45.0, 46.0, 55.0, 88.0, 94.0, 100.0, 86.0, 65.0, 55.0, 40.0, 39.0, 19.0, 21.0, 26.0, 16.0, 15.0, 9.0, 4.0, 5.0, 4.0, 3.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.003964461386203766, -0.0038198456168174744, -0.003675229847431183, -0.0035306140780448914, -0.0033859983086586, -0.0032413825392723083, -0.003096766769886017, -0.0029521510004997253, -0.002807535231113434, -0.0026629194617271423, -0.002518303692340851, -0.0023736879229545593, -0.002229072153568268, -0.0020844563841819763, -0.0019398406147956848, -0.0017952248454093933, -0.0016506090760231018, -0.0015059933066368103, -0.0013613775372505188, -0.0012167617678642273, -0.0010721459984779358, -0.0009275302290916443, -0.0007829144597053528, -0.0006382986903190613, -0.0004936829209327698, -0.00034906715154647827, -0.00020445138216018677, -5.9835612773895264e-05, 8.478015661239624e-05, 0.00022939592599868774, 0.00037401169538497925, 0.0005186274647712708, 0.0006632436998188496, 0.0008078594692051411, 0.0009524752385914326, 0.001097091007977724, 0.0012417067773640156, 0.001386322546750307, 0.0015309383161365986, 0.00167555408552289, 0.0018201698549091816, 0.001964785624295473, 0.0021094013936817646, 0.002254017163068056, 0.0023986329324543476, 0.002543248701840639, 0.0026878644712269306, 0.002832480240613222, 0.0029770960099995136, 0.003121711779385805, 0.0032663275487720966, 0.003410943318158388, 0.0035555590875446796, 0.003700174856930971, 0.0038447906263172626, 0.003989406395703554, 0.004134022165089846, 0.004278637934476137, 0.004423253703862429, 0.00456786947324872, 0.004712485242635012, 0.004857101012021303, 0.005001716781407595, 0.005146332550793886, 0.005290948320180178]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 8.0, 8.0, 8.0, 8.0, 6.0, 6.0, 7.0, 14.0, 14.0, 25.0, 24.0, 19.0, 23.0, 23.0, 25.0, 34.0, 36.0, 34.0, 38.0, 34.0, 36.0, 43.0, 45.0, 34.0, 38.0, 46.0, 42.0, 28.0, 38.0, 33.0, 26.0, 20.0, 30.0, 17.0, 15.0, 16.0, 13.0, 10.0, 12.0, 11.0, 10.0, 9.0, 8.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.0031083417125046253, -0.0030097756534814835, -0.0029112095944583416, -0.0028126435354351997, -0.002714077476412058, -0.002615511417388916, -0.0025169451255351305, -0.0024183790665119886, -0.0023198130074888468, -0.002221246948465705, -0.002122680889442563, -0.002024114830419421, -0.0019255486549809575, -0.0018269825959578156, -0.001728416420519352, -0.00162985036149621, -0.0015312843024730682, -0.0014327182434499264, -0.0013341521844267845, -0.0012355860089883208, -0.001137019949965179, -0.001038453890942037, -0.0009398877737112343, -0.0008413216564804316, -0.0007427555974572897, -0.0006441895384341478, -0.0005456234212033451, -0.00044705733307637274, -0.0003484912449494004, -0.00024992518592625856, -0.0001513590686954558, -5.2792951464653015e-05, 4.5773107558488846e-05, 0.00014433919568546116, 0.00024290528381243348, 0.0003414713719394058, 0.0004400374600663781, 0.00053860351908952, 0.0006371696363203228, 0.0007357357535511255, 0.0008343018125742674, 0.0009328678715974092, 0.0010314339306205511, 0.0011300001060590148, 0.0012285661650821567, 0.0013271322241052985, 0.0014256983995437622, 0.001524264458566904, 0.001622830517590046, 0.0017213965766131878, 0.0018199626356363297, 0.0019185288110747933, 0.0020170947536826134, 0.0021156608127057552, 0.0022142271045595407, 0.0023127931635826826, 0.0024113592226058245, 0.0025099252816289663, 0.002608491340652108, 0.00270705739967525, 0.0028056236915290356, 0.0029041897505521774, 0.0030027558095753193, 0.003101321868598461, 0.003199887927621603]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 13.0, 23.0, 22.0, 31.0, 43.0, 73.0, 134.0, 164.0, 301.0, 451.0, 793.0, 1325.0, 2499.0, 4916.0, 10191.0, 24696.0, 79348.0, 490492.0, 332932.0, 61095.0, 20645.0, 8843.0, 4182.0, 2268.0, 1167.0, 698.0, 434.0, 249.0, 187.0, 106.0, 66.0, 44.0, 27.0, 24.0, 14.0, 9.0, 11.0, 10.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00457000732421875, -0.004422128200531006, -0.004274249076843262, -0.004126369953155518, -0.0039784908294677734, -0.0038306117057800293, -0.003682732582092285, -0.003534853458404541, -0.003386974334716797, -0.0032390952110290527, -0.0030912160873413086, -0.0029433369636535645, -0.0027954578399658203, -0.002647578716278076, -0.002499699592590332, -0.002351820468902588, -0.0022039413452148438, -0.0020560622215270996, -0.0019081830978393555, -0.0017603039741516113, -0.0016124248504638672, -0.001464545726776123, -0.001316666603088379, -0.0011687874794006348, -0.0010209083557128906, -0.0008730292320251465, -0.0007251501083374023, -0.0005772709846496582, -0.00042939186096191406, -0.0002815127372741699, -0.00013363361358642578, 1.424551010131836e-05, 0.0001621246337890625, 0.00031000375747680664, 0.0004578828811645508, 0.0006057620048522949, 0.0007536411285400391, 0.0009015202522277832, 0.0010493993759155273, 0.0011972784996032715, 0.0013451576232910156, 0.0014930367469787598, 0.001640915870666504, 0.001788794994354248, 0.0019366741180419922, 0.0020845532417297363, 0.0022324323654174805, 0.0023803114891052246, 0.0025281906127929688, 0.002676069736480713, 0.002823948860168457, 0.002971827983856201, 0.0031197071075439453, 0.0032675862312316895, 0.0034154653549194336, 0.0035633444786071777, 0.003711223602294922, 0.003859102725982666, 0.00400698184967041, 0.004154860973358154, 0.0043027400970458984, 0.004450619220733643, 0.004598498344421387, 0.004746377468109131, 0.004894256591796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 6.0, 6.0, 11.0, 6.0, 9.0, 7.0, 27.0, 15.0, 26.0, 23.0, 22.0, 19.0, 34.0, 34.0, 37.0, 42.0, 48.0, 40.0, 42.0, 40.0, 41.0, 57.0, 37.0, 36.0, 36.0, 32.0, 35.0, 29.0, 22.0, 18.0, 15.0, 22.0, 15.0, 13.0, 8.0, 11.0, 18.0, 9.0, 12.0, 2.0, 12.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.003513336181640625, -0.003403306007385254, -0.003293275833129883, -0.0031832456588745117, -0.0030732154846191406, -0.0029631853103637695, -0.0028531551361083984, -0.0027431249618530273, -0.0026330947875976562, -0.002523064613342285, -0.002413034439086914, -0.002303004264831543, -0.002192974090576172, -0.0020829439163208008, -0.0019729137420654297, -0.0018628835678100586, -0.0017528533935546875, -0.0016428232192993164, -0.0015327930450439453, -0.0014227628707885742, -0.0013127326965332031, -0.001202702522277832, -0.001092672348022461, -0.0009826421737670898, -0.0008726119995117188, -0.0007625818252563477, -0.0006525516510009766, -0.0005425214767456055, -0.0004324913024902344, -0.0003224611282348633, -0.0002124309539794922, -0.0001024007797241211, 7.62939453125e-06, 0.0001176595687866211, 0.0002276897430419922, 0.0003377199172973633, 0.0004477500915527344, 0.0005577802658081055, 0.0006678104400634766, 0.0007778406143188477, 0.0008878707885742188, 0.0009979009628295898, 0.001107931137084961, 0.001217961311340332, 0.0013279914855957031, 0.0014380216598510742, 0.0015480518341064453, 0.0016580820083618164, 0.0017681121826171875, 0.0018781423568725586, 0.0019881725311279297, 0.0020982027053833008, 0.002208232879638672, 0.002318263053894043, 0.002428293228149414, 0.002538323402404785, 0.0026483535766601562, 0.0027583837509155273, 0.0028684139251708984, 0.0029784440994262695, 0.0030884742736816406, 0.0031985044479370117, 0.003308534622192383, 0.003418564796447754, 0.003528594970703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 10.0, 15.0, 17.0, 28.0, 24.0, 35.0, 52.0, 71.0, 90.0, 106.0, 182.0, 233.0, 274.0, 461.0, 668.0, 1013.0, 1659.0, 2898.0, 5302.0, 11764.0, 39399.0, 531727.0, 393518.0, 35376.0, 10960.0, 5097.0, 2769.0, 1614.0, 987.0, 661.0, 416.0, 311.0, 195.0, 163.0, 100.0, 81.0, 64.0, 40.0, 36.0, 36.0, 27.0, 14.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.005641937255859375, -0.005459725856781006, -0.005277514457702637, -0.005095303058624268, -0.0049130916595458984, -0.004730880260467529, -0.00454866886138916, -0.004366457462310791, -0.004184246063232422, -0.004002034664154053, -0.0038198232650756836, -0.0036376118659973145, -0.0034554004669189453, -0.003273189067840576, -0.003090977668762207, -0.002908766269683838, -0.0027265548706054688, -0.0025443434715270996, -0.0023621320724487305, -0.0021799206733703613, -0.001997709274291992, -0.001815497875213623, -0.001633286476135254, -0.0014510750770568848, -0.0012688636779785156, -0.0010866522789001465, -0.0009044408798217773, -0.0007222294807434082, -0.0005400180816650391, -0.0003578066825866699, -0.00017559528350830078, 6.616115570068359e-06, 0.0001888275146484375, 0.00037103891372680664, 0.0005532503128051758, 0.0007354617118835449, 0.0009176731109619141, 0.0010998845100402832, 0.0012820959091186523, 0.0014643073081970215, 0.0016465187072753906, 0.0018287301063537598, 0.002010941505432129, 0.002193152904510498, 0.002375364303588867, 0.0025575757026672363, 0.0027397871017456055, 0.0029219985008239746, 0.0031042098999023438, 0.003286421298980713, 0.003468632698059082, 0.003650844097137451, 0.0038330554962158203, 0.0040152668952941895, 0.004197478294372559, 0.004379689693450928, 0.004561901092529297, 0.004744112491607666, 0.004926323890686035, 0.005108535289764404, 0.0052907466888427734, 0.005472958087921143, 0.005655169486999512, 0.005837380886077881, 0.00601959228515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 9.0, 8.0, 18.0, 15.0, 13.0, 23.0, 27.0, 33.0, 24.0, 51.0, 31.0, 34.0, 36.0, 40.0, 43.0, 47.0, 46.0, 41.0, 43.0, 30.0, 46.0, 45.0, 45.0, 32.0, 22.0, 22.0, 27.0, 25.0, 23.0, 24.0, 10.0, 9.0, 6.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0028629302978515625, -0.002786785364151001, -0.0027106404304504395, -0.002634495496749878, -0.0025583505630493164, -0.002482205629348755, -0.0024060606956481934, -0.002329915761947632, -0.0022537708282470703, -0.002177625894546509, -0.0021014809608459473, -0.0020253360271453857, -0.0019491910934448242, -0.0018730461597442627, -0.0017969012260437012, -0.0017207562923431396, -0.0016446113586425781, -0.0015684664249420166, -0.001492321491241455, -0.0014161765575408936, -0.001340031623840332, -0.0012638866901397705, -0.001187741756439209, -0.0011115968227386475, -0.001035451889038086, -0.0009593069553375244, -0.0008831620216369629, -0.0008070170879364014, -0.0007308721542358398, -0.0006547272205352783, -0.0005785822868347168, -0.0005024373531341553, -0.00042629241943359375, -0.0003501474857330322, -0.0002740025520324707, -0.00019785761833190918, -0.00012171268463134766, -4.556775093078613e-05, 3.057718276977539e-05, 0.00010672211647033691, 0.00018286705017089844, 0.00025901198387145996, 0.0003351569175720215, 0.000411301851272583, 0.00048744678497314453, 0.0005635917186737061, 0.0006397366523742676, 0.0007158815860748291, 0.0007920265197753906, 0.0008681714534759521, 0.0009443163871765137, 0.0010204613208770752, 0.0010966062545776367, 0.0011727511882781982, 0.0012488961219787598, 0.0013250410556793213, 0.0014011859893798828, 0.0014773309230804443, 0.0015534758567810059, 0.0016296207904815674, 0.001705765724182129, 0.0017819106578826904, 0.001858055591583252, 0.0019342005252838135, 0.002010345458984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 5.0, 13.0, 9.0, 18.0, 22.0, 18.0, 36.0, 56.0, 79.0, 94.0, 141.0, 188.0, 257.0, 405.0, 584.0, 972.0, 1650.0, 2924.0, 5727.0, 12982.0, 45307.0, 780713.0, 154418.0, 23425.0, 8442.0, 4090.0, 2260.0, 1279.0, 794.0, 535.0, 316.0, 220.0, 153.0, 123.0, 80.0, 47.0, 55.0, 28.0, 25.0, 15.0, 14.0, 8.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0009050369262695312, -0.000875622034072876, -0.0008462071418762207, -0.0008167922496795654, -0.0007873773574829102, -0.0007579624652862549, -0.0007285475730895996, -0.0006991326808929443, -0.0006697177886962891, -0.0006403028964996338, -0.0006108880043029785, -0.0005814731121063232, -0.000552058219909668, -0.0005226433277130127, -0.0004932284355163574, -0.00046381354331970215, -0.0004343986511230469, -0.0004049837589263916, -0.00037556886672973633, -0.00034615397453308105, -0.0003167390823364258, -0.0002873241901397705, -0.00025790929794311523, -0.00022849440574645996, -0.0001990795135498047, -0.00016966462135314941, -0.00014024972915649414, -0.00011083483695983887, -8.14199447631836e-05, -5.200505256652832e-05, -2.2590160369873047e-05, 6.8247318267822266e-06, 3.62396240234375e-05, 6.565451622009277e-05, 9.506940841674805e-05, 0.00012448430061340332, 0.0001538991928100586, 0.00018331408500671387, 0.00021272897720336914, 0.00024214386940002441, 0.0002715587615966797, 0.00030097365379333496, 0.00033038854598999023, 0.0003598034381866455, 0.0003892183303833008, 0.00041863322257995605, 0.00044804811477661133, 0.0004774630069732666, 0.0005068778991699219, 0.0005362927913665771, 0.0005657076835632324, 0.0005951225757598877, 0.000624537467956543, 0.0006539523601531982, 0.0006833672523498535, 0.0007127821445465088, 0.0007421970367431641, 0.0007716119289398193, 0.0008010268211364746, 0.0008304417133331299, 0.0008598566055297852, 0.0008892714977264404, 0.0009186863899230957, 0.000948101282119751, 0.0009775161743164062]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 18.0, 11.0, 11.0, 14.0, 37.0, 25.0, 32.0, 36.0, 75.0, 30.0, 58.0, 43.0, 104.0, 57.0, 54.0, 97.0, 35.0, 37.0, 28.0, 54.0, 22.0, 14.0, 13.0, 22.0, 8.0, 7.0, 6.0, 10.0, 1.0, 4.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-06, -2.2491440176963806e-06, -2.173706889152527e-06, -2.098269760608673e-06, -2.0228326320648193e-06, -1.9473955035209656e-06, -1.8719583749771118e-06, -1.796521246433258e-06, -1.7210841178894043e-06, -1.6456469893455505e-06, -1.5702098608016968e-06, -1.494772732257843e-06, -1.4193356037139893e-06, -1.3438984751701355e-06, -1.2684613466262817e-06, -1.193024218082428e-06, -1.1175870895385742e-06, -1.0421499609947205e-06, -9.667128324508667e-07, -8.912757039070129e-07, -8.158385753631592e-07, -7.404014468193054e-07, -6.649643182754517e-07, -5.895271897315979e-07, -5.140900611877441e-07, -4.386529326438904e-07, -3.632158041000366e-07, -2.8777867555618286e-07, -2.123415470123291e-07, -1.3690441846847534e-07, -6.146728992462158e-08, 1.3969838619232178e-08, 8.940696716308594e-08, 1.648440957069397e-07, 2.4028122425079346e-07, 3.157183527946472e-07, 3.91155481338501e-07, 4.6659260988235474e-07, 5.420297384262085e-07, 6.174668669700623e-07, 6.92903995513916e-07, 7.683411240577698e-07, 8.437782526016235e-07, 9.192153811454773e-07, 9.94652509689331e-07, 1.0700896382331848e-06, 1.1455267667770386e-06, 1.2209638953208923e-06, 1.296401023864746e-06, 1.3718381524085999e-06, 1.4472752809524536e-06, 1.5227124094963074e-06, 1.5981495380401611e-06, 1.6735866665840149e-06, 1.7490237951278687e-06, 1.8244609236717224e-06, 1.8998980522155762e-06, 1.97533518075943e-06, 2.0507723093032837e-06, 2.1262094378471375e-06, 2.201646566390991e-06, 2.277083694934845e-06, 2.3525208234786987e-06, 2.4279579520225525e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 7.0, 18.0, 26.0, 27.0, 50.0, 59.0, 94.0, 137.0, 203.0, 308.0, 545.0, 875.0, 1527.0, 2504.0, 4507.0, 8427.0, 17190.0, 41192.0, 141639.0, 605703.0, 145183.0, 41571.0, 17204.0, 8458.0, 4602.0, 2622.0, 1443.0, 903.0, 530.0, 322.0, 231.0, 125.0, 98.0, 68.0, 40.0, 27.0, 23.0, 12.0, 11.0, 9.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012159347534179688, -0.0011773407459259033, -0.0011387467384338379, -0.0011001527309417725, -0.001061558723449707, -0.0010229647159576416, -0.0009843707084655762, -0.0009457767009735107, -0.0009071826934814453, -0.0008685886859893799, -0.0008299946784973145, -0.000791400671005249, -0.0007528066635131836, -0.0007142126560211182, -0.0006756186485290527, -0.0006370246410369873, -0.0005984306335449219, -0.0005598366260528564, -0.000521242618560791, -0.0004826486110687256, -0.00044405460357666016, -0.0004054605960845947, -0.0003668665885925293, -0.00032827258110046387, -0.00028967857360839844, -0.000251084566116333, -0.00021249055862426758, -0.00017389655113220215, -0.00013530254364013672, -9.670853614807129e-05, -5.811452865600586e-05, -1.952052116394043e-05, 1.9073486328125e-05, 5.766749382019043e-05, 9.626150131225586e-05, 0.0001348555088043213, 0.00017344951629638672, 0.00021204352378845215, 0.0002506375312805176, 0.000289231538772583, 0.00032782554626464844, 0.00036641955375671387, 0.0004050135612487793, 0.0004436075687408447, 0.00048220157623291016, 0.0005207955837249756, 0.000559389591217041, 0.0005979835987091064, 0.0006365776062011719, 0.0006751716136932373, 0.0007137656211853027, 0.0007523596286773682, 0.0007909536361694336, 0.000829547643661499, 0.0008681416511535645, 0.0009067356586456299, 0.0009453296661376953, 0.0009839236736297607, 0.0010225176811218262, 0.0010611116886138916, 0.001099705696105957, 0.0011382997035980225, 0.0011768937110900879, 0.0012154877185821533, 0.0012540817260742188]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 8.0, 5.0, 9.0, 3.0, 10.0, 16.0, 17.0, 27.0, 46.0, 51.0, 86.0, 141.0, 213.0, 138.0, 65.0, 54.0, 29.0, 15.0, 11.0, 5.0, 4.0, 5.0, 5.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004067420959472656, -0.00039487332105636597, -0.0003830045461654663, -0.00037113577127456665, -0.000359266996383667, -0.00034739822149276733, -0.0003355294466018677, -0.000323660671710968, -0.00031179189682006836, -0.0002999231219291687, -0.00028805434703826904, -0.0002761855721473694, -0.0002643167972564697, -0.00025244802236557007, -0.0002405792474746704, -0.00022871047258377075, -0.0002168416976928711, -0.00020497292280197144, -0.00019310414791107178, -0.00018123537302017212, -0.00016936659812927246, -0.0001574978232383728, -0.00014562904834747314, -0.00013376027345657349, -0.00012189149856567383, -0.00011002272367477417, -9.815394878387451e-05, -8.628517389297485e-05, -7.44163990020752e-05, -6.254762411117554e-05, -5.067884922027588e-05, -3.881007432937622e-05, -2.6941299438476562e-05, -1.5072524547576904e-05, -3.203749656677246e-06, 8.665025234222412e-06, 2.053380012512207e-05, 3.240257501602173e-05, 4.427134990692139e-05, 5.6140124797821045e-05, 6.80088996887207e-05, 7.987767457962036e-05, 9.174644947052002e-05, 0.00010361522436141968, 0.00011548399925231934, 0.000127352774143219, 0.00013922154903411865, 0.0001510903239250183, 0.00016295909881591797, 0.00017482787370681763, 0.00018669664859771729, 0.00019856542348861694, 0.0002104341983795166, 0.00022230297327041626, 0.00023417174816131592, 0.0002460405230522156, 0.00025790929794311523, 0.0002697780728340149, 0.00028164684772491455, 0.0002935156226158142, 0.00030538439750671387, 0.0003172531723976135, 0.0003291219472885132, 0.00034099072217941284, 0.0003528594970703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 5.0, 9.0, 6.0, 9.0, 9.0, 14.0, 28.0, 22.0, 28.0, 38.0, 67.0, 65.0, 78.0, 104.0, 102.0, 72.0, 66.0, 52.0, 50.0, 22.0, 27.0, 30.0, 29.0, 8.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.004126824904233217, -0.003975533880293369, -0.0038242428563535213, -0.0036729518324136734, -0.0035216608084738255, -0.0033703697845339775, -0.003219078527763486, -0.003067787503823638, -0.00291649647988379, -0.002765205455943942, -0.002613914432004094, -0.002462623408064246, -0.0023113321512937546, -0.0021600411273539066, -0.0020087501034140587, -0.0018574590794742107, -0.0017061680555343628, -0.0015548770315945148, -0.001403586007654667, -0.0012522948672994971, -0.0011010038433596492, -0.0009497128194198012, -0.0007984217372722924, -0.0006471306551247835, -0.0004958396311849356, -0.00034454857814125717, -0.00019325752509757876, -4.196647205390036e-05, 0.00010932458098977804, 0.000260615604929626, 0.00041190668707713485, 0.0005631977692246437, 0.000714489258825779, 0.0008657802827656269, 0.0010170713067054749, 0.0011683624470606446, 0.0013196534710004926, 0.0014709444949403405, 0.0016222356352955103, 0.0017735266592353582, 0.0019248176831752062, 0.002076108707115054, 0.002227399731054902, 0.00237869075499475, 0.0025299820117652416, 0.0026812730357050896, 0.0028325640596449375, 0.0029838550835847855, 0.0031351461075246334, 0.0032864371314644814, 0.0034377281554043293, 0.0035890191793441772, 0.003740310203284025, 0.003891601227223873, 0.004042892251163721, 0.004194183275103569, 0.004345474764704704, 0.004496765788644552, 0.0046480568125844, 0.004799347836524248, 0.004950638860464096, 0.005101929884403944, 0.005253220908343792, 0.005404512397944927, 0.005555802956223488]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 7.0, 6.0, 9.0, 7.0, 4.0, 15.0, 29.0, 18.0, 18.0, 24.0, 16.0, 25.0, 36.0, 34.0, 31.0, 37.0, 33.0, 38.0, 38.0, 46.0, 37.0, 36.0, 44.0, 38.0, 39.0, 30.0, 50.0, 23.0, 25.0, 18.0, 23.0, 26.0, 9.0, 15.0, 17.0, 10.0, 15.0, 7.0, 9.0, 9.0, 3.0, 5.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.0031068657990545034, -0.003007764695212245, -0.0029086635913699865, -0.0028095622546970844, -0.002710461150854826, -0.0026113600470125675, -0.002512258943170309, -0.0024131578393280506, -0.002314056735485792, -0.0022149556316435337, -0.0021158545278012753, -0.002016753423959017, -0.0019176520872861147, -0.0018185509834438562, -0.0017194498796015978, -0.0016203487757593393, -0.0015212474390864372, -0.0014221463352441788, -0.0013230451149865985, -0.00122394401114434, -0.0011248427908867598, -0.0010257416870445013, -0.0009266405832022429, -0.0008275394211523235, -0.0007284382591024041, -0.0006293370970524848, -0.0005302359350025654, -0.00043113483116030693, -0.00033203366911038756, -0.0002329325070604682, -0.00013383140321820974, -3.473024116829038e-05, 6.437068805098534e-05, 0.00016347183554898947, 0.0002625729830469936, 0.0003616741159930825, 0.0004607752780430019, 0.0005598764400929213, 0.0006589775439351797, 0.0007580787059850991, 0.0008571798680350184, 0.0009562810300849378, 0.0010553821921348572, 0.0011544832959771156, 0.001253584399819374, 0.0013526856200769544, 0.0014517867239192128, 0.001550887944176793, 0.0016499890480190516, 0.00174909015186131, 0.0018481913721188903, 0.0019472924759611487, 0.002046393696218729, 0.0021454948000609875, 0.002244595903903246, 0.0023436970077455044, 0.002442798111587763, 0.0025418992154300213, 0.0026410003192722797, 0.002740101423114538, 0.0028392027597874403, 0.0029383038636296988, 0.003037404967471957, 0.0031365060713142157, 0.0032356074079871178]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 18.0, 14.0, 29.0, 34.0, 65.0, 80.0, 118.0, 173.0, 225.0, 353.0, 515.0, 684.0, 1013.0, 1449.0, 2160.0, 3283.0, 4915.0, 7532.0, 11861.0, 19055.0, 31434.0, 52649.0, 93591.0, 171239.0, 248007.0, 169350.0, 92562.0, 52111.0, 30950.0, 18898.0, 11676.0, 7444.0, 4924.0, 3171.0, 2171.0, 1480.0, 1058.0, 691.0, 466.0, 308.0, 240.0, 180.0, 104.0, 95.0, 54.0, 36.0, 23.0, 24.0, 15.0, 5.0, 11.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.006862640380859375, -0.006657719612121582, -0.006452798843383789, -0.006247878074645996, -0.006042957305908203, -0.00583803653717041, -0.005633115768432617, -0.005428194999694824, -0.005223274230957031, -0.005018353462219238, -0.004813432693481445, -0.004608511924743652, -0.004403591156005859, -0.004198670387268066, -0.0039937496185302734, -0.0037888288497924805, -0.0035839080810546875, -0.0033789873123168945, -0.0031740665435791016, -0.0029691457748413086, -0.0027642250061035156, -0.0025593042373657227, -0.0023543834686279297, -0.0021494626998901367, -0.0019445419311523438, -0.0017396211624145508, -0.0015347003936767578, -0.0013297796249389648, -0.0011248588562011719, -0.0009199380874633789, -0.0007150173187255859, -0.000510096549987793, -0.00030517578125, -0.00010025501251220703, 0.00010466575622558594, 0.0003095865249633789, 0.0005145072937011719, 0.0007194280624389648, 0.0009243488311767578, 0.0011292695999145508, 0.0013341903686523438, 0.0015391111373901367, 0.0017440319061279297, 0.0019489526748657227, 0.0021538734436035156, 0.0023587942123413086, 0.0025637149810791016, 0.0027686357498168945, 0.0029735565185546875, 0.0031784772872924805, 0.0033833980560302734, 0.0035883188247680664, 0.0037932395935058594, 0.003998160362243652, 0.004203081130981445, 0.004408001899719238, 0.004612922668457031, 0.004817843437194824, 0.005022764205932617, 0.00522768497467041, 0.005432605743408203, 0.005637526512145996, 0.005842447280883789, 0.006047368049621582, 0.006252288818359375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 2.0, 7.0, 7.0, 9.0, 14.0, 18.0, 15.0, 24.0, 22.0, 22.0, 27.0, 26.0, 35.0, 27.0, 39.0, 25.0, 39.0, 50.0, 33.0, 50.0, 46.0, 53.0, 42.0, 49.0, 39.0, 30.0, 31.0, 25.0, 24.0, 17.0, 26.0, 13.0, 18.0, 16.0, 8.0, 11.0, 11.0, 7.0, 7.0, 3.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.003086090087890625, -0.002991616725921631, -0.0028971433639526367, -0.0028026700019836426, -0.0027081966400146484, -0.0026137232780456543, -0.00251924991607666, -0.002424776554107666, -0.002330303192138672, -0.0022358298301696777, -0.0021413564682006836, -0.0020468831062316895, -0.0019524097442626953, -0.0018579363822937012, -0.001763463020324707, -0.0016689896583557129, -0.0015745162963867188, -0.0014800429344177246, -0.0013855695724487305, -0.0012910962104797363, -0.0011966228485107422, -0.001102149486541748, -0.001007676124572754, -0.0009132027626037598, -0.0008187294006347656, -0.0007242560386657715, -0.0006297826766967773, -0.0005353093147277832, -0.00044083595275878906, -0.0003463625907897949, -0.0002518892288208008, -0.00015741586685180664, -6.29425048828125e-05, 3.153085708618164e-05, 0.00012600421905517578, 0.00022047758102416992, 0.00031495094299316406, 0.0004094243049621582, 0.0005038976669311523, 0.0005983710289001465, 0.0006928443908691406, 0.0007873177528381348, 0.0008817911148071289, 0.000976264476776123, 0.0010707378387451172, 0.0011652112007141113, 0.0012596845626831055, 0.0013541579246520996, 0.0014486312866210938, 0.0015431046485900879, 0.001637578010559082, 0.0017320513725280762, 0.0018265247344970703, 0.0019209980964660645, 0.0020154714584350586, 0.0021099448204040527, 0.002204418182373047, 0.002298891544342041, 0.002393364906311035, 0.0024878382682800293, 0.0025823116302490234, 0.0026767849922180176, 0.0027712583541870117, 0.002865731716156006, 0.002960205078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 12.0, 16.0, 6.0, 23.0, 24.0, 46.0, 53.0, 62.0, 109.0, 157.0, 202.0, 302.0, 448.0, 649.0, 1051.0, 1586.0, 2500.0, 3769.0, 5866.0, 9335.0, 15184.0, 25315.0, 43026.0, 76624.0, 143393.0, 246883.0, 208672.0, 112260.0, 61158.0, 34548.0, 20819.0, 12561.0, 7703.0, 4875.0, 3069.0, 2081.0, 1370.0, 868.0, 564.0, 413.0, 270.0, 218.0, 155.0, 92.0, 64.0, 53.0, 29.0, 23.0, 13.0, 11.0, 12.0, 8.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006855010986328125, -0.0066394805908203125, -0.0064239501953125, -0.0062084197998046875, -0.005992889404296875, -0.0057773590087890625, -0.00556182861328125, -0.0053462982177734375, -0.005130767822265625, -0.0049152374267578125, -0.00469970703125, -0.0044841766357421875, -0.004268646240234375, -0.0040531158447265625, -0.00383758544921875, -0.0036220550537109375, -0.003406524658203125, -0.0031909942626953125, -0.0029754638671875, -0.0027599334716796875, -0.002544403076171875, -0.0023288726806640625, -0.00211334228515625, -0.0018978118896484375, -0.001682281494140625, -0.0014667510986328125, -0.001251220703125, -0.0010356903076171875, -0.000820159912109375, -0.0006046295166015625, -0.00038909912109375, -0.0001735687255859375, 4.1961669921875e-05, 0.0002574920654296875, 0.0004730224609375, 0.0006885528564453125, 0.000904083251953125, 0.0011196136474609375, 0.00133514404296875, 0.0015506744384765625, 0.001766204833984375, 0.0019817352294921875, 0.002197265625, 0.0024127960205078125, 0.002628326416015625, 0.0028438568115234375, 0.00305938720703125, 0.0032749176025390625, 0.003490447998046875, 0.0037059783935546875, 0.0039215087890625, 0.0041370391845703125, 0.004352569580078125, 0.0045680999755859375, 0.00478363037109375, 0.0049991607666015625, 0.005214691162109375, 0.0054302215576171875, 0.005645751953125, 0.0058612823486328125, 0.006076812744140625, 0.0062923431396484375, 0.00650787353515625, 0.0067234039306640625, 0.006938934326171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 7.0, 5.0, 7.0, 12.0, 13.0, 12.0, 14.0, 16.0, 15.0, 26.0, 23.0, 23.0, 24.0, 35.0, 33.0, 42.0, 35.0, 49.0, 42.0, 48.0, 40.0, 36.0, 44.0, 46.0, 50.0, 43.0, 31.0, 26.0, 22.0, 24.0, 28.0, 33.0, 22.0, 12.0, 9.0, 11.0, 10.0, 7.0, 8.0, 7.0, 3.0, 0.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017499923706054688, -0.0016845911741256714, -0.001619189977645874, -0.0015537887811660767, -0.0014883875846862793, -0.001422986388206482, -0.0013575851917266846, -0.0012921839952468872, -0.0012267827987670898, -0.0011613816022872925, -0.0010959804058074951, -0.0010305792093276978, -0.0009651780128479004, -0.000899776816368103, -0.0008343756198883057, -0.0007689744234085083, -0.0007035732269287109, -0.0006381720304489136, -0.0005727708339691162, -0.0005073696374893188, -0.0004419684410095215, -0.0003765672445297241, -0.00031116604804992676, -0.0002457648515701294, -0.00018036365509033203, -0.00011496245861053467, -4.9561262130737305e-05, 1.583993434906006e-05, 8.124113082885742e-05, 0.00014664232730865479, 0.00021204352378845215, 0.0002774447202682495, 0.0003428459167480469, 0.00040824711322784424, 0.0004736483097076416, 0.000539049506187439, 0.0006044507026672363, 0.0006698518991470337, 0.0007352530956268311, 0.0008006542921066284, 0.0008660554885864258, 0.0009314566850662231, 0.0009968578815460205, 0.0010622590780258179, 0.0011276602745056152, 0.0011930614709854126, 0.00125846266746521, 0.0013238638639450073, 0.0013892650604248047, 0.001454666256904602, 0.0015200674533843994, 0.0015854686498641968, 0.0016508698463439941, 0.0017162710428237915, 0.0017816722393035889, 0.0018470734357833862, 0.0019124746322631836, 0.001977875828742981, 0.0020432770252227783, 0.0021086782217025757, 0.002174079418182373, 0.0022394806146621704, 0.0023048818111419678, 0.002370283007621765, 0.0024356842041015625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 10.0, 10.0, 18.0, 24.0, 29.0, 34.0, 70.0, 98.0, 133.0, 185.0, 254.0, 373.0, 455.0, 611.0, 812.0, 1126.0, 1478.0, 2105.0, 2941.0, 4433.0, 7131.0, 13559.0, 40005.0, 308253.0, 565738.0, 57371.0, 16714.0, 8087.0, 4873.0, 3168.0, 2291.0, 1639.0, 1209.0, 863.0, 654.0, 542.0, 319.0, 255.0, 196.0, 141.0, 107.0, 74.0, 56.0, 36.0, 24.0, 22.0, 13.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012347102165222168, -0.0011962652206420898, -0.0011578202247619629, -0.001119375228881836, -0.001080930233001709, -0.001042485237121582, -0.001004040241241455, -0.0009655952453613281, -0.0009271502494812012, -0.0008887052536010742, -0.0008502602577209473, -0.0008118152618408203, -0.0007733702659606934, -0.0007349252700805664, -0.0006964802742004395, -0.0006580352783203125, -0.0006195902824401855, -0.0005811452865600586, -0.0005427002906799316, -0.0005042552947998047, -0.00046581029891967773, -0.0004273653030395508, -0.00038892030715942383, -0.0003504753112792969, -0.0003120303153991699, -0.00027358531951904297, -0.00023514032363891602, -0.00019669532775878906, -0.0001582503318786621, -0.00011980533599853516, -8.13603401184082e-05, -4.291534423828125e-05, -4.470348358154297e-06, 3.3974647521972656e-05, 7.241964340209961e-05, 0.00011086463928222656, 0.00014930963516235352, 0.00018775463104248047, 0.00022619962692260742, 0.0002646446228027344, 0.00030308961868286133, 0.0003415346145629883, 0.00037997961044311523, 0.0004184246063232422, 0.00045686960220336914, 0.0004953145980834961, 0.000533759593963623, 0.00057220458984375, 0.000610649585723877, 0.0006490945816040039, 0.0006875395774841309, 0.0007259845733642578, 0.0007644295692443848, 0.0008028745651245117, 0.0008413195610046387, 0.0008797645568847656, 0.0009182095527648926, 0.0009566545486450195, 0.0009950995445251465, 0.0010335445404052734, 0.0010719895362854004, 0.0011104345321655273, 0.0011488795280456543, 0.0011873245239257812]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 6.0, 0.0, 8.0, 0.0, 24.0, 0.0, 37.0, 0.0, 60.0, 0.0, 74.0, 0.0, 108.0, 0.0, 136.0, 0.0, 136.0, 0.0, 101.0, 0.0, 0.0, 102.0, 0.0, 75.0, 0.0, 49.0, 0.0, 32.0, 0.0, 21.0, 0.0, 13.0, 0.0, 12.0, 0.0, 6.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.055940270423889e-07, -7.767230272293091e-07, -7.478520274162292e-07, -7.189810276031494e-07, -6.901100277900696e-07, -6.612390279769897e-07, -6.323680281639099e-07, -6.034970283508301e-07, -5.746260285377502e-07, -5.457550287246704e-07, -5.168840289115906e-07, -4.880130290985107e-07, -4.591420292854309e-07, -4.302710294723511e-07, -4.0140002965927124e-07, -3.725290298461914e-07, -3.4365803003311157e-07, -3.1478703022003174e-07, -2.859160304069519e-07, -2.5704503059387207e-07, -2.2817403078079224e-07, -1.993030309677124e-07, -1.7043203115463257e-07, -1.4156103134155273e-07, -1.126900315284729e-07, -8.381903171539307e-08, -5.494803190231323e-08, -2.60770320892334e-08, 2.7939677238464355e-09, 3.166496753692627e-08, 6.05359673500061e-08, 8.940696716308594e-08, 1.1827796697616577e-07, 1.471489667892456e-07, 1.7601996660232544e-07, 2.0489096641540527e-07, 2.337619662284851e-07, 2.6263296604156494e-07, 2.915039658546448e-07, 3.203749656677246e-07, 3.4924596548080444e-07, 3.781169652938843e-07, 4.069879651069641e-07, 4.3585896492004395e-07, 4.647299647331238e-07, 4.936009645462036e-07, 5.224719643592834e-07, 5.513429641723633e-07, 5.802139639854431e-07, 6.09084963798523e-07, 6.379559636116028e-07, 6.668269634246826e-07, 6.956979632377625e-07, 7.245689630508423e-07, 7.534399628639221e-07, 7.82310962677002e-07, 8.111819624900818e-07, 8.400529623031616e-07, 8.689239621162415e-07, 8.977949619293213e-07, 9.266659617424011e-07, 9.55536961555481e-07, 9.844079613685608e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 16.0, 31.0, 37.0, 26.0, 41.0, 73.0, 91.0, 109.0, 151.0, 172.0, 194.0, 311.0, 353.0, 497.0, 669.0, 891.0, 1231.0, 1686.0, 2447.0, 3624.0, 5980.0, 11909.0, 41921.0, 804767.0, 130792.0, 17820.0, 7856.0, 4510.0, 2887.0, 1956.0, 1394.0, 996.0, 769.0, 505.0, 418.0, 284.0, 242.0, 194.0, 151.0, 128.0, 99.0, 68.0, 66.0, 57.0, 31.0, 19.0, 10.0, 18.0, 12.0, 9.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0022525787353515625, -0.0021792352199554443, -0.002105891704559326, -0.002032548189163208, -0.00195920467376709, -0.0018858611583709717, -0.0018125176429748535, -0.0017391741275787354, -0.0016658306121826172, -0.001592487096786499, -0.0015191435813903809, -0.0014458000659942627, -0.0013724565505981445, -0.0012991130352020264, -0.0012257695198059082, -0.00115242600440979, -0.0010790824890136719, -0.0010057389736175537, -0.0009323954582214355, -0.0008590519428253174, -0.0007857084274291992, -0.0007123649120330811, -0.0006390213966369629, -0.0005656778812408447, -0.0004923343658447266, -0.0004189908504486084, -0.00034564733505249023, -0.00027230381965637207, -0.0001989603042602539, -0.00012561678886413574, -5.227327346801758e-05, 2.1070241928100586e-05, 9.441375732421875e-05, 0.00016775727272033691, 0.00024110078811645508, 0.00031444430351257324, 0.0003877878189086914, 0.00046113133430480957, 0.0005344748497009277, 0.0006078183650970459, 0.0006811618804931641, 0.0007545053958892822, 0.0008278489112854004, 0.0009011924266815186, 0.0009745359420776367, 0.0010478794574737549, 0.001121222972869873, 0.0011945664882659912, 0.0012679100036621094, 0.0013412535190582275, 0.0014145970344543457, 0.0014879405498504639, 0.001561284065246582, 0.0016346275806427002, 0.0017079710960388184, 0.0017813146114349365, 0.0018546581268310547, 0.0019280016422271729, 0.002001345157623291, 0.002074688673019409, 0.0021480321884155273, 0.0022213757038116455, 0.0022947192192077637, 0.002368062734603882, 0.00244140625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 5.0, 4.0, 13.0, 12.0, 22.0, 50.0, 174.0, 398.0, 175.0, 69.0, 13.0, 9.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007390975952148438, -0.0007182508707046509, -0.000697404146194458, -0.0006765574216842651, -0.0006557106971740723, -0.0006348639726638794, -0.0006140172481536865, -0.0005931705236434937, -0.0005723237991333008, -0.0005514770746231079, -0.000530630350112915, -0.0005097836256027222, -0.0004889369010925293, -0.0004680901765823364, -0.00044724345207214355, -0.0004263967275619507, -0.0004055500030517578, -0.00038470327854156494, -0.00036385655403137207, -0.0003430098295211792, -0.00032216310501098633, -0.00030131638050079346, -0.0002804696559906006, -0.0002596229314804077, -0.00023877620697021484, -0.00021792948246002197, -0.0001970827579498291, -0.00017623603343963623, -0.00015538930892944336, -0.0001345425844192505, -0.00011369585990905762, -9.284913539886475e-05, -7.200241088867188e-05, -5.1155686378479004e-05, -3.0308961868286133e-05, -9.462237358093262e-06, 1.138448715209961e-05, 3.223121166229248e-05, 5.307793617248535e-05, 7.392466068267822e-05, 9.47713851928711e-05, 0.00011561810970306396, 0.00013646483421325684, 0.0001573115587234497, 0.00017815828323364258, 0.00019900500774383545, 0.00021985173225402832, 0.0002406984567642212, 0.00026154518127441406, 0.00028239190578460693, 0.0003032386302947998, 0.0003240853548049927, 0.00034493207931518555, 0.0003657788038253784, 0.0003866255283355713, 0.00040747225284576416, 0.00042831897735595703, 0.0004491657018661499, 0.0004700124263763428, 0.0004908591508865356, 0.0005117058753967285, 0.0005325525999069214, 0.0005533993244171143, 0.0005742460489273071, 0.0005950927734375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 6.0, 1.0, 4.0, 5.0, 3.0, 11.0, 5.0, 8.0, 11.0, 16.0, 28.0, 28.0, 33.0, 62.0, 71.0, 80.0, 95.0, 112.0, 87.0, 63.0, 53.0, 40.0, 36.0, 33.0, 19.0, 26.0, 17.0, 6.0, 10.0, 5.0, 5.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036887770984321833, -0.003537248121574521, -0.003385719144716859, -0.0032341901678591967, -0.0030826611910015345, -0.0029311322141438723, -0.0027796030044555664, -0.002628074027597904, -0.002476545050740242, -0.00232501607388258, -0.0021734870970249176, -0.0020219581201672554, -0.0018704291433095932, -0.001718900166451931, -0.001567371073178947, -0.0014158420963212848, -0.0012643132358789444, -0.0011127842590212822, -0.00096125528216362, -0.0008097262470982969, -0.0006581972702406347, -0.0005066682933829725, -0.00035513925831764936, -0.00020361028145998716, -5.208130460232496e-05, 9.944768680725247e-05, 0.0002509766782168299, 0.00040250568417832255, 0.0005540346610359848, 0.000705563637893647, 0.0008570926729589701, 0.0010086216498166323, 0.0011601503938436508, 0.001311679370701313, 0.0014632083475589752, 0.0016147373244166374, 0.0017662663012742996, 0.0019177952781319618, 0.002069324254989624, 0.0022208532318472862, 0.0023723822087049484, 0.0025239111855626106, 0.002675440162420273, 0.002826969139277935, 0.0029784981161355972, 0.0031300270929932594, 0.0032815560698509216, 0.003433085046708584, 0.0035846142563968897, 0.003736143233254552, 0.003887672210112214, 0.00403920141980052, 0.004190730396658182, 0.004342259373515844, 0.0044937883503735065, 0.004645317327231169, 0.004796846304088831, 0.004948375280946493, 0.005099904257804155, 0.0052514332346618176, 0.00540296221151948, 0.005554491188377142, 0.005706020165234804, 0.005857549142092466, 0.0060090781189501286]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 14.0, 19.0, 16.0, 29.0, 32.0, 26.0, 37.0, 31.0, 39.0, 36.0, 34.0, 57.0, 46.0, 33.0, 46.0, 36.0, 39.0, 35.0, 27.0, 38.0, 28.0, 24.0, 22.0, 20.0, 29.0, 22.0, 13.0, 12.0, 9.0, 9.0, 12.0, 11.0, 6.0, 4.0, 8.0, 6.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002762011718004942, -0.0026647301856428385, -0.0025674488861113787, -0.002470167353749275, -0.0023728858213871717, -0.0022756042890250683, -0.0021783229894936085, -0.002081041457131505, -0.0019837599247694016, -0.00188647850882262, -0.0017891969764605165, -0.0016919155605137348, -0.0015946340281516314, -0.0014973526122048497, -0.001400071196258068, -0.0013027896638959646, -0.0012055083643645048, -0.0011082269484177232, -0.0010109454160556197, -0.0009136640001088381, -0.0008163825259543955, -0.000719101051799953, -0.0006218196358531713, -0.0005245381616987288, -0.00042725668754428625, -0.0003299752133898437, -0.0002326937683392316, -0.00013541232328861952, -3.813084913417697e-05, 5.915062502026558e-05, 0.00015643204096704721, 0.00025371351512148976, 0.00035099522210657597, 0.0004482766962610185, 0.0005455581704154611, 0.0006428395863622427, 0.0007401210605166852, 0.0008374025346711278, 0.0009346839506179094, 0.001031965482980013, 0.0011292468989267945, 0.0012265283148735762, 0.0013238098472356796, 0.0014210912631824613, 0.001518372679129243, 0.0016156542114913464, 0.001712935627438128, 0.0018102170433849096, 0.001907498575747013, 0.0020047801081091166, 0.0021020614076405764, 0.00219934294000268, 0.0022966244723647833, 0.0023939060047268867, 0.0024911873042583466, 0.00258846883662045, 0.0026857503689825535, 0.002783031901344657, 0.0028803132008761168, 0.00297759473323822, 0.0030748762656003237, 0.003172157797962427, 0.003269439097493887, 0.0033667206298559904, 0.0034640019293874502]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 7.0, 14.0, 22.0, 26.0, 54.0, 72.0, 107.0, 146.0, 266.0, 401.0, 586.0, 915.0, 1382.0, 2093.0, 3331.0, 5248.0, 8243.0, 13509.0, 23208.0, 41987.0, 86655.0, 219073.0, 805767.0, 1871148.0, 737537.0, 196787.0, 78059.0, 39327.0, 21981.0, 12967.0, 7875.0, 5086.0, 3358.0, 2161.0, 1430.0, 1031.0, 726.0, 479.0, 327.0, 249.0, 176.0, 118.0, 103.0, 67.0, 53.0, 36.0, 19.0, 22.0, 9.0, 17.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.005176544189453125, -0.00498807430267334, -0.004799604415893555, -0.0046111345291137695, -0.004422664642333984, -0.004234194755554199, -0.004045724868774414, -0.003857254981994629, -0.0036687850952148438, -0.0034803152084350586, -0.0032918453216552734, -0.0031033754348754883, -0.002914905548095703, -0.002726435661315918, -0.002537965774536133, -0.0023494958877563477, -0.0021610260009765625, -0.0019725561141967773, -0.0017840862274169922, -0.001595616340637207, -0.0014071464538574219, -0.0012186765670776367, -0.0010302066802978516, -0.0008417367935180664, -0.0006532669067382812, -0.0004647970199584961, -0.00027632713317871094, -8.785724639892578e-05, 0.00010061264038085938, 0.00028908252716064453, 0.0004775524139404297, 0.0006660223007202148, 0.0008544921875, 0.0010429620742797852, 0.0012314319610595703, 0.0014199018478393555, 0.0016083717346191406, 0.0017968416213989258, 0.001985311508178711, 0.002173781394958496, 0.0023622512817382812, 0.0025507211685180664, 0.0027391910552978516, 0.0029276609420776367, 0.003116130828857422, 0.003304600715637207, 0.003493070602416992, 0.0036815404891967773, 0.0038700103759765625, 0.004058480262756348, 0.004246950149536133, 0.004435420036315918, 0.004623889923095703, 0.004812359809875488, 0.0050008296966552734, 0.005189299583435059, 0.005377769470214844, 0.005566239356994629, 0.005754709243774414, 0.005943179130554199, 0.006131649017333984, 0.0063201189041137695, 0.006508588790893555, 0.00669705867767334, 0.006885528564453125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 4.0, 4.0, 13.0, 9.0, 11.0, 16.0, 18.0, 8.0, 21.0, 29.0, 22.0, 27.0, 29.0, 30.0, 45.0, 34.0, 46.0, 37.0, 59.0, 45.0, 40.0, 44.0, 51.0, 45.0, 38.0, 41.0, 26.0, 26.0, 26.0, 14.0, 27.0, 22.0, 16.0, 13.0, 6.0, 15.0, 10.0, 6.0, 7.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024242401123046875, -0.0023370087146759033, -0.002249777317047119, -0.002162545919418335, -0.0020753145217895508, -0.0019880831241607666, -0.0019008517265319824, -0.0018136203289031982, -0.001726388931274414, -0.0016391575336456299, -0.0015519261360168457, -0.0014646947383880615, -0.0013774633407592773, -0.0012902319431304932, -0.001203000545501709, -0.0011157691478729248, -0.0010285377502441406, -0.0009413063526153564, -0.0008540749549865723, -0.0007668435573577881, -0.0006796121597290039, -0.0005923807621002197, -0.0005051493644714355, -0.00041791796684265137, -0.0003306865692138672, -0.000243455171585083, -0.00015622377395629883, -6.899237632751465e-05, 1.823902130126953e-05, 0.00010547041893005371, 0.0001927018165588379, 0.00027993321418762207, 0.00036716461181640625, 0.00045439600944519043, 0.0005416274070739746, 0.0006288588047027588, 0.000716090202331543, 0.0008033215999603271, 0.0008905529975891113, 0.0009777843952178955, 0.0010650157928466797, 0.0011522471904754639, 0.001239478588104248, 0.0013267099857330322, 0.0014139413833618164, 0.0015011727809906006, 0.0015884041786193848, 0.001675635576248169, 0.0017628669738769531, 0.0018500983715057373, 0.0019373297691345215, 0.0020245611667633057, 0.00211179256439209, 0.002199023962020874, 0.002286255359649658, 0.0023734867572784424, 0.0024607181549072266, 0.0025479495525360107, 0.002635180950164795, 0.002722412347793579, 0.0028096437454223633, 0.0028968751430511475, 0.0029841065406799316, 0.003071337938308716, 0.0031585693359375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 4.0, 8.0, 14.0, 14.0, 18.0, 28.0, 68.0, 89.0, 107.0, 171.0, 242.0, 331.0, 491.0, 774.0, 1138.0, 1693.0, 2742.0, 4307.0, 6920.0, 11168.0, 19020.0, 33023.0, 60435.0, 117609.0, 252060.0, 653217.0, 1621303.0, 811980.0, 299426.0, 136183.0, 68324.0, 36971.0, 21087.0, 12466.0, 7512.0, 4667.0, 2887.0, 1997.0, 1289.0, 822.0, 548.0, 365.0, 254.0, 153.0, 119.0, 72.0, 56.0, 37.0, 22.0, 22.0, 12.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.00553131103515625, -0.005366683006286621, -0.005202054977416992, -0.005037426948547363, -0.004872798919677734, -0.0047081708908081055, -0.0045435428619384766, -0.004378914833068848, -0.004214286804199219, -0.00404965877532959, -0.003885030746459961, -0.003720402717590332, -0.003555774688720703, -0.0033911466598510742, -0.0032265186309814453, -0.0030618906021118164, -0.0028972625732421875, -0.0027326345443725586, -0.0025680065155029297, -0.0024033784866333008, -0.002238750457763672, -0.002074122428894043, -0.001909494400024414, -0.0017448663711547852, -0.0015802383422851562, -0.0014156103134155273, -0.0012509822845458984, -0.0010863542556762695, -0.0009217262268066406, -0.0007570981979370117, -0.0005924701690673828, -0.0004278421401977539, -0.000263214111328125, -9.85860824584961e-05, 6.604194641113281e-05, 0.00023066997528076172, 0.0003952980041503906, 0.0005599260330200195, 0.0007245540618896484, 0.0008891820907592773, 0.0010538101196289062, 0.0012184381484985352, 0.001383066177368164, 0.001547694206237793, 0.0017123222351074219, 0.0018769502639770508, 0.0020415782928466797, 0.0022062063217163086, 0.0023708343505859375, 0.0025354623794555664, 0.0027000904083251953, 0.0028647184371948242, 0.003029346466064453, 0.003193974494934082, 0.003358602523803711, 0.00352323055267334, 0.0036878585815429688, 0.0038524866104125977, 0.0040171146392822266, 0.0041817426681518555, 0.004346370697021484, 0.004510998725891113, 0.004675626754760742, 0.004840254783630371, 0.0050048828125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 20.0, 17.0, 28.0, 40.0, 37.0, 50.0, 73.0, 84.0, 128.0, 117.0, 168.0, 188.0, 230.0, 333.0, 403.0, 428.0, 356.0, 292.0, 226.0, 185.0, 112.0, 120.0, 84.0, 69.0, 64.0, 38.0, 40.0, 31.0, 19.0, 15.0, 12.0, 9.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017709732055664062, -0.00171583890914917, -0.0016607046127319336, -0.0016055703163146973, -0.001550436019897461, -0.0014953017234802246, -0.0014401674270629883, -0.001385033130645752, -0.0013298988342285156, -0.0012747645378112793, -0.001219630241394043, -0.0011644959449768066, -0.0011093616485595703, -0.001054227352142334, -0.0009990930557250977, -0.0009439587593078613, -0.000888824462890625, -0.0008336901664733887, -0.0007785558700561523, -0.000723421573638916, -0.0006682872772216797, -0.0006131529808044434, -0.000558018684387207, -0.0005028843879699707, -0.0004477500915527344, -0.00039261579513549805, -0.0003374814987182617, -0.0002823472023010254, -0.00022721290588378906, -0.00017207860946655273, -0.0001169443130493164, -6.181001663208008e-05, -6.67572021484375e-06, 4.845857620239258e-05, 0.0001035928726196289, 0.00015872716903686523, 0.00021386146545410156, 0.0002689957618713379, 0.0003241300582885742, 0.00037926435470581055, 0.0004343986511230469, 0.0004895329475402832, 0.0005446672439575195, 0.0005998015403747559, 0.0006549358367919922, 0.0007100701332092285, 0.0007652044296264648, 0.0008203387260437012, 0.0008754730224609375, 0.0009306073188781738, 0.0009857416152954102, 0.0010408759117126465, 0.0010960102081298828, 0.0011511445045471191, 0.0012062788009643555, 0.0012614130973815918, 0.0013165473937988281, 0.0013716816902160645, 0.0014268159866333008, 0.0014819502830505371, 0.0015370845794677734, 0.0015922188758850098, 0.001647353172302246, 0.0017024874687194824, 0.0017576217651367188]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 8.0, 6.0, 10.0, 14.0, 21.0, 40.0, 29.0, 43.0, 65.0, 82.0, 93.0, 123.0, 108.0, 101.0, 68.0, 45.0, 32.0, 31.0, 14.0, 17.0, 14.0, 13.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005335601046681404, -0.005135165993124247, -0.004934730473905802, -0.004734295420348644, -0.004533859901130199, -0.004333424847573042, -0.004132989794015884, -0.00393255427479744, -0.003732119221240282, -0.003531683934852481, -0.0033312486484646797, -0.003130813594907522, -0.002930378308519721, -0.00272994302213192, -0.0025295079685747623, -0.002329072682186961, -0.00212863739579916, -0.0019282021094113588, -0.0017277669394388795, -0.0015273317694664001, -0.001326896483078599, -0.0011264611966907978, -0.0009260260267183185, -0.0007255908567458391, -0.000525155570358038, -0.0003247203421778977, -0.00012428511399775743, 7.615011418238282e-05, 0.0002765853423625231, 0.00047702062875032425, 0.0006774557987228036, 0.0008778909686952829, 0.001078326255083084, 0.0012787615414708853, 0.0014791967114433646, 0.001679631881415844, 0.0018800671678036451, 0.0020805024541914463, 0.002280937507748604, 0.002481372794136405, 0.002681808080524206, 0.0028822433669120073, 0.0030826786532998085, 0.003283113706856966, 0.003483548993244767, 0.0036839842796325684, 0.003884419333189726, 0.004084854386746883, 0.004285289905965328, 0.004485724959522486, 0.0046861604787409306, 0.004886595532298088, 0.005087031051516533, 0.00528746610507369, 0.005487901158630848, 0.005688336677849293, 0.00588877173140645, 0.006089206784963608, 0.006289642304182053, 0.00649007735773921, 0.006690512411296368, 0.0068909479305148125, 0.00709138298407197, 0.0072918180376291275, 0.007492253556847572]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 13.0, 14.0, 14.0, 12.0, 7.0, 15.0, 24.0, 20.0, 16.0, 30.0, 27.0, 29.0, 41.0, 35.0, 42.0, 36.0, 41.0, 49.0, 48.0, 37.0, 47.0, 28.0, 38.0, 39.0, 27.0, 31.0, 30.0, 23.0, 22.0, 23.0, 14.0, 20.0, 16.0, 14.0, 10.0, 17.0, 13.0, 3.0, 7.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002904309192672372, -0.0028063601348549128, -0.0027084110770374537, -0.0026104620192199945, -0.0025125129614025354, -0.0024145639035850763, -0.0023166146129369736, -0.0022186655551195145, -0.0021207164973020554, -0.0020227674394845963, -0.0019248183816671371, -0.001826869323849678, -0.001728920266032219, -0.0016309712082147598, -0.001533022033981979, -0.0014350729761645198, -0.0013371240347623825, -0.0012391749769449234, -0.0011412259191274643, -0.0010432768613100052, -0.0009453277452848852, -0.0008473786874674261, -0.000749429571442306, -0.0006514805136248469, -0.0005535314558073878, -0.0004555823979899287, -0.00035763331106863916, -0.0002596842241473496, -0.0001617351663298905, -6.378610851243138e-05, 3.416300751268864e-05, 0.00013211206533014774, 0.0002300608903169632, 0.0003280099481344223, 0.00042595903505571187, 0.0005239081219770014, 0.0006218571797944605, 0.0007198062376119196, 0.0008177553536370397, 0.0009157044114544988, 0.0010136534692719579, 0.001111602527089417, 0.001209551584906876, 0.001307500759139657, 0.0014054498169571161, 0.0015033988747745752, 0.0016013479325920343, 0.0016992969904094934, 0.0017972460482269526, 0.0018951951060444117, 0.0019931441638618708, 0.00209109322167933, 0.002189042279496789, 0.002286991337314248, 0.002384940627962351, 0.00248288968577981, 0.002580838743597269, 0.002678787801414728, 0.0027767368592321873, 0.0028746859170496464, 0.0029726349748671055, 0.0030705840326845646, 0.0031685330905020237, 0.003266482148319483, 0.003364431206136942]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 11.0, 8.0, 3.0, 11.0, 8.0, 23.0, 30.0, 59.0, 67.0, 103.0, 137.0, 202.0, 262.0, 383.0, 590.0, 783.0, 1172.0, 1787.0, 2675.0, 4201.0, 6873.0, 11074.0, 19080.0, 33616.0, 64800.0, 143071.0, 350956.0, 214949.0, 87171.0, 43502.0, 23775.0, 13724.0, 8358.0, 5125.0, 3298.0, 2106.0, 1457.0, 981.0, 614.0, 452.0, 319.0, 223.0, 147.0, 110.0, 69.0, 64.0, 53.0, 26.0, 20.0, 9.0, 15.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0], "bins": [-0.0013484954833984375, -0.001307263970375061, -0.0012660324573516846, -0.001224800944328308, -0.0011835694313049316, -0.0011423379182815552, -0.0011011064052581787, -0.0010598748922348022, -0.0010186433792114258, -0.0009774118661880493, -0.0009361803531646729, -0.0008949488401412964, -0.0008537173271179199, -0.0008124858140945435, -0.000771254301071167, -0.0007300227880477905, -0.0006887912750244141, -0.0006475597620010376, -0.0006063282489776611, -0.0005650967359542847, -0.0005238652229309082, -0.00048263370990753174, -0.0004414021968841553, -0.0004001706838607788, -0.00035893917083740234, -0.0003177076578140259, -0.0002764761447906494, -0.00023524463176727295, -0.00019401311874389648, -0.00015278160572052002, -0.00011155009269714355, -7.031857967376709e-05, -2.9087066650390625e-05, 1.214444637298584e-05, 5.3375959396362305e-05, 9.460747241973877e-05, 0.00013583898544311523, 0.0001770704984664917, 0.00021830201148986816, 0.00025953352451324463, 0.0003007650375366211, 0.00034199655055999756, 0.000383228063583374, 0.0004244595766067505, 0.00046569108963012695, 0.0005069226026535034, 0.0005481541156768799, 0.0005893856287002563, 0.0006306171417236328, 0.0006718486547470093, 0.0007130801677703857, 0.0007543116807937622, 0.0007955431938171387, 0.0008367747068405151, 0.0008780062198638916, 0.0009192377328872681, 0.0009604692459106445, 0.001001700758934021, 0.0010429322719573975, 0.001084163784980774, 0.0011253952980041504, 0.0011666268110275269, 0.0012078583240509033, 0.0012490898370742798, 0.0012903213500976562]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 7.0, 13.0, 7.0, 11.0, 9.0, 15.0, 14.0, 12.0, 17.0, 25.0, 17.0, 25.0, 26.0, 35.0, 36.0, 34.0, 37.0, 46.0, 44.0, 52.0, 35.0, 38.0, 45.0, 37.0, 45.0, 39.0, 34.0, 32.0, 24.0, 24.0, 19.0, 13.0, 22.0, 21.0, 14.0, 15.0, 16.0, 13.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0031280517578125, -0.0030224621295928955, -0.002916872501373291, -0.0028112828731536865, -0.002705693244934082, -0.0026001036167144775, -0.002494513988494873, -0.0023889243602752686, -0.002283334732055664, -0.0021777451038360596, -0.002072155475616455, -0.0019665658473968506, -0.001860976219177246, -0.0017553865909576416, -0.0016497969627380371, -0.0015442073345184326, -0.0014386177062988281, -0.0013330280780792236, -0.0012274384498596191, -0.0011218488216400146, -0.0010162591934204102, -0.0009106695652008057, -0.0008050799369812012, -0.0006994903087615967, -0.0005939006805419922, -0.0004883110523223877, -0.0003827214241027832, -0.0002771317958831787, -0.00017154216766357422, -6.595253944396973e-05, 3.9637088775634766e-05, 0.00014522671699523926, 0.00025081634521484375, 0.00035640597343444824, 0.00046199560165405273, 0.0005675852298736572, 0.0006731748580932617, 0.0007787644863128662, 0.0008843541145324707, 0.0009899437427520752, 0.0010955333709716797, 0.0012011229991912842, 0.0013067126274108887, 0.0014123022556304932, 0.0015178918838500977, 0.0016234815120697021, 0.0017290711402893066, 0.0018346607685089111, 0.0019402503967285156, 0.00204584002494812, 0.0021514296531677246, 0.002257019281387329, 0.0023626089096069336, 0.002468198537826538, 0.0025737881660461426, 0.002679377794265747, 0.0027849674224853516, 0.002890557050704956, 0.0029961466789245605, 0.003101736307144165, 0.0032073259353637695, 0.003312915563583374, 0.0034185051918029785, 0.003524094820022583, 0.0036296844482421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 9.0, 7.0, 17.0, 20.0, 24.0, 32.0, 41.0, 70.0, 121.0, 192.0, 403.0, 699.0, 1299.0, 2629.0, 5613.0, 13341.0, 37474.0, 172457.0, 653951.0, 111446.0, 28523.0, 10810.0, 4666.0, 2187.0, 1108.0, 583.0, 326.0, 176.0, 103.0, 57.0, 38.0, 34.0, 24.0, 11.0, 9.0, 18.0, 6.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002597808837890625, -0.002512305974960327, -0.0024268031120300293, -0.0023413002490997314, -0.0022557973861694336, -0.0021702945232391357, -0.002084791660308838, -0.00199928879737854, -0.0019137859344482422, -0.0018282830715179443, -0.0017427802085876465, -0.0016572773456573486, -0.0015717744827270508, -0.001486271619796753, -0.001400768756866455, -0.0013152658939361572, -0.0012297630310058594, -0.0011442601680755615, -0.0010587573051452637, -0.0009732544422149658, -0.000887751579284668, -0.0008022487163543701, -0.0007167458534240723, -0.0006312429904937744, -0.0005457401275634766, -0.0004602372646331787, -0.00037473440170288086, -0.000289231538772583, -0.00020372867584228516, -0.0001182258129119873, -3.272294998168945e-05, 5.27799129486084e-05, 0.00013828277587890625, 0.0002237856388092041, 0.00030928850173950195, 0.0003947913646697998, 0.00048029422760009766, 0.0005657970905303955, 0.0006512999534606934, 0.0007368028163909912, 0.0008223056793212891, 0.0009078085422515869, 0.0009933114051818848, 0.0010788142681121826, 0.0011643171310424805, 0.0012498199939727783, 0.0013353228569030762, 0.001420825719833374, 0.0015063285827636719, 0.0015918314456939697, 0.0016773343086242676, 0.0017628371715545654, 0.0018483400344848633, 0.0019338428974151611, 0.002019345760345459, 0.002104848623275757, 0.0021903514862060547, 0.0022758543491363525, 0.0023613572120666504, 0.0024468600749969482, 0.002532362937927246, 0.002617865800857544, 0.002703368663787842, 0.0027888715267181396, 0.0028743743896484375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 11.0, 4.0, 10.0, 7.0, 18.0, 10.0, 20.0, 26.0, 24.0, 31.0, 41.0, 53.0, 23.0, 27.0, 45.0, 33.0, 34.0, 53.0, 44.0, 36.0, 36.0, 36.0, 34.0, 41.0, 44.0, 28.0, 42.0, 36.0, 27.0, 22.0, 15.0, 17.0, 9.0, 14.0, 11.0, 6.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021305084228515625, -0.002063244581222534, -0.001995980739593506, -0.0019287168979644775, -0.0018614530563354492, -0.001794189214706421, -0.0017269253730773926, -0.0016596615314483643, -0.001592397689819336, -0.0015251338481903076, -0.0014578700065612793, -0.001390606164932251, -0.0013233423233032227, -0.0012560784816741943, -0.001188814640045166, -0.0011215507984161377, -0.0010542869567871094, -0.000987023115158081, -0.0009197592735290527, -0.0008524954319000244, -0.0007852315902709961, -0.0007179677486419678, -0.0006507039070129395, -0.0005834400653839111, -0.0005161762237548828, -0.0004489123821258545, -0.00038164854049682617, -0.00031438469886779785, -0.00024712085723876953, -0.0001798570156097412, -0.00011259317398071289, -4.532933235168457e-05, 2.193450927734375e-05, 8.919835090637207e-05, 0.0001564621925354004, 0.0002237260341644287, 0.00029098987579345703, 0.00035825371742248535, 0.00042551755905151367, 0.000492781400680542, 0.0005600452423095703, 0.0006273090839385986, 0.000694572925567627, 0.0007618367671966553, 0.0008291006088256836, 0.0008963644504547119, 0.0009636282920837402, 0.0010308921337127686, 0.0010981559753417969, 0.0011654198169708252, 0.0012326836585998535, 0.0012999475002288818, 0.0013672113418579102, 0.0014344751834869385, 0.0015017390251159668, 0.0015690028667449951, 0.0016362667083740234, 0.0017035305500030518, 0.00177079439163208, 0.0018380582332611084, 0.0019053220748901367, 0.001972585916519165, 0.0020398497581481934, 0.0021071135997772217, 0.00217437744140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 3.0, 2.0, 9.0, 12.0, 23.0, 21.0, 31.0, 37.0, 31.0, 43.0, 78.0, 73.0, 107.0, 126.0, 181.0, 234.0, 361.0, 492.0, 703.0, 1400.0, 3883.0, 15905.0, 206034.0, 783348.0, 25553.0, 5317.0, 1755.0, 811.0, 531.0, 371.0, 246.0, 174.0, 141.0, 115.0, 84.0, 64.0, 42.0, 37.0, 36.0, 24.0, 16.0, 16.0, 19.0, 18.0, 11.0, 5.0, 6.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-0.0007410049438476562, -0.0007186383008956909, -0.0006962716579437256, -0.0006739050149917603, -0.0006515383720397949, -0.0006291717290878296, -0.0006068050861358643, -0.0005844384431838989, -0.0005620718002319336, -0.0005397051572799683, -0.0005173385143280029, -0.0004949718713760376, -0.00047260522842407227, -0.00045023858547210693, -0.0004278719425201416, -0.00040550529956817627, -0.00038313865661621094, -0.0003607720136642456, -0.0003384053707122803, -0.00031603872776031494, -0.0002936720848083496, -0.0002713054418563843, -0.00024893879890441895, -0.0002265721559524536, -0.00020420551300048828, -0.00018183887004852295, -0.00015947222709655762, -0.00013710558414459229, -0.00011473894119262695, -9.237229824066162e-05, -7.000565528869629e-05, -4.763901233673096e-05, -2.5272369384765625e-05, -2.905726432800293e-06, 1.946091651916504e-05, 4.182755947113037e-05, 6.41942024230957e-05, 8.656084537506104e-05, 0.00010892748832702637, 0.0001312941312789917, 0.00015366077423095703, 0.00017602741718292236, 0.0001983940601348877, 0.00022076070308685303, 0.00024312734603881836, 0.0002654939889907837, 0.000287860631942749, 0.00031022727489471436, 0.0003325939178466797, 0.000354960560798645, 0.00037732720375061035, 0.0003996938467025757, 0.000422060489654541, 0.00044442713260650635, 0.0004667937755584717, 0.000489160418510437, 0.0005115270614624023, 0.0005338937044143677, 0.000556260347366333, 0.0005786269903182983, 0.0006009936332702637, 0.000623360276222229, 0.0006457269191741943, 0.0006680935621261597, 0.000690460205078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 9.0, 3.0, 2.0, 5.0, 8.0, 4.0, 11.0, 15.0, 12.0, 39.0, 44.0, 23.0, 73.0, 34.0, 79.0, 82.0, 39.0, 82.0, 68.0, 45.0, 82.0, 58.0, 16.0, 43.0, 17.0, 23.0, 20.0, 12.0, 24.0, 12.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.9420480132102966e-06, -2.8442591428756714e-06, -2.746470272541046e-06, -2.648681402206421e-06, -2.5508925318717957e-06, -2.4531036615371704e-06, -2.355314791202545e-06, -2.25752592086792e-06, -2.1597370505332947e-06, -2.0619481801986694e-06, -1.964159309864044e-06, -1.866370439529419e-06, -1.7685815691947937e-06, -1.6707926988601685e-06, -1.5730038285255432e-06, -1.475214958190918e-06, -1.3774260878562927e-06, -1.2796372175216675e-06, -1.1818483471870422e-06, -1.084059476852417e-06, -9.862706065177917e-07, -8.884817361831665e-07, -7.906928658485413e-07, -6.92903995513916e-07, -5.951151251792908e-07, -4.973262548446655e-07, -3.995373845100403e-07, -3.0174851417541504e-07, -2.039596438407898e-07, -1.0617077350616455e-07, -8.381903171539307e-09, 8.940696716308594e-08, 1.8719583749771118e-07, 2.849847078323364e-07, 3.8277357816696167e-07, 4.805624485015869e-07, 5.783513188362122e-07, 6.761401891708374e-07, 7.739290595054626e-07, 8.717179298400879e-07, 9.695068001747131e-07, 1.0672956705093384e-06, 1.1650845408439636e-06, 1.2628734111785889e-06, 1.3606622815132141e-06, 1.4584511518478394e-06, 1.5562400221824646e-06, 1.6540288925170898e-06, 1.751817762851715e-06, 1.8496066331863403e-06, 1.9473955035209656e-06, 2.045184373855591e-06, 2.142973244190216e-06, 2.2407621145248413e-06, 2.3385509848594666e-06, 2.436339855194092e-06, 2.534128725528717e-06, 2.6319175958633423e-06, 2.7297064661979675e-06, 2.8274953365325928e-06, 2.925284206867218e-06, 3.0230730772018433e-06, 3.1208619475364685e-06, 3.2186508178710938e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 4.0, 11.0, 6.0, 14.0, 30.0, 37.0, 48.0, 54.0, 90.0, 113.0, 178.0, 238.0, 326.0, 496.0, 815.0, 1377.0, 2928.0, 8026.0, 25410.0, 100287.0, 645088.0, 200403.0, 41512.0, 12092.0, 4251.0, 1786.0, 969.0, 614.0, 371.0, 288.0, 202.0, 147.0, 83.0, 73.0, 58.0, 37.0, 22.0, 14.0, 13.0, 11.0, 11.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006785392761230469, -0.0006584003567695618, -0.0006382614374160767, -0.0006181225180625916, -0.0005979835987091064, -0.0005778446793556213, -0.0005577057600021362, -0.0005375668406486511, -0.000517427921295166, -0.0004972890019416809, -0.0004771500825881958, -0.0004570111632347107, -0.0004368722438812256, -0.0004167333245277405, -0.00039659440517425537, -0.00037645548582077026, -0.00035631656646728516, -0.00033617764711380005, -0.00031603872776031494, -0.00029589980840682983, -0.0002757608890533447, -0.0002556219696998596, -0.0002354830503463745, -0.0002153441309928894, -0.0001952052116394043, -0.0001750662922859192, -0.00015492737293243408, -0.00013478845357894897, -0.00011464953422546387, -9.451061487197876e-05, -7.437169551849365e-05, -5.4232776165008545e-05, -3.409385681152344e-05, -1.395493745803833e-05, 6.183981895446777e-06, 2.6322901248931885e-05, 4.646182060241699e-05, 6.66007399559021e-05, 8.673965930938721e-05, 0.00010687857866287231, 0.00012701749801635742, 0.00014715641736984253, 0.00016729533672332764, 0.00018743425607681274, 0.00020757317543029785, 0.00022771209478378296, 0.00024785101413726807, 0.0002679899334907532, 0.0002881288528442383, 0.0003082677721977234, 0.0003284066915512085, 0.0003485456109046936, 0.0003686845302581787, 0.0003888234496116638, 0.0004089623689651489, 0.00042910128831863403, 0.00044924020767211914, 0.00046937912702560425, 0.0004895180463790894, 0.0005096569657325745, 0.0005297958850860596, 0.0005499348044395447, 0.0005700737237930298, 0.0005902126431465149, 0.0006103515625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 23.0, 67.0, 101.0, 205.0, 290.0, 133.0, 76.0, 49.0, 17.0, 5.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017535686492919922, -0.00016957707703113556, -0.0001637972891330719, -0.00015801750123500824, -0.00015223771333694458, -0.00014645792543888092, -0.00014067813754081726, -0.0001348983496427536, -0.00012911856174468994, -0.00012333877384662628, -0.00011755898594856262, -0.00011177919805049896, -0.0001059994101524353, -0.00010021962225437164, -9.443983435630798e-05, -8.866004645824432e-05, -8.288025856018066e-05, -7.7100470662117e-05, -7.132068276405334e-05, -6.554089486598969e-05, -5.9761106967926025e-05, -5.3981319069862366e-05, -4.8201531171798706e-05, -4.2421743273735046e-05, -3.664195537567139e-05, -3.086216747760773e-05, -2.5082379579544067e-05, -1.9302591681480408e-05, -1.3522803783416748e-05, -7.743015885353088e-06, -1.9632279872894287e-06, 3.816559910774231e-06, 9.59634780883789e-06, 1.537613570690155e-05, 2.115592360496521e-05, 2.693571150302887e-05, 3.271549940109253e-05, 3.849528729915619e-05, 4.427507519721985e-05, 5.005486309528351e-05, 5.583465099334717e-05, 6.161443889141083e-05, 6.739422678947449e-05, 7.317401468753815e-05, 7.89538025856018e-05, 8.473359048366547e-05, 9.051337838172913e-05, 9.629316627979279e-05, 0.00010207295417785645, 0.0001078527420759201, 0.00011363252997398376, 0.00011941231787204742, 0.00012519210577011108, 0.00013097189366817474, 0.0001367516815662384, 0.00014253146946430206, 0.00014831125736236572, 0.00015409104526042938, 0.00015987083315849304, 0.0001656506210565567, 0.00017143040895462036, 0.00017721019685268402, 0.00018298998475074768, 0.00018876977264881134, 0.000194549560546875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 8.0, 14.0, 35.0, 25.0, 29.0, 50.0, 63.0, 83.0, 95.0, 120.0, 105.0, 98.0, 70.0, 43.0, 31.0, 33.0, 15.0, 17.0, 12.0, 11.0, 12.0, 3.0, 1.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005497945472598076, -0.005298672243952751, -0.005099398549646139, -0.0049001253210008144, -0.004700851626694202, -0.004501578398048878, -0.004302304703742266, -0.004103031475096941, -0.003903757780790329, -0.0037044843193143606, -0.0035052108578383923, -0.003305937396362424, -0.0031066639348864555, -0.002907390706241131, -0.002708117011934519, -0.002508843783289194, -0.0023095703218132257, -0.0021102968603372574, -0.001911023398861289, -0.0017117499373853207, -0.0015124764759093523, -0.0013132031308487058, -0.0011139296693727374, -0.000914656207896769, -0.0007153827464208007, -0.0005161092849448323, -0.0003168358525726944, -0.00011756242020055652, 8.171104127541184e-05, 0.0002809844445437193, 0.00048025790601968765, 0.000679531367495656, 0.0008788048289716244, 0.0010780782904475927, 0.001277351751923561, 0.0014766252133995295, 0.0016758986748754978, 0.0018751720199361444, 0.0020744455978274345, 0.0022737188264727592, 0.0024729925207793713, 0.0026722659822553396, 0.002871539443731308, 0.0030708129052072763, 0.0032700863666832447, 0.0034693595953285694, 0.0036686332896351814, 0.003867906518280506, 0.004067179746925831, 0.0042664529755711555, 0.0044657266698777676, 0.004664999898523092, 0.004864273592829704, 0.005063546821475029, 0.005262820515781641, 0.005462093744426966, 0.005661367438733578, 0.0058606406673789024, 0.0060599143616855145, 0.006259187590330839, 0.006458461284637451, 0.006657734513282776, 0.006857008207589388, 0.007056281436234713, 0.007255555130541325]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 11.0, 10.0, 14.0, 11.0, 14.0, 8.0, 18.0, 22.0, 19.0, 16.0, 36.0, 21.0, 33.0, 37.0, 33.0, 42.0, 41.0, 46.0, 45.0, 47.0, 37.0, 48.0, 25.0, 46.0, 31.0, 26.0, 33.0, 32.0, 24.0, 22.0, 22.0, 13.0, 16.0, 18.0, 14.0, 12.0, 17.0, 10.0, 4.0, 7.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029267724603414536, -0.0028281693812459707, -0.002729566302150488, -0.002630963223055005, -0.0025323601439595222, -0.0024337570648640394, -0.0023351539857685566, -0.00223655067384243, -0.002137947827577591, -0.002039344748482108, -0.0019407416693866253, -0.0018421385902911425, -0.0017435355111956596, -0.0016449324321001768, -0.0015463292365893722, -0.0014477261574938893, -0.0013491229619830847, -0.0012505198828876019, -0.001151916803792119, -0.0010533137246966362, -0.0009547105873934925, -0.0008561075082980096, -0.0007575043709948659, -0.0006589012918993831, -0.0005602982128039002, -0.0004616951337084174, -0.00036309202550910413, -0.00026448891730979085, -0.00016588583821430802, -6.72827591188252e-05, 3.132037818431854e-05, 0.00012992345727980137, 0.0002285265363752842, 0.000327129615470767, 0.0004257327236700803, 0.0005243358318693936, 0.0006229389109648764, 0.0007215419900603592, 0.000820145127363503, 0.0009187482064589858, 0.0010173512855544686, 0.0011159543646499515, 0.0012145574437454343, 0.001313160639256239, 0.0014117637183517218, 0.0015103667974472046, 0.0016089698765426874, 0.0017075729556381702, 0.001806176034733653, 0.001904779113829136, 0.0020033821929246187, 0.0021019852720201015, 0.0022005883511155844, 0.002299191430211067, 0.0023977947421371937, 0.002496397588402033, 0.0025950009003281593, 0.002693603979423642, 0.002792207058519125, 0.002890810137614608, 0.0029894132167100906, 0.0030880162958055735, 0.0031866193749010563, 0.0032852226868271828, 0.003383825533092022]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 16.0, 20.0, 28.0, 39.0, 56.0, 77.0, 111.0, 151.0, 250.0, 329.0, 504.0, 655.0, 925.0, 1348.0, 1904.0, 2728.0, 3997.0, 6026.0, 9154.0, 13876.0, 21755.0, 35040.0, 58570.0, 99503.0, 164752.0, 214287.0, 160906.0, 97058.0, 57419.0, 34381.0, 21328.0, 13790.0, 8721.0, 5893.0, 3985.0, 2682.0, 1942.0, 1284.0, 918.0, 660.0, 416.0, 314.0, 237.0, 182.0, 116.0, 71.0, 53.0, 26.0, 24.0, 14.0, 10.0, 11.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.005603790283203125, -0.005425751209259033, -0.005247712135314941, -0.00506967306137085, -0.004891633987426758, -0.004713594913482666, -0.004535555839538574, -0.004357516765594482, -0.004179477691650391, -0.004001438617706299, -0.003823399543762207, -0.0036453604698181152, -0.0034673213958740234, -0.0032892823219299316, -0.00311124324798584, -0.002933204174041748, -0.0027551651000976562, -0.0025771260261535645, -0.0023990869522094727, -0.002221047878265381, -0.002043008804321289, -0.0018649697303771973, -0.0016869306564331055, -0.0015088915824890137, -0.0013308525085449219, -0.00115281343460083, -0.0009747743606567383, -0.0007967352867126465, -0.0006186962127685547, -0.0004406571388244629, -0.0002626180648803711, -8.45789909362793e-05, 9.34600830078125e-05, 0.0002714991569519043, 0.0004495382308959961, 0.0006275773048400879, 0.0008056163787841797, 0.0009836554527282715, 0.0011616945266723633, 0.001339733600616455, 0.0015177726745605469, 0.0016958117485046387, 0.0018738508224487305, 0.0020518898963928223, 0.002229928970336914, 0.002407968044281006, 0.0025860071182250977, 0.0027640461921691895, 0.0029420852661132812, 0.003120124340057373, 0.003298163414001465, 0.0034762024879455566, 0.0036542415618896484, 0.0038322806358337402, 0.004010319709777832, 0.004188358783721924, 0.004366397857666016, 0.004544436931610107, 0.004722476005554199, 0.004900515079498291, 0.005078554153442383, 0.005256593227386475, 0.005434632301330566, 0.005612671375274658, 0.00579071044921875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 6.0, 5.0, 9.0, 7.0, 8.0, 14.0, 12.0, 14.0, 20.0, 23.0, 18.0, 24.0, 34.0, 24.0, 37.0, 33.0, 42.0, 38.0, 43.0, 48.0, 41.0, 53.0, 42.0, 36.0, 42.0, 33.0, 26.0, 36.0, 24.0, 33.0, 20.0, 17.0, 17.0, 18.0, 15.0, 15.0, 12.0, 10.0, 14.0, 10.0, 10.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0029773712158203125, -0.0028819739818573, -0.002786576747894287, -0.0026911795139312744, -0.0025957822799682617, -0.002500385046005249, -0.0024049878120422363, -0.0023095905780792236, -0.002214193344116211, -0.0021187961101531982, -0.0020233988761901855, -0.0019280016422271729, -0.0018326044082641602, -0.0017372071743011475, -0.0016418099403381348, -0.001546412706375122, -0.0014510154724121094, -0.0013556182384490967, -0.001260221004486084, -0.0011648237705230713, -0.0010694265365600586, -0.0009740293025970459, -0.0008786320686340332, -0.0007832348346710205, -0.0006878376007080078, -0.0005924403667449951, -0.0004970431327819824, -0.0004016458988189697, -0.00030624866485595703, -0.00021085143089294434, -0.00011545419692993164, -2.0056962966918945e-05, 7.534027099609375e-05, 0.00017073750495910645, 0.00026613473892211914, 0.00036153197288513184, 0.00045692920684814453, 0.0005523264408111572, 0.0006477236747741699, 0.0007431209087371826, 0.0008385181427001953, 0.000933915376663208, 0.0010293126106262207, 0.0011247098445892334, 0.001220107078552246, 0.0013155043125152588, 0.0014109015464782715, 0.0015062987804412842, 0.0016016960144042969, 0.0016970932483673096, 0.0017924904823303223, 0.001887887716293335, 0.0019832849502563477, 0.0020786821842193604, 0.002174079418182373, 0.0022694766521453857, 0.0023648738861083984, 0.002460271120071411, 0.002555668354034424, 0.0026510655879974365, 0.0027464628219604492, 0.002841860055923462, 0.0029372572898864746, 0.0030326545238494873, 0.0031280517578125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 14.0, 19.0, 35.0, 54.0, 81.0, 96.0, 163.0, 228.0, 298.0, 486.0, 701.0, 981.0, 1485.0, 2117.0, 3000.0, 4390.0, 6456.0, 9569.0, 14590.0, 21876.0, 34407.0, 54877.0, 89237.0, 146910.0, 215329.0, 166051.0, 101173.0, 61762.0, 38495.0, 24360.0, 16054.0, 10571.0, 7107.0, 4804.0, 3312.0, 2323.0, 1611.0, 1117.0, 768.0, 515.0, 358.0, 244.0, 177.0, 117.0, 79.0, 51.0, 36.0, 33.0, 14.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0057830810546875, -0.0056002140045166016, -0.005417346954345703, -0.005234479904174805, -0.005051612854003906, -0.004868745803833008, -0.004685878753662109, -0.004503011703491211, -0.0043201446533203125, -0.004137277603149414, -0.003954410552978516, -0.003771543502807617, -0.0035886764526367188, -0.0034058094024658203, -0.003222942352294922, -0.0030400753021240234, -0.002857208251953125, -0.0026743412017822266, -0.002491474151611328, -0.0023086071014404297, -0.0021257400512695312, -0.0019428730010986328, -0.0017600059509277344, -0.001577138900756836, -0.0013942718505859375, -0.001211404800415039, -0.0010285377502441406, -0.0008456707000732422, -0.0006628036499023438, -0.0004799365997314453, -0.0002970695495605469, -0.00011420249938964844, 6.866455078125e-05, 0.00025153160095214844, 0.0004343986511230469, 0.0006172657012939453, 0.0008001327514648438, 0.0009829998016357422, 0.0011658668518066406, 0.001348733901977539, 0.0015316009521484375, 0.001714468002319336, 0.0018973350524902344, 0.002080202102661133, 0.0022630691528320312, 0.0024459362030029297, 0.002628803253173828, 0.0028116703033447266, 0.002994537353515625, 0.0031774044036865234, 0.003360271453857422, 0.0035431385040283203, 0.0037260055541992188, 0.003908872604370117, 0.004091739654541016, 0.004274606704711914, 0.0044574737548828125, 0.004640340805053711, 0.004823207855224609, 0.005006074905395508, 0.005188941955566406, 0.005371809005737305, 0.005554676055908203, 0.0057375431060791016, 0.00592041015625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 3.0, 2.0, 17.0, 15.0, 14.0, 15.0, 17.0, 16.0, 20.0, 27.0, 28.0, 24.0, 34.0, 33.0, 30.0, 43.0, 38.0, 46.0, 37.0, 46.0, 40.0, 46.0, 43.0, 34.0, 35.0, 32.0, 38.0, 27.0, 27.0, 28.0, 19.0, 17.0, 16.0, 15.0, 14.0, 9.0, 15.0, 8.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0020847320556640625, -0.002018958330154419, -0.0019531846046447754, -0.0018874108791351318, -0.0018216371536254883, -0.0017558634281158447, -0.0016900897026062012, -0.0016243159770965576, -0.001558542251586914, -0.0014927685260772705, -0.001426994800567627, -0.0013612210750579834, -0.0012954473495483398, -0.0012296736240386963, -0.0011638998985290527, -0.0010981261730194092, -0.0010323524475097656, -0.0009665787220001221, -0.0009008049964904785, -0.000835031270980835, -0.0007692575454711914, -0.0007034838199615479, -0.0006377100944519043, -0.0005719363689422607, -0.0005061626434326172, -0.00044038891792297363, -0.0003746151924133301, -0.0003088414669036865, -0.00024306774139404297, -0.00017729401588439941, -0.00011152029037475586, -4.5746564865112305e-05, 2.002716064453125e-05, 8.58008861541748e-05, 0.00015157461166381836, 0.00021734833717346191, 0.00028312206268310547, 0.000348895788192749, 0.0004146695137023926, 0.00048044323921203613, 0.0005462169647216797, 0.0006119906902313232, 0.0006777644157409668, 0.0007435381412506104, 0.0008093118667602539, 0.0008750855922698975, 0.000940859317779541, 0.0010066330432891846, 0.0010724067687988281, 0.0011381804943084717, 0.0012039542198181152, 0.0012697279453277588, 0.0013355016708374023, 0.001401275396347046, 0.0014670491218566895, 0.001532822847366333, 0.0015985965728759766, 0.0016643702983856201, 0.0017301440238952637, 0.0017959177494049072, 0.0018616914749145508, 0.0019274652004241943, 0.001993238925933838, 0.0020590126514434814, 0.002124786376953125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 12.0, 8.0, 19.0, 26.0, 34.0, 47.0, 56.0, 62.0, 102.0, 127.0, 198.0, 275.0, 416.0, 531.0, 841.0, 1545.0, 3236.0, 8316.0, 26606.0, 111031.0, 653158.0, 183969.0, 37941.0, 10939.0, 4079.0, 1879.0, 934.0, 665.0, 427.0, 296.0, 217.0, 139.0, 95.0, 86.0, 54.0, 44.0, 40.0, 25.0, 17.0, 16.0, 9.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00431060791015625, -0.004174351692199707, -0.004038095474243164, -0.003901839256286621, -0.003765583038330078, -0.003629326820373535, -0.003493070602416992, -0.0033568143844604492, -0.0032205581665039062, -0.0030843019485473633, -0.0029480457305908203, -0.0028117895126342773, -0.0026755332946777344, -0.0025392770767211914, -0.0024030208587646484, -0.0022667646408081055, -0.0021305084228515625, -0.0019942522048950195, -0.0018579959869384766, -0.0017217397689819336, -0.0015854835510253906, -0.0014492273330688477, -0.0013129711151123047, -0.0011767148971557617, -0.0010404586791992188, -0.0009042024612426758, -0.0007679462432861328, -0.0006316900253295898, -0.0004954338073730469, -0.0003591775894165039, -0.00022292137145996094, -8.666515350341797e-05, 4.9591064453125e-05, 0.00018584728240966797, 0.00032210350036621094, 0.0004583597183227539, 0.0005946159362792969, 0.0007308721542358398, 0.0008671283721923828, 0.0010033845901489258, 0.0011396408081054688, 0.0012758970260620117, 0.0014121532440185547, 0.0015484094619750977, 0.0016846656799316406, 0.0018209218978881836, 0.0019571781158447266, 0.0020934343338012695, 0.0022296905517578125, 0.0023659467697143555, 0.0025022029876708984, 0.0026384592056274414, 0.0027747154235839844, 0.0029109716415405273, 0.0030472278594970703, 0.0031834840774536133, 0.0033197402954101562, 0.0034559965133666992, 0.003592252731323242, 0.003728508949279785, 0.003864765167236328, 0.004001021385192871, 0.004137277603149414, 0.004273533821105957, 0.0044097900390625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 0.0, 8.0, 0.0, 14.0, 0.0, 14.0, 0.0, 36.0, 0.0, 31.0, 0.0, 37.0, 0.0, 64.0, 0.0, 74.0, 0.0, 102.0, 0.0, 98.0, 0.0, 109.0, 0.0, 93.0, 0.0, 79.0, 0.0, 68.0, 0.0, 54.0, 0.0, 32.0, 0.0, 34.0, 0.0, 19.0, 0.0, 15.0, 0.0, 15.0, 0.0, 7.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.834766387939453e-07, -9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 12.0, 9.0, 14.0, 24.0, 21.0, 32.0, 31.0, 50.0, 68.0, 87.0, 110.0, 146.0, 226.0, 270.0, 400.0, 533.0, 739.0, 1172.0, 1840.0, 2776.0, 4432.0, 7355.0, 12713.0, 24260.0, 51683.0, 146124.0, 502333.0, 172220.0, 57530.0, 26115.0, 13811.0, 7878.0, 4591.0, 2876.0, 1919.0, 1265.0, 813.0, 569.0, 397.0, 278.0, 190.0, 149.0, 120.0, 96.0, 83.0, 40.0, 45.0, 37.0, 24.0, 13.0, 15.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.002529144287109375, -0.002446383237838745, -0.0023636221885681152, -0.0022808611392974854, -0.0021981000900268555, -0.0021153390407562256, -0.0020325779914855957, -0.0019498169422149658, -0.001867055892944336, -0.001784294843673706, -0.0017015337944030762, -0.0016187727451324463, -0.0015360116958618164, -0.0014532506465911865, -0.0013704895973205566, -0.0012877285480499268, -0.0012049674987792969, -0.001122206449508667, -0.0010394454002380371, -0.0009566843509674072, -0.0008739233016967773, -0.0007911622524261475, -0.0007084012031555176, -0.0006256401538848877, -0.0005428791046142578, -0.00046011805534362793, -0.00037735700607299805, -0.00029459595680236816, -0.00021183490753173828, -0.0001290738582611084, -4.6312808990478516e-05, 3.644824028015137e-05, 0.00011920928955078125, 0.00020197033882141113, 0.000284731388092041, 0.0003674924373626709, 0.0004502534866333008, 0.0005330145359039307, 0.0006157755851745605, 0.0006985366344451904, 0.0007812976837158203, 0.0008640587329864502, 0.0009468197822570801, 0.00102958083152771, 0.0011123418807983398, 0.0011951029300689697, 0.0012778639793395996, 0.0013606250286102295, 0.0014433860778808594, 0.0015261471271514893, 0.0016089081764221191, 0.001691669225692749, 0.001774430274963379, 0.0018571913242340088, 0.0019399523735046387, 0.0020227134227752686, 0.0021054744720458984, 0.0021882355213165283, 0.002270996570587158, 0.002353757619857788, 0.002436518669128418, 0.002519279718399048, 0.0026020407676696777, 0.0026848018169403076, 0.0027675628662109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 12.0, 9.0, 15.0, 24.0, 30.0, 31.0, 39.0, 83.0, 93.0, 93.0, 102.0, 108.0, 83.0, 72.0, 54.0, 28.0, 30.0, 18.0, 12.0, 16.0, 12.0, 3.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005865097045898438, -0.0005658045411109924, -0.0005450993776321411, -0.0005243942141532898, -0.0005036890506744385, -0.00048298388719558716, -0.00046227872371673584, -0.0004415735602378845, -0.0004208683967590332, -0.0004001632332801819, -0.00037945806980133057, -0.00035875290632247925, -0.00033804774284362793, -0.0003173425793647766, -0.0002966374158859253, -0.000275932252407074, -0.00025522708892822266, -0.00023452192544937134, -0.00021381676197052002, -0.0001931115984916687, -0.00017240643501281738, -0.00015170127153396606, -0.00013099610805511475, -0.00011029094457626343, -8.958578109741211e-05, -6.888061761856079e-05, -4.817545413970947e-05, -2.7470290660858154e-05, -6.765127182006836e-06, 1.3940036296844482e-05, 3.46451997756958e-05, 5.535036325454712e-05, 7.605552673339844e-05, 9.676069021224976e-05, 0.00011746585369110107, 0.0001381710171699524, 0.0001588761806488037, 0.00017958134412765503, 0.00020028650760650635, 0.00022099167108535767, 0.00024169683456420898, 0.0002624019980430603, 0.0002831071615219116, 0.00030381232500076294, 0.00032451748847961426, 0.0003452226519584656, 0.0003659278154373169, 0.0003866329789161682, 0.00040733814239501953, 0.00042804330587387085, 0.00044874846935272217, 0.0004694536328315735, 0.0004901587963104248, 0.0005108639597892761, 0.0005315691232681274, 0.0005522742867469788, 0.0005729794502258301, 0.0005936846137046814, 0.0006143897771835327, 0.000635094940662384, 0.0006558001041412354, 0.0006765052676200867, 0.000697210431098938, 0.0007179155945777893, 0.0007386207580566406]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 7.0, 17.0, 13.0, 13.0, 29.0, 35.0, 41.0, 65.0, 68.0, 96.0, 104.0, 105.0, 101.0, 59.0, 51.0, 49.0, 42.0, 28.0, 16.0, 13.0, 13.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0064142560586333275, -0.00620603421702981, -0.00599781284108758, -0.005789590999484062, -0.005581369623541832, -0.0053731477819383144, -0.005164925940334797, -0.004956704564392567, -0.004748482722789049, -0.004540260881185532, -0.004332039505243301, -0.004123817663639784, -0.003915595822036266, -0.003707374446094036, -0.0034991526044905186, -0.0032909309957176447, -0.003082709386944771, -0.002874487778171897, -0.002666266169399023, -0.0024580443277955055, -0.0022498227190226316, -0.0020416011102497578, -0.001833379385061562, -0.0016251576598733664, -0.0014169360511004925, -0.0012087144423276186, -0.001000492717139423, -0.0007922710501588881, -0.0005840493831783533, -0.00037582777440547943, -0.00016760604921728373, 4.061567597091198e-05, 0.00024883681908249855, 0.00045705848606303334, 0.0006652801530435681, 0.0008735018200241029, 0.0010817234870046377, 0.0012899450957775116, 0.0014981668209657073, 0.001706388546153903, 0.0019146101549267769, 0.0021228317636996508, 0.0023310533724725246, 0.002539275214076042, 0.002747496822848916, 0.00295571843162179, 0.0031639402732253075, 0.0033721618819981813, 0.0035803834907710552, 0.003788605099543929, 0.003996826708316803, 0.0042050485499203205, 0.004413270391523838, 0.004621491767466068, 0.004829713609069586, 0.005037935450673103, 0.0052461568266153336, 0.005454378668218851, 0.005662600044161081, 0.005870821885764599, 0.006079043261706829, 0.006287265103310347, 0.006495486944913864, 0.006703708320856094, 0.006911930162459612]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 6.0, 7.0, 12.0, 11.0, 11.0, 15.0, 21.0, 23.0, 26.0, 40.0, 32.0, 32.0, 31.0, 38.0, 32.0, 49.0, 47.0, 48.0, 52.0, 44.0, 48.0, 41.0, 37.0, 41.0, 30.0, 27.0, 24.0, 20.0, 18.0, 20.0, 22.0, 16.0, 12.0, 14.0, 6.0, 12.0, 9.0, 2.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003445139154791832, -0.0033185624051839113, -0.0031919858884066343, -0.0030654091387987137, -0.002938832389190793, -0.0028122556395828724, -0.0026856791228055954, -0.0025591023731976748, -0.002432525623589754, -0.0023059488739818335, -0.0021793723572045565, -0.002052795607596636, -0.0019262188579887152, -0.0017996422247961164, -0.0016730655916035175, -0.0015464888419955969, -0.00141991232521832, -0.001293335692025721, -0.0011667589424178004, -0.0010401823092252016, -0.0009136056178249419, -0.0007870289264246821, -0.0006604522932320833, -0.0005338756018318236, -0.00040729891043156385, -0.0002807222190313041, -0.00015414555673487484, -2.7568894438445568e-05, 9.900779696181417e-05, 0.0002255844883620739, 0.0003521611215546727, 0.00047873781295493245, 0.0006053145043551922, 0.0007318911957554519, 0.0008584678871557117, 0.0009850445203483105, 0.0011116212699562311, 0.00123819790314883, 0.0013647745363414288, 0.0014913512859493494, 0.0016179279191419482, 0.001744504552334547, 0.0018710813019424677, 0.0019976580515503883, 0.0021242345683276653, 0.002250811317935586, 0.0023773880675435066, 0.0025039645843207836, 0.0026305413339287043, 0.002757118083536625, 0.002883694600313902, 0.0030102713499218225, 0.003136848099529743, 0.00326342461630702, 0.003390001365914941, 0.0035165781155228615, 0.0036431546323001385, 0.003769731381908059, 0.003896307898685336, 0.004022884648293257, 0.004149461165070534, 0.004276038147509098, 0.004402614664286375, 0.004529191181063652, 0.004655768163502216]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 9.0, 14.0, 10.0, 16.0, 11.0, 25.0, 21.0, 23.0, 33.0, 27.0, 57.0, 55.0, 60.0, 70.0, 73.0, 113.0, 151.0, 348.0, 1140.0, 3803.0, 515640.0, 1322.0, 422.0, 177.0, 105.0, 74.0, 75.0, 61.0, 44.0, 48.0, 51.0, 37.0, 25.0, 22.0, 19.0, 16.0, 18.0, 11.0, 7.0, 8.0, 6.0, 8.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08651912957429886, -0.08382194489240646, -0.08112476021051407, -0.07842757552862167, -0.07573039084672928, -0.07303320616483688, -0.07033602893352509, -0.06763884425163269, -0.0649416595697403, -0.0622444748878479, -0.059547290205955505, -0.05685010552406311, -0.054152920842170715, -0.05145573616027832, -0.048758555203676224, -0.04606137052178383, -0.043364182114601135, -0.04066699743270874, -0.037969812750816345, -0.03527262806892395, -0.032575443387031555, -0.02987826056778431, -0.027181077748537064, -0.02448389306664467, -0.021786708384752274, -0.01908952370285988, -0.016392339020967484, -0.013695156201720238, -0.010997971519827843, -0.008300786837935448, -0.005603604018688202, -0.002906419336795807, -0.00020923465490341187, 0.002487949561327696, 0.0051851337775588036, 0.007882317528128624, 0.010579502210021019, 0.013276686891913414, 0.01597386971116066, 0.018671054393053055, 0.02136823907494545, 0.024065423756837845, 0.02676260843873024, 0.029459791257977486, 0.03215697407722473, 0.034854158759117126, 0.03755134344100952, 0.040248528122901917, 0.04294571280479431, 0.04564289748668671, 0.0483400821685791, 0.0510372668504715, 0.05373445153236389, 0.05643163621425629, 0.05912881717085838, 0.06182600185275078, 0.06452319025993347, 0.06722037494182587, 0.06991755962371826, 0.07261474430561066, 0.07531192898750305, 0.07800911366939545, 0.08070629835128784, 0.08340348303318024, 0.08610066026449203]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 8.0, 7.0, 15.0, 9.0, 18.0, 18.0, 23.0, 29.0, 29.0, 42.0, 34.0, 22.0, 39.0, 37.0, 47.0, 45.0, 42.0, 1073.0, 58.0, 44.0, 44.0, 37.0, 35.0, 33.0, 30.0, 31.0, 21.0, 17.0, 23.0, 14.0, 15.0, 15.0, 13.0, 10.0, 7.0, 9.0, 5.0, 1.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09995340555906296, -0.09629634022712708, -0.0926392674446106, -0.08898220211267471, -0.08532513678073883, -0.08166806399822235, -0.07801099866628647, -0.07435393333435059, -0.0706968605518341, -0.06703979521989822, -0.06338272243738174, -0.05972565710544586, -0.05606858804821968, -0.0524115189909935, -0.04875445365905762, -0.045097384601831436, -0.041440315544605255, -0.037783246487379074, -0.03412617743015289, -0.03046911209821701, -0.02681204304099083, -0.02315497398376465, -0.019497906789183617, -0.015840839594602585, -0.012183770537376404, -0.008526702411472797, -0.004869634285569191, -0.0012125661596655846, 0.002444501966238022, 0.006101571023464203, 0.009758638218045235, 0.013415705412626266, 0.017072781920433044, 0.020729850977659225, 0.024386918172240257, 0.02804398536682129, 0.03170105442404747, 0.03535812348127365, 0.039015188813209534, 0.042672257870435715, 0.046329326927661896, 0.04998639598488808, 0.05364346504211426, 0.05730053037405014, 0.06095759943127632, 0.0646146684885025, 0.06827173382043839, 0.07192879915237427, 0.07558587193489075, 0.07924293726682663, 0.08290001004934311, 0.08655707538127899, 0.09021414816379547, 0.09387121349573135, 0.09752827882766724, 0.10118535161018372, 0.1048424169421196, 0.10849948227405548, 0.11215655505657196, 0.11581362038850784, 0.11947068572044373, 0.1231277585029602, 0.12678483128547668, 0.13044188916683197, 0.13409896194934845]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 6.0, 8.0, 5.0, 12.0, 13.0, 11.0, 19.0, 35.0, 39.0, 51.0, 80.0, 126.0, 218.0, 341.0, 419.0, 565.0, 774.0, 911.0, 1082.0, 1441.0, 2445.0, 2573.0, 31199214.0, 19487.0, 21513.0, 1813.0, 255.0, 228.0, 546.0, 58.0, 46.0, 41.0, 34.0, 28.0, 15.0, 9.0, 5.0, 5.0, 3.0, 1.0], "bins": [-21232.0, -20778.1875, -20324.375, -19870.5625, -19416.75, -18962.9375, -18509.125, -18055.3125, -17601.5, -17147.6875, -16693.875, -16240.0625, -15786.25, -15332.4375, -14878.625, -14424.8125, -13971.0, -13517.1875, -13063.375, -12609.5625, -12155.75, -11701.9375, -11248.125, -10794.3125, -10340.5, -9886.6875, -9432.875, -8979.0625, -8525.25, -8071.4375, -7617.625, -7163.8125, -6710.0, -6256.1875, -5802.375, -5348.5625, -4894.75, -4440.9375, -3987.125, -3533.3125, -3079.5, -2625.6875, -2171.875, -1718.0625, -1264.25, -810.4375, -356.625, 97.1875, 551.0, 1004.8125, 1458.625, 1912.4375, 2366.25, 2820.0625, 3273.875, 3727.6875, 4181.5, 4635.3125, 5089.125, 5542.9375, 5996.75, 6450.5625, 6904.375, 7358.1875, 7812.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 11.0, 17.0, 38.0, 56.0, 73.0, 95.0, 141.0, 224.0, 359.0, 573.0, 902.0, 1405.0, 2250.0, 3410.0, 5437.0, 8812.0, 14278.0, 23575.0, 40810.0, 68910.0, 122204.0, 231381.0, 573084.0, 3884417.0, 729828.0, 259875.0, 133051.0, 75141.0, 43483.0, 25799.0, 16030.0, 9810.0, 5945.0, 3601.0, 2243.0, 1499.0, 945.0, 586.0, 379.0, 250.0, 167.0, 103.0, 69.0, 61.0, 40.0, 16.0, 13.0, 12.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-117.0625, -113.2333984375, -109.404296875, -105.5751953125, -101.74609375, -97.9169921875, -94.087890625, -90.2587890625, -86.4296875, -82.6005859375, -78.771484375, -74.9423828125, -71.11328125, -67.2841796875, -63.455078125, -59.6259765625, -55.796875, -51.9677734375, -48.138671875, -44.3095703125, -40.48046875, -36.6513671875, -32.822265625, -28.9931640625, -25.1640625, -21.3349609375, -17.505859375, -13.6767578125, -9.84765625, -6.0185546875, -2.189453125, 1.6396484375, 5.46875, 9.2978515625, 13.126953125, 16.9560546875, 20.78515625, 24.6142578125, 28.443359375, 32.2724609375, 36.1015625, 39.9306640625, 43.759765625, 47.5888671875, 51.41796875, 55.2470703125, 59.076171875, 62.9052734375, 66.734375, 70.5634765625, 74.392578125, 78.2216796875, 82.05078125, 85.8798828125, 89.708984375, 93.5380859375, 97.3671875, 101.1962890625, 105.025390625, 108.8544921875, 112.68359375, 116.5126953125, 120.341796875, 124.1708984375, 128.0]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 6.0, 8.0, 7.0, 7.0, 10.0, 12.0, 15.0, 13.0, 16.0, 24.0, 29.0, 38.0, 64.0, 76.0, 119.0, 192.0, 347.0, 556.0, 86.0, 63.0, 50.0, 40.0, 34.0, 27.0, 22.0, 22.0, 24.0, 18.0, 13.0, 13.0, 17.0, 10.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-235.375, -228.72265625, -222.0703125, -215.41796875, -208.765625, -202.11328125, -195.4609375, -188.80859375, -182.15625, -175.50390625, -168.8515625, -162.19921875, -155.546875, -148.89453125, -142.2421875, -135.58984375, -128.9375, -122.28515625, -115.6328125, -108.98046875, -102.328125, -95.67578125, -89.0234375, -82.37109375, -75.71875, -69.06640625, -62.4140625, -55.76171875, -49.109375, -42.45703125, -35.8046875, -29.15234375, -22.5, -15.84765625, -9.1953125, -2.54296875, 4.109375, 10.76171875, 17.4140625, 24.06640625, 30.71875, 37.37109375, 44.0234375, 50.67578125, 57.328125, 63.98046875, 70.6328125, 77.28515625, 83.9375, 90.58984375, 97.2421875, 103.89453125, 110.546875, 117.19921875, 123.8515625, 130.50390625, 137.15625, 143.80859375, 150.4609375, 157.11328125, 163.765625, 170.41796875, 177.0703125, 183.72265625, 190.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 0.0, 6.0, 4.0, 14.0, 9.0, 23.0, 34.0, 26.0, 45.0, 68.0, 82.0, 114.0, 210.0, 254.0, 313.0, 545.0, 781.0, 1195.0, 1771.0, 2653.0, 4667.0, 7440.0, 13170.0, 25264.0, 56603.0, 151797.0, 897629.0, 4732145.0, 243519.0, 77212.0, 33418.0, 16467.0, 9105.0, 5178.0, 3165.0, 2066.0, 1401.0, 899.0, 626.0, 449.0, 279.0, 220.0, 147.0, 132.0, 75.0, 57.0, 41.0, 39.0, 27.0, 21.0, 9.0, 9.0, 0.0, 6.0, 9.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-260.25, -251.90234375, -243.5546875, -235.20703125, -226.859375, -218.51171875, -210.1640625, -201.81640625, -193.46875, -185.12109375, -176.7734375, -168.42578125, -160.078125, -151.73046875, -143.3828125, -135.03515625, -126.6875, -118.33984375, -109.9921875, -101.64453125, -93.296875, -84.94921875, -76.6015625, -68.25390625, -59.90625, -51.55859375, -43.2109375, -34.86328125, -26.515625, -18.16796875, -9.8203125, -1.47265625, 6.875, 15.22265625, 23.5703125, 31.91796875, 40.265625, 48.61328125, 56.9609375, 65.30859375, 73.65625, 82.00390625, 90.3515625, 98.69921875, 107.046875, 115.39453125, 123.7421875, 132.08984375, 140.4375, 148.78515625, 157.1328125, 165.48046875, 173.828125, 182.17578125, 190.5234375, 198.87109375, 207.21875, 215.56640625, 223.9140625, 232.26171875, 240.609375, 248.95703125, 257.3046875, 265.65234375, 274.0]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 1.0, 5.0, 3.0, 5.0, 10.0, 9.0, 15.0, 21.0, 20.0, 26.0, 44.0, 69.0, 126.0, 184.0, 464.0, 577.0, 111.0, 57.0, 56.0, 42.0, 29.0, 21.0, 26.0, 16.0, 13.0, 9.0, 8.0, 6.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-369.25, -357.41015625, -345.5703125, -333.73046875, -321.890625, -310.05078125, -298.2109375, -286.37109375, -274.53125, -262.69140625, -250.8515625, -239.01171875, -227.171875, -215.33203125, -203.4921875, -191.65234375, -179.8125, -167.97265625, -156.1328125, -144.29296875, -132.453125, -120.61328125, -108.7734375, -96.93359375, -85.09375, -73.25390625, -61.4140625, -49.57421875, -37.734375, -25.89453125, -14.0546875, -2.21484375, 9.625, 21.46484375, 33.3046875, 45.14453125, 56.984375, 68.82421875, 80.6640625, 92.50390625, 104.34375, 116.18359375, 128.0234375, 139.86328125, 151.703125, 163.54296875, 175.3828125, 187.22265625, 199.0625, 210.90234375, 222.7421875, 234.58203125, 246.421875, 258.26171875, 270.1015625, 281.94140625, 293.78125, 305.62109375, 317.4609375, 329.30078125, 341.140625, 352.98046875, 364.8203125, 376.66015625, 388.5]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [9.0, 0.0, 2.0, 4.0, 12.0, 6.0, 0.0, 9.0, 5.0, 10.0, 8.0, 35.0, 38.0, 44.0, 25.0, 76.0, 52.0, 50.0, 104.0, 143.0, 161.0, 240.0, 372.0, 486.0, 758.0, 1135.0, 1954.0, 3409.0, 7142.0, 18364.0, 90722.0, 6096800.0, 43651.0, 12555.0, 5493.0, 2799.0, 1455.0, 1001.0, 582.0, 419.0, 321.0, 226.0, 188.0, 121.0, 96.0, 77.0, 70.0, 49.0, 49.0, 38.0, 10.0, 10.0, 11.0, 3.0, 17.0, 1.0, 6.0, 5.0, 19.0, 0.0, 0.0, 6.0, 0.0, 3.0], "bins": [-2332.0, -2257.5625, -2183.125, -2108.6875, -2034.25, -1959.8125, -1885.375, -1810.9375, -1736.5, -1662.0625, -1587.625, -1513.1875, -1438.75, -1364.3125, -1289.875, -1215.4375, -1141.0, -1066.5625, -992.125, -917.6875, -843.25, -768.8125, -694.375, -619.9375, -545.5, -471.0625, -396.625, -322.1875, -247.75, -173.3125, -98.875, -24.4375, 50.0, 124.4375, 198.875, 273.3125, 347.75, 422.1875, 496.625, 571.0625, 645.5, 719.9375, 794.375, 868.8125, 943.25, 1017.6875, 1092.125, 1166.5625, 1241.0, 1315.4375, 1389.875, 1464.3125, 1538.75, 1613.1875, 1687.625, 1762.0625, 1836.5, 1910.9375, 1985.375, 2059.8125, 2134.25, 2208.6875, 2283.125, 2357.5625, 2432.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 10.0, 15.0, 10.0, 13.0, 17.0, 19.0, 25.0, 32.0, 60.0, 125.0, 291.0, 943.0, 157.0, 72.0, 42.0, 32.0, 21.0, 14.0, 15.0, 17.0, 11.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-772.0, -747.5546875, -723.109375, -698.6640625, -674.21875, -649.7734375, -625.328125, -600.8828125, -576.4375, -551.9921875, -527.546875, -503.1015625, -478.65625, -454.2109375, -429.765625, -405.3203125, -380.875, -356.4296875, -331.984375, -307.5390625, -283.09375, -258.6484375, -234.203125, -209.7578125, -185.3125, -160.8671875, -136.421875, -111.9765625, -87.53125, -63.0859375, -38.640625, -14.1953125, 10.25, 34.6953125, 59.140625, 83.5859375, 108.03125, 132.4765625, 156.921875, 181.3671875, 205.8125, 230.2578125, 254.703125, 279.1484375, 303.59375, 328.0390625, 352.484375, 376.9296875, 401.375, 425.8203125, 450.265625, 474.7109375, 499.15625, 523.6015625, 548.046875, 572.4921875, 596.9375, 621.3828125, 645.828125, 670.2734375, 694.71875, 719.1640625, 743.609375, 768.0546875, 792.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 7.0, 14.0, 19.0, 35.0, 656.0, 240.0, 18.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-14771.30078125, -14502.5732421875, -14233.845703125, -13965.1181640625, -13696.390625, -13427.6630859375, -13158.935546875, -12890.20703125, -12621.48046875, -12352.7529296875, -12084.025390625, -11815.2978515625, -11546.5703125, -11277.8427734375, -11009.115234375, -10740.38671875, -10471.6591796875, -10202.931640625, -9934.2041015625, -9665.4765625, -9396.7490234375, -9128.021484375, -8859.2939453125, -8590.56640625, -8321.837890625, -8053.1103515625, -7784.3828125, -7515.6552734375, -7246.927734375, -6978.2001953125, -6709.47216796875, -6440.74462890625, -6172.017578125, -5903.2900390625, -5634.5625, -5365.8349609375, -5097.107421875, -4828.3798828125, -4559.65185546875, -4290.92431640625, -4022.197021484375, -3753.469482421875, -3484.74169921875, -3216.01416015625, -2947.28662109375, -2678.55908203125, -2409.83154296875, -2141.103759765625, -1872.376220703125, -1603.648681640625, -1334.9210205078125, -1066.193359375, -797.4658203125, -528.73828125, -260.0106201171875, 8.717041015625, 277.444580078125, 546.1721801757812, 814.8997802734375, 1083.62744140625, 1352.35498046875, 1621.08251953125, 1889.8101806640625, 2158.537841796875, 2427.265380859375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 9.0, 9.0, 13.0, 18.0, 23.0, 36.0, 759.0, 32.0, 18.0, 19.0, 13.0, 11.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5487.4111328125, -5358.158203125, -5228.9052734375, -5099.65234375, -4970.3994140625, -4841.146484375, -4711.8935546875, -4582.640625, -4453.3876953125, -4324.134765625, -4194.8818359375, -4065.62890625, -3936.3759765625, -3807.123046875, -3677.870361328125, -3548.617431640625, -3419.36474609375, -3290.11181640625, -3160.85888671875, -3031.60595703125, -2902.35302734375, -2773.10009765625, -2643.847412109375, -2514.594482421875, -2385.341552734375, -2256.088623046875, -2126.835693359375, -1997.5828857421875, -1868.3299560546875, -1739.0770263671875, -1609.82421875, -1480.5712890625, -1351.318359375, -1222.0654296875, -1092.8125, -963.5596923828125, -834.3067626953125, -705.0538330078125, -575.8009643554688, -446.548095703125, -317.295166015625, -188.04226684570312, -58.78936767578125, 70.46353149414062, 199.7164306640625, 328.9693603515625, 458.22222900390625, 587.47509765625, 716.72802734375, 845.98095703125, 975.2338256835938, 1104.4866943359375, 1233.7396240234375, 1362.9925537109375, 1492.245361328125, 1621.498291015625, 1750.751220703125, 1880.004150390625, 2009.257080078125, 2138.510009765625, 2267.7626953125, 2397.015625, 2526.2685546875, 2655.521484375, 2784.7744140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 17.0, 17.0, 15.0, 24.0, 37.0, 41.0, 69.0, 107.0, 130.0, 188.0, 259.0, 355.0, 534.0, 745.0, 1228.0, 2434.0, 5570.0, 17802.0, 127353.0, 3825317.0, 177984.0, 20937.0, 6863.0, 2857.0, 1398.0, 691.0, 389.0, 229.0, 160.0, 93.0, 89.0, 75.0, 58.0, 44.0, 42.0, 30.0, 25.0, 10.0, 13.0, 12.0, 11.0, 9.0, 8.0, 9.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.859375, -23.989013671875, -23.11865234375, -22.248291015625, -21.3779296875, -20.507568359375, -19.63720703125, -18.766845703125, -17.896484375, -17.026123046875, -16.15576171875, -15.285400390625, -14.4150390625, -13.544677734375, -12.67431640625, -11.803955078125, -10.93359375, -10.063232421875, -9.19287109375, -8.322509765625, -7.4521484375, -6.581787109375, -5.71142578125, -4.841064453125, -3.970703125, -3.100341796875, -2.22998046875, -1.359619140625, -0.4892578125, 0.381103515625, 1.25146484375, 2.121826171875, 2.9921875, 3.862548828125, 4.73291015625, 5.603271484375, 6.4736328125, 7.343994140625, 8.21435546875, 9.084716796875, 9.955078125, 10.825439453125, 11.69580078125, 12.566162109375, 13.4365234375, 14.306884765625, 15.17724609375, 16.047607421875, 16.91796875, 17.788330078125, 18.65869140625, 19.529052734375, 20.3994140625, 21.269775390625, 22.14013671875, 23.010498046875, 23.880859375, 24.751220703125, 25.62158203125, 26.491943359375, 27.3623046875, 28.232666015625, 29.10302734375, 29.973388671875, 30.84375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 10.0, 27.0, 40.0, 52.0, 82.0, 138.0, 163.0, 157.0, 125.0, 105.0, 44.0, 25.0, 11.0, 5.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.064453125, -1.031005859375, -0.99755859375, -0.964111328125, -0.9306640625, -0.897216796875, -0.86376953125, -0.830322265625, -0.796875, -0.763427734375, -0.72998046875, -0.696533203125, -0.6630859375, -0.629638671875, -0.59619140625, -0.562744140625, -0.529296875, -0.495849609375, -0.46240234375, -0.428955078125, -0.3955078125, -0.362060546875, -0.32861328125, -0.295166015625, -0.26171875, -0.228271484375, -0.19482421875, -0.161376953125, -0.1279296875, -0.094482421875, -0.06103515625, -0.027587890625, 0.005859375, 0.039306640625, 0.07275390625, 0.106201171875, 0.1396484375, 0.173095703125, 0.20654296875, 0.239990234375, 0.2734375, 0.306884765625, 0.34033203125, 0.373779296875, 0.4072265625, 0.440673828125, 0.47412109375, 0.507568359375, 0.541015625, 0.574462890625, 0.60791015625, 0.641357421875, 0.6748046875, 0.708251953125, 0.74169921875, 0.775146484375, 0.80859375, 0.842041015625, 0.87548828125, 0.908935546875, 0.9423828125, 0.975830078125, 1.00927734375, 1.042724609375, 1.076171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 12.0, 14.0, 33.0, 30.0, 59.0, 68.0, 94.0, 151.0, 284.0, 491.0, 996.0, 2268.0, 7460.0, 36503.0, 510620.0, 3533991.0, 83406.0, 11938.0, 3187.0, 1196.0, 544.0, 286.0, 175.0, 128.0, 88.0, 51.0, 54.0, 29.0, 16.0, 20.0, 14.0, 16.0, 10.0, 10.0, 11.0, 1.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.203125, -17.481201171875, -16.75927734375, -16.037353515625, -15.3154296875, -14.593505859375, -13.87158203125, -13.149658203125, -12.427734375, -11.705810546875, -10.98388671875, -10.261962890625, -9.5400390625, -8.818115234375, -8.09619140625, -7.374267578125, -6.65234375, -5.930419921875, -5.20849609375, -4.486572265625, -3.7646484375, -3.042724609375, -2.32080078125, -1.598876953125, -0.876953125, -0.155029296875, 0.56689453125, 1.288818359375, 2.0107421875, 2.732666015625, 3.45458984375, 4.176513671875, 4.8984375, 5.620361328125, 6.34228515625, 7.064208984375, 7.7861328125, 8.508056640625, 9.22998046875, 9.951904296875, 10.673828125, 11.395751953125, 12.11767578125, 12.839599609375, 13.5615234375, 14.283447265625, 15.00537109375, 15.727294921875, 16.44921875, 17.171142578125, 17.89306640625, 18.614990234375, 19.3369140625, 20.058837890625, 20.78076171875, 21.502685546875, 22.224609375, 22.946533203125, 23.66845703125, 24.390380859375, 25.1123046875, 25.834228515625, 26.55615234375, 27.278076171875, 28.0]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 13.0, 7.0, 9.0, 12.0, 12.0, 13.0, 17.0, 25.0, 23.0, 52.0, 58.0, 61.0, 82.0, 104.0, 116.0, 166.0, 211.0, 270.0, 397.0, 953.0, 434.0, 280.0, 215.0, 160.0, 100.0, 70.0, 58.0, 40.0, 31.0, 16.0, 22.0, 9.0, 9.0, 10.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.7929840087890625, -2.718780517578125, -2.6445770263671875, -2.57037353515625, -2.4961700439453125, -2.421966552734375, -2.3477630615234375, -2.2735595703125, -2.1993560791015625, -2.125152587890625, -2.0509490966796875, -1.97674560546875, -1.9025421142578125, -1.828338623046875, -1.7541351318359375, -1.679931640625, -1.6057281494140625, -1.531524658203125, -1.4573211669921875, -1.38311767578125, -1.3089141845703125, -1.234710693359375, -1.1605072021484375, -1.0863037109375, -1.0121002197265625, -0.937896728515625, -0.8636932373046875, -0.78948974609375, -0.7152862548828125, -0.641082763671875, -0.5668792724609375, -0.49267578125, -0.4184722900390625, -0.344268798828125, -0.2700653076171875, -0.19586181640625, -0.1216583251953125, -0.047454833984375, 0.0267486572265625, 0.1009521484375, 0.1751556396484375, 0.249359130859375, 0.3235626220703125, 0.39776611328125, 0.4719696044921875, 0.546173095703125, 0.6203765869140625, 0.694580078125, 0.7687835693359375, 0.842987060546875, 0.9171905517578125, 0.99139404296875, 1.0655975341796875, 1.139801025390625, 1.2140045166015625, 1.2882080078125, 1.3624114990234375, 1.436614990234375, 1.5108184814453125, 1.58502197265625, 1.6592254638671875, 1.733428955078125, 1.8076324462890625, 1.8818359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 7.0, 8.0, 34.0, 104.0, 326.0, 509.0, 24.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.809326171875, -265.9299621582031, -260.0505676269531, -254.17120361328125, -248.29183959960938, -242.41246032714844, -236.5330810546875, -230.65371704101562, -224.7743377685547, -218.89495849609375, -213.01559448242188, -207.13621520996094, -201.2568359375, -195.37747192382812, -189.4980926513672, -183.61871337890625, -177.73934936523438, -171.85997009277344, -165.98060607910156, -160.10122680664062, -154.22186279296875, -148.3424835205078, -142.46310424804688, -136.583740234375, -130.70436096191406, -124.82498931884766, -118.94561767578125, -113.06623840332031, -107.1868667602539, -101.3074951171875, -95.42811584472656, -89.54874420166016, -83.66937255859375, -77.79000091552734, -71.91062927246094, -66.03125, -60.151878356933594, -54.27250671386719, -48.393131256103516, -42.513755798339844, -36.63438415527344, -30.7550106048584, -24.87563705444336, -18.99626350402832, -13.116889953613281, -7.237516403198242, -1.3581428527832031, 4.521232604980469, 10.400604248046875, 16.279977798461914, 22.159351348876953, 28.038724899291992, 33.91809844970703, 39.79747009277344, 45.67684555053711, 51.55622100830078, 57.43559265136719, 63.314964294433594, 69.1943359375, 75.07371520996094, 80.95308685302734, 86.83245849609375, 92.71183776855469, 98.5912094116211, 104.4705810546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 9.0, 16.0, 18.0, 21.0, 43.0, 38.0, 63.0, 64.0, 98.0, 91.0, 94.0, 94.0, 74.0, 76.0, 55.0, 42.0, 32.0, 20.0, 24.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.99345016479492, -46.60926818847656, -45.2250862121582, -43.840904235839844, -42.456722259521484, -41.072540283203125, -39.688358306884766, -38.304176330566406, -36.91999435424805, -35.53581237792969, -34.15163040161133, -32.76744842529297, -31.38326644897461, -29.99908447265625, -28.61490249633789, -27.23072052001953, -25.84653663635254, -24.46235466003418, -23.07817268371582, -21.69399070739746, -20.3098087310791, -18.925626754760742, -17.54144287109375, -16.15726089477539, -14.773079872131348, -13.388897895812988, -12.004715919494629, -10.620532989501953, -9.236351013183594, -7.852169513702393, -6.467987060546875, -5.083805084228516, -3.6996231079101562, -2.315441131591797, -0.9312589168548584, 0.4529232978820801, 1.8371052742004395, 3.221287250518799, 4.605469703674316, 5.989651679992676, 7.373833656311035, 8.758015632629395, 10.142197608947754, 11.52638053894043, 12.910562515258789, 14.294744491577148, 15.678926467895508, 17.063108444213867, 18.447290420532227, 19.831472396850586, 21.215654373168945, 22.599836349487305, 23.984018325805664, 25.368200302124023, 26.752384185791016, 28.136566162109375, 29.520748138427734, 30.904930114746094, 32.28911209106445, 33.67329406738281, 35.05747604370117, 36.44165802001953, 37.82583999633789, 39.21002197265625, 40.59420394897461]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 12.0, 13.0, 30.0, 16.0, 25.0, 30.0, 52.0, 80.0, 75.0, 129.0, 151.0, 260.0, 373.0, 546.0, 858.0, 1379.0, 2524.0, 5013.0, 14703.0, 70060.0, 665135.0, 236220.0, 33180.0, 8859.0, 3653.0, 1863.0, 1052.0, 688.0, 445.0, 304.0, 217.0, 156.0, 122.0, 65.0, 49.0, 63.0, 38.0, 23.0, 21.0, 18.0, 14.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.5, -8.24072265625, -7.9814453125, -7.72216796875, -7.462890625, -7.20361328125, -6.9443359375, -6.68505859375, -6.42578125, -6.16650390625, -5.9072265625, -5.64794921875, -5.388671875, -5.12939453125, -4.8701171875, -4.61083984375, -4.3515625, -4.09228515625, -3.8330078125, -3.57373046875, -3.314453125, -3.05517578125, -2.7958984375, -2.53662109375, -2.27734375, -2.01806640625, -1.7587890625, -1.49951171875, -1.240234375, -0.98095703125, -0.7216796875, -0.46240234375, -0.203125, 0.05615234375, 0.3154296875, 0.57470703125, 0.833984375, 1.09326171875, 1.3525390625, 1.61181640625, 1.87109375, 2.13037109375, 2.3896484375, 2.64892578125, 2.908203125, 3.16748046875, 3.4267578125, 3.68603515625, 3.9453125, 4.20458984375, 4.4638671875, 4.72314453125, 4.982421875, 5.24169921875, 5.5009765625, 5.76025390625, 6.01953125, 6.27880859375, 6.5380859375, 6.79736328125, 7.056640625, 7.31591796875, 7.5751953125, 7.83447265625, 8.09375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 27.0, 48.0, 65.0, 98.0, 127.0, 136.0, 155.0, 112.0, 64.0, 62.0, 22.0, 20.0, 8.0, 4.0, 0.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2568359375, -1.2257919311523438, -1.1947479248046875, -1.1637039184570312, -1.132659912109375, -1.1016159057617188, -1.0705718994140625, -1.0395278930664062, -1.00848388671875, -0.9774398803710938, -0.9463958740234375, -0.9153518676757812, -0.884307861328125, -0.8532638549804688, -0.8222198486328125, -0.7911758422851562, -0.7601318359375, -0.7290878295898438, -0.6980438232421875, -0.6669998168945312, -0.635955810546875, -0.6049118041992188, -0.5738677978515625, -0.5428237915039062, -0.51177978515625, -0.48073577880859375, -0.4496917724609375, -0.41864776611328125, -0.387603759765625, -0.35655975341796875, -0.3255157470703125, -0.29447174072265625, -0.263427734375, -0.23238372802734375, -0.2013397216796875, -0.17029571533203125, -0.139251708984375, -0.10820770263671875, -0.0771636962890625, -0.04611968994140625, -0.01507568359375, 0.01596832275390625, 0.0470123291015625, 0.07805633544921875, 0.109100341796875, 0.14014434814453125, 0.1711883544921875, 0.20223236083984375, 0.2332763671875, 0.26432037353515625, 0.2953643798828125, 0.32640838623046875, 0.357452392578125, 0.38849639892578125, 0.4195404052734375, 0.45058441162109375, 0.48162841796875, 0.5126724243164062, 0.5437164306640625, 0.5747604370117188, 0.605804443359375, 0.6368484497070312, 0.6678924560546875, 0.6989364624023438, 0.72998046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 12.0, 12.0, 18.0, 36.0, 55.0, 154.0, 326.0, 883.0, 2650.0, 14076.0, 413344.0, 596855.0, 15669.0, 2924.0, 876.0, 338.0, 141.0, 70.0, 40.0, 18.0, 17.0, 12.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.09375, -27.31396484375, -26.5341796875, -25.75439453125, -24.974609375, -24.19482421875, -23.4150390625, -22.63525390625, -21.85546875, -21.07568359375, -20.2958984375, -19.51611328125, -18.736328125, -17.95654296875, -17.1767578125, -16.39697265625, -15.6171875, -14.83740234375, -14.0576171875, -13.27783203125, -12.498046875, -11.71826171875, -10.9384765625, -10.15869140625, -9.37890625, -8.59912109375, -7.8193359375, -7.03955078125, -6.259765625, -5.47998046875, -4.7001953125, -3.92041015625, -3.140625, -2.36083984375, -1.5810546875, -0.80126953125, -0.021484375, 0.75830078125, 1.5380859375, 2.31787109375, 3.09765625, 3.87744140625, 4.6572265625, 5.43701171875, 6.216796875, 6.99658203125, 7.7763671875, 8.55615234375, 9.3359375, 10.11572265625, 10.8955078125, 11.67529296875, 12.455078125, 13.23486328125, 14.0146484375, 14.79443359375, 15.57421875, 16.35400390625, 17.1337890625, 17.91357421875, 18.693359375, 19.47314453125, 20.2529296875, 21.03271484375, 21.8125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 12.0, 20.0, 23.0, 23.0, 37.0, 33.0, 33.0, 63.0, 68.0, 65.0, 72.0, 70.0, 63.0, 65.0, 56.0, 45.0, 52.0, 44.0, 30.0, 25.0, 16.0, 21.0, 16.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.2115478515625, -5.020751953125, -4.8299560546875, -4.63916015625, -4.4483642578125, -4.257568359375, -4.0667724609375, -3.8759765625, -3.6851806640625, -3.494384765625, -3.3035888671875, -3.11279296875, -2.9219970703125, -2.731201171875, -2.5404052734375, -2.349609375, -2.1588134765625, -1.968017578125, -1.7772216796875, -1.58642578125, -1.3956298828125, -1.204833984375, -1.0140380859375, -0.8232421875, -0.6324462890625, -0.441650390625, -0.2508544921875, -0.06005859375, 0.1307373046875, 0.321533203125, 0.5123291015625, 0.703125, 0.8939208984375, 1.084716796875, 1.2755126953125, 1.46630859375, 1.6571044921875, 1.847900390625, 2.0386962890625, 2.2294921875, 2.4202880859375, 2.611083984375, 2.8018798828125, 2.99267578125, 3.1834716796875, 3.374267578125, 3.5650634765625, 3.755859375, 3.9466552734375, 4.137451171875, 4.3282470703125, 4.51904296875, 4.7098388671875, 4.900634765625, 5.0914306640625, 5.2822265625, 5.4730224609375, 5.663818359375, 5.8546142578125, 6.04541015625, 6.2362060546875, 6.427001953125, 6.6177978515625, 6.80859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 3.0, 6.0, 11.0, 9.0, 20.0, 16.0, 37.0, 76.0, 183.0, 414.0, 1239.0, 12699.0, 1027252.0, 5032.0, 951.0, 288.0, 138.0, 62.0, 47.0, 18.0, 12.0, 13.0, 7.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.25, -157.52734375, -152.8046875, -148.08203125, -143.359375, -138.63671875, -133.9140625, -129.19140625, -124.46875, -119.74609375, -115.0234375, -110.30078125, -105.578125, -100.85546875, -96.1328125, -91.41015625, -86.6875, -81.96484375, -77.2421875, -72.51953125, -67.796875, -63.07421875, -58.3515625, -53.62890625, -48.90625, -44.18359375, -39.4609375, -34.73828125, -30.015625, -25.29296875, -20.5703125, -15.84765625, -11.125, -6.40234375, -1.6796875, 3.04296875, 7.765625, 12.48828125, 17.2109375, 21.93359375, 26.65625, 31.37890625, 36.1015625, 40.82421875, 45.546875, 50.26953125, 54.9921875, 59.71484375, 64.4375, 69.16015625, 73.8828125, 78.60546875, 83.328125, 88.05078125, 92.7734375, 97.49609375, 102.21875, 106.94140625, 111.6640625, 116.38671875, 121.109375, 125.83203125, 130.5546875, 135.27734375, 140.0]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 3.0, 4.0, 3.0, 7.0, 14.0, 19.0, 49.0, 183.0, 401.0, 184.0, 64.0, 27.0, 17.0, 8.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008707046508789062, -0.0008210986852645874, -0.0007714927196502686, -0.0007218867540359497, -0.0006722807884216309, -0.000622674822807312, -0.0005730688571929932, -0.0005234628915786743, -0.00047385692596435547, -0.0004242509603500366, -0.0003746449947357178, -0.0003250390291213989, -0.0002754330635070801, -0.00022582709789276123, -0.00017622113227844238, -0.00012661516666412354, -7.700920104980469e-05, -2.740323543548584e-05, 2.2202730178833008e-05, 7.180869579315186e-05, 0.0001214146614074707, 0.00017102062702178955, 0.0002206265926361084, 0.00027023255825042725, 0.0003198385238647461, 0.00036944448947906494, 0.0004190504550933838, 0.00046865642070770264, 0.0005182623863220215, 0.0005678683519363403, 0.0006174743175506592, 0.000667080283164978, 0.0007166862487792969, 0.0007662922143936157, 0.0008158981800079346, 0.0008655041456222534, 0.0009151101112365723, 0.0009647160768508911, 0.00101432204246521, 0.0010639280080795288, 0.0011135339736938477, 0.0011631399393081665, 0.0012127459049224854, 0.0012623518705368042, 0.001311957836151123, 0.001361563801765442, 0.0014111697673797607, 0.0014607757329940796, 0.0015103816986083984, 0.0015599876642227173, 0.0016095936298370361, 0.001659199595451355, 0.0017088055610656738, 0.0017584115266799927, 0.0018080174922943115, 0.0018576234579086304, 0.0019072294235229492, 0.001956835389137268, 0.002006441354751587, 0.0020560473203659058, 0.0021056532859802246, 0.0021552592515945435, 0.0022048652172088623, 0.002254471182823181, 0.0023040771484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 6.0, 9.0, 6.0, 12.0, 15.0, 11.0, 39.0, 36.0, 50.0, 70.0, 76.0, 147.0, 219.0, 375.0, 601.0, 1132.0, 2358.0, 5451.0, 18366.0, 810817.0, 185539.0, 13937.0, 4726.0, 1999.0, 1034.0, 542.0, 297.0, 193.0, 152.0, 95.0, 68.0, 31.0, 39.0, 23.0, 20.0, 19.0, 14.0, 7.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.8125, -25.916015625, -25.01953125, -24.123046875, -23.2265625, -22.330078125, -21.43359375, -20.537109375, -19.640625, -18.744140625, -17.84765625, -16.951171875, -16.0546875, -15.158203125, -14.26171875, -13.365234375, -12.46875, -11.572265625, -10.67578125, -9.779296875, -8.8828125, -7.986328125, -7.08984375, -6.193359375, -5.296875, -4.400390625, -3.50390625, -2.607421875, -1.7109375, -0.814453125, 0.08203125, 0.978515625, 1.875, 2.771484375, 3.66796875, 4.564453125, 5.4609375, 6.357421875, 7.25390625, 8.150390625, 9.046875, 9.943359375, 10.83984375, 11.736328125, 12.6328125, 13.529296875, 14.42578125, 15.322265625, 16.21875, 17.115234375, 18.01171875, 18.908203125, 19.8046875, 20.701171875, 21.59765625, 22.494140625, 23.390625, 24.287109375, 25.18359375, 26.080078125, 26.9765625, 27.873046875, 28.76953125, 29.666015625, 30.5625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 5.0, 7.0, 7.0, 9.0, 11.0, 17.0, 32.0, 61.0, 252.0, 354.0, 124.0, 33.0, 20.0, 11.0, 11.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-18.5625, -18.064453125, -17.56640625, -17.068359375, -16.5703125, -16.072265625, -15.57421875, -15.076171875, -14.578125, -14.080078125, -13.58203125, -13.083984375, -12.5859375, -12.087890625, -11.58984375, -11.091796875, -10.59375, -10.095703125, -9.59765625, -9.099609375, -8.6015625, -8.103515625, -7.60546875, -7.107421875, -6.609375, -6.111328125, -5.61328125, -5.115234375, -4.6171875, -4.119140625, -3.62109375, -3.123046875, -2.625, -2.126953125, -1.62890625, -1.130859375, -0.6328125, -0.134765625, 0.36328125, 0.861328125, 1.359375, 1.857421875, 2.35546875, 2.853515625, 3.3515625, 3.849609375, 4.34765625, 4.845703125, 5.34375, 5.841796875, 6.33984375, 6.837890625, 7.3359375, 7.833984375, 8.33203125, 8.830078125, 9.328125, 9.826171875, 10.32421875, 10.822265625, 11.3203125, 11.818359375, 12.31640625, 12.814453125, 13.3125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 20.0, 63.0, 132.0, 394.0, 264.0, 75.0, 23.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.96810913085938, -172.7336883544922, -165.499267578125, -158.2648468017578, -151.03042602539062, -143.7960205078125, -136.56158447265625, -129.32717895507812, -122.09275817871094, -114.85833740234375, -107.62391662597656, -100.38949584960938, -93.15508270263672, -85.92066192626953, -78.68624114990234, -71.45182800292969, -64.21739959716797, -56.98297882080078, -49.74856185913086, -42.51414108276367, -35.27972412109375, -28.045303344726562, -20.810882568359375, -13.576465606689453, -6.342044830322266, 0.8923745155334473, 8.12679386138916, 15.361213684082031, 22.595632553100586, 29.83005142211914, 37.06447219848633, 44.29888916015625, 51.53330993652344, 58.767730712890625, 66.00215148925781, 73.236572265625, 80.47098541259766, 87.70540618896484, 94.93982696533203, 102.17424011230469, 109.40866088867188, 116.64308166503906, 123.87750244140625, 131.11192321777344, 138.34634399414062, 145.58074951171875, 152.815185546875, 160.04959106445312, 167.28402709960938, 174.51844787597656, 181.75286865234375, 188.98728942871094, 196.22171020507812, 203.45611572265625, 210.6905517578125, 217.92495727539062, 225.1593780517578, 232.393798828125, 239.6282196044922, 246.86264038085938, 254.09706115722656, 261.33148193359375, 268.5658874511719, 275.8003234863281, 283.03472900390625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 17.0, 16.0, 27.0, 36.0, 56.0, 73.0, 86.0, 102.0, 100.0, 97.0, 92.0, 72.0, 61.0, 42.0, 39.0, 18.0, 10.0, 12.0, 3.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.634521484375, -71.15935516357422, -68.68419647216797, -66.20903015136719, -63.73386764526367, -61.258705139160156, -58.783538818359375, -56.30837631225586, -53.833213806152344, -51.35805130004883, -48.88288497924805, -46.40772247314453, -43.932559967041016, -41.4573974609375, -38.98223114013672, -36.5070686340332, -34.03190231323242, -31.556737899780273, -29.081575393676758, -26.60641098022461, -24.131248474121094, -21.656084060668945, -19.180919647216797, -16.70575714111328, -14.230592727661133, -11.7554292678833, -9.280265808105469, -6.80510139465332, -4.329937934875488, -1.8547744750976562, 0.6203899383544922, 3.095552444458008, 5.570716857910156, 8.045880317687988, 10.52104377746582, 12.996208190917969, 15.4713716506958, 17.946535110473633, 20.42169952392578, 22.896862030029297, 25.372026443481445, 27.847190856933594, 30.32235336303711, 32.797515869140625, 35.272682189941406, 37.74784469604492, 40.22300720214844, 42.69817352294922, 45.173336029052734, 47.64849853515625, 50.12366485595703, 52.59882736206055, 55.07398986816406, 57.549156188964844, 60.02431869506836, 62.499481201171875, 64.97464752197266, 67.44981384277344, 69.92497253417969, 72.40013885498047, 74.87530517578125, 77.3504638671875, 79.82563018798828, 82.30079650878906, 84.77595520019531]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 9.0, 14.0, 21.0, 33.0, 131.0, 717.0, 4183262.0, 9850.0, 160.0, 37.0, 20.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2039.0, -1987.765625, -1936.53125, -1885.296875, -1834.0625, -1782.828125, -1731.59375, -1680.359375, -1629.125, -1577.890625, -1526.65625, -1475.421875, -1424.1875, -1372.953125, -1321.71875, -1270.484375, -1219.25, -1168.015625, -1116.78125, -1065.546875, -1014.3125, -963.078125, -911.84375, -860.609375, -809.375, -758.140625, -706.90625, -655.671875, -604.4375, -553.203125, -501.96875, -450.734375, -399.5, -348.265625, -297.03125, -245.796875, -194.5625, -143.328125, -92.09375, -40.859375, 10.375, 61.609375, 112.84375, 164.078125, 215.3125, 266.546875, 317.78125, 369.015625, 420.25, 471.484375, 522.71875, 573.953125, 625.1875, 676.421875, 727.65625, 778.890625, 830.125, 881.359375, 932.59375, 983.828125, 1035.0625, 1086.296875, 1137.53125, 1188.765625, 1240.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 13.0, 9.0, 28.0, 25.0, 60.0, 73.0, 91.0, 108.0, 114.0, 102.0, 104.0, 80.0, 59.0, 36.0, 27.0, 21.0, 12.0, 8.0, 3.0, 6.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.3743438720703125, -1.340484619140625, -1.3066253662109375, -1.27276611328125, -1.2389068603515625, -1.205047607421875, -1.1711883544921875, -1.1373291015625, -1.1034698486328125, -1.069610595703125, -1.0357513427734375, -1.00189208984375, -0.9680328369140625, -0.934173583984375, -0.9003143310546875, -0.866455078125, -0.8325958251953125, -0.798736572265625, -0.7648773193359375, -0.73101806640625, -0.6971588134765625, -0.663299560546875, -0.6294403076171875, -0.5955810546875, -0.5617218017578125, -0.527862548828125, -0.4940032958984375, -0.46014404296875, -0.4262847900390625, -0.392425537109375, -0.3585662841796875, -0.32470703125, -0.2908477783203125, -0.256988525390625, -0.2231292724609375, -0.18927001953125, -0.1554107666015625, -0.121551513671875, -0.0876922607421875, -0.0538330078125, -0.0199737548828125, 0.013885498046875, 0.0477447509765625, 0.08160400390625, 0.1154632568359375, 0.149322509765625, 0.1831817626953125, 0.217041015625, 0.2509002685546875, 0.284759521484375, 0.3186187744140625, 0.35247802734375, 0.3863372802734375, 0.420196533203125, 0.4540557861328125, 0.4879150390625, 0.5217742919921875, 0.555633544921875, 0.5894927978515625, 0.62335205078125, 0.6572113037109375, 0.691070556640625, 0.7249298095703125, 0.7587890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 11.0, 26.0, 108.0, 382.0, 4183171.0, 9476.0, 447.0, 266.0, 174.0, 110.0, 52.0, 33.0, 17.0, 6.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.0, -89.484375, -73.96875, -58.453125, -42.9375, -27.421875, -11.90625, 3.609375, 19.125, 34.640625, 50.15625, 65.671875, 81.1875, 96.703125, 112.21875, 127.734375, 143.25, 158.765625, 174.28125, 189.796875, 205.3125, 220.828125, 236.34375, 251.859375, 267.375, 282.890625, 298.40625, 313.921875, 329.4375, 344.953125, 360.46875, 375.984375, 391.5, 407.015625, 422.53125, 438.046875, 453.5625, 469.078125, 484.59375, 500.109375, 515.625, 531.140625, 546.65625, 562.171875, 577.6875, 593.203125, 608.71875, 624.234375, 639.75, 655.265625, 670.78125, 686.296875, 701.8125, 717.328125, 732.84375, 748.359375, 763.875, 779.390625, 794.90625, 810.421875, 825.9375, 841.453125, 856.96875, 872.484375, 888.0]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 32.0, 43.0, 83.0, 246.0, 1566.0, 974.0, 462.0, 282.0, 184.0, 82.0, 50.0, 26.0, 16.0, 12.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.732391357421875, -2.58001708984375, -2.427642822265625, -2.2752685546875, -2.122894287109375, -1.97052001953125, -1.818145751953125, -1.665771484375, -1.513397216796875, -1.36102294921875, -1.208648681640625, -1.0562744140625, -0.903900146484375, -0.75152587890625, -0.599151611328125, -0.44677734375, -0.294403076171875, -0.14202880859375, 0.010345458984375, 0.1627197265625, 0.315093994140625, 0.46746826171875, 0.619842529296875, 0.772216796875, 0.924591064453125, 1.07696533203125, 1.229339599609375, 1.3817138671875, 1.534088134765625, 1.68646240234375, 1.838836669921875, 1.9912109375, 2.143585205078125, 2.29595947265625, 2.448333740234375, 2.6007080078125, 2.753082275390625, 2.90545654296875, 3.057830810546875, 3.210205078125, 3.362579345703125, 3.51495361328125, 3.667327880859375, 3.8197021484375, 3.972076416015625, 4.12445068359375, 4.276824951171875, 4.42919921875, 4.581573486328125, 4.73394775390625, 4.886322021484375, 5.0386962890625, 5.191070556640625, 5.34344482421875, 5.495819091796875, 5.648193359375, 5.800567626953125, 5.95294189453125, 6.105316162109375, 6.2576904296875, 6.410064697265625, 6.56243896484375, 6.714813232421875, 6.8671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [612.0, 391.0, 16.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.79662322998047, 3.957538604736328, 64.71170043945312, 125.46585845947266, 186.22003173828125, 246.97418212890625, 307.72833251953125, 368.4825134277344, 429.2366638183594, 489.9908142089844, 550.7449951171875, 611.4991455078125, 672.2532958984375, 733.0074462890625, 793.7615966796875, 854.5158081054688, 915.2699584960938, 976.0241088867188, 1036.7783203125, 1097.532470703125, 1158.28662109375, 1219.040771484375, 1279.794921875, 1340.549072265625, 1401.30322265625, 1462.057373046875, 1522.8115234375, 1583.565673828125, 1644.31982421875, 1705.073974609375, 1765.828125, 1826.5823974609375, 1887.3365478515625, 1948.0906982421875, 2008.8448486328125, 2069.59912109375, 2130.353271484375, 2191.107421875, 2251.861572265625, 2312.61572265625, 2373.369873046875, 2434.1240234375, 2494.878173828125, 2555.63232421875, 2616.386474609375, 2677.140625, 2737.894775390625, 2798.64892578125, 2859.403076171875, 2920.1572265625, 2980.911376953125, 3041.66552734375, 3102.419677734375, 3163.173828125, 3223.927978515625, 3284.68212890625, 3345.4365234375, 3406.190673828125, 3466.94482421875, 3527.698974609375, 3588.453125, 3649.207275390625, 3709.96142578125, 3770.715576171875, 3831.4697265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 15.0, 28.0, 42.0, 81.0, 107.0, 146.0, 165.0, 142.0, 112.0, 82.0, 40.0, 19.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.37444305419922, -54.753570556640625, -50.13269805908203, -45.51182556152344, -40.890953063964844, -36.27008056640625, -31.649208068847656, -27.028335571289062, -22.40746307373047, -17.786590576171875, -13.165718078613281, -8.544845581054688, -3.9239730834960938, 0.6968994140625, 5.317771911621094, 9.938644409179688, 14.559516906738281, 19.180389404296875, 23.80126190185547, 28.422134399414062, 33.043006896972656, 37.66387939453125, 42.284751892089844, 46.90562438964844, 51.52649688720703, 56.147369384765625, 60.76824188232422, 65.38911437988281, 70.0099868774414, 74.630859375, 79.2517318725586, 83.87260437011719, 88.49346923828125, 93.11434173583984, 97.73521423339844, 102.35608673095703, 106.97695922851562, 111.59783172607422, 116.21870422363281, 120.8395767211914, 125.46044921875, 130.08132934570312, 134.7021942138672, 139.32305908203125, 143.94393920898438, 148.5648193359375, 153.18568420410156, 157.80654907226562, 162.42742919921875, 167.04830932617188, 171.66917419433594, 176.2900390625, 180.91091918945312, 185.53179931640625, 190.1526641845703, 194.77352905273438, 199.3944091796875, 204.01528930664062, 208.6361541748047, 213.25701904296875, 217.87789916992188, 222.498779296875, 227.11964416503906, 231.74050903320312, 236.36138916015625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 5.0, 13.0, 17.0, 16.0, 29.0, 33.0, 51.0, 67.0, 94.0, 157.0, 239.0, 376.0, 630.0, 1151.0, 1975.0, 3994.0, 8749.0, 22778.0, 79935.0, 537640.0, 304284.0, 54487.0, 17206.0, 7057.0, 3252.0, 1685.0, 1023.0, 558.0, 357.0, 205.0, 141.0, 98.0, 68.0, 48.0, 30.0, 24.0, 17.0, 20.0, 11.0, 5.0, 9.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.77587890625, -10.4267578125, -10.07763671875, -9.728515625, -9.37939453125, -9.0302734375, -8.68115234375, -8.33203125, -7.98291015625, -7.6337890625, -7.28466796875, -6.935546875, -6.58642578125, -6.2373046875, -5.88818359375, -5.5390625, -5.18994140625, -4.8408203125, -4.49169921875, -4.142578125, -3.79345703125, -3.4443359375, -3.09521484375, -2.74609375, -2.39697265625, -2.0478515625, -1.69873046875, -1.349609375, -1.00048828125, -0.6513671875, -0.30224609375, 0.046875, 0.39599609375, 0.7451171875, 1.09423828125, 1.443359375, 1.79248046875, 2.1416015625, 2.49072265625, 2.83984375, 3.18896484375, 3.5380859375, 3.88720703125, 4.236328125, 4.58544921875, 4.9345703125, 5.28369140625, 5.6328125, 5.98193359375, 6.3310546875, 6.68017578125, 7.029296875, 7.37841796875, 7.7275390625, 8.07666015625, 8.42578125, 8.77490234375, 9.1240234375, 9.47314453125, 9.822265625, 10.17138671875, 10.5205078125, 10.86962890625, 11.21875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 7.0, 9.0, 15.0, 22.0, 37.0, 34.0, 56.0, 78.0, 82.0, 85.0, 107.0, 112.0, 91.0, 74.0, 58.0, 44.0, 27.0, 20.0, 13.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.380859375, -1.3483505249023438, -1.3158416748046875, -1.2833328247070312, -1.250823974609375, -1.2183151245117188, -1.1858062744140625, -1.1532974243164062, -1.12078857421875, -1.0882797241210938, -1.0557708740234375, -1.0232620239257812, -0.990753173828125, -0.9582443237304688, -0.9257354736328125, -0.8932266235351562, -0.8607177734375, -0.8282089233398438, -0.7957000732421875, -0.7631912231445312, -0.730682373046875, -0.6981735229492188, -0.6656646728515625, -0.6331558227539062, -0.60064697265625, -0.5681381225585938, -0.5356292724609375, -0.5031204223632812, -0.470611572265625, -0.43810272216796875, -0.4055938720703125, -0.37308502197265625, -0.340576171875, -0.30806732177734375, -0.2755584716796875, -0.24304962158203125, -0.210540771484375, -0.17803192138671875, -0.1455230712890625, -0.11301422119140625, -0.08050537109375, -0.04799652099609375, -0.0154876708984375, 0.01702117919921875, 0.049530029296875, 0.08203887939453125, 0.1145477294921875, 0.14705657958984375, 0.1795654296875, 0.21207427978515625, 0.2445831298828125, 0.27709197998046875, 0.309600830078125, 0.34210968017578125, 0.3746185302734375, 0.40712738037109375, 0.43963623046875, 0.47214508056640625, 0.5046539306640625, 0.5371627807617188, 0.569671630859375, 0.6021804809570312, 0.6346893310546875, 0.6671981811523438, 0.69970703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 10.0, 6.0, 8.0, 16.0, 16.0, 16.0, 29.0, 39.0, 39.0, 99.0, 340.0, 3429.0, 206081.0, 828438.0, 9057.0, 628.0, 104.0, 46.0, 22.0, 20.0, 24.0, 14.0, 11.0, 14.0, 14.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.55322265625, -35.4501953125, -34.34716796875, -33.244140625, -32.14111328125, -31.0380859375, -29.93505859375, -28.83203125, -27.72900390625, -26.6259765625, -25.52294921875, -24.419921875, -23.31689453125, -22.2138671875, -21.11083984375, -20.0078125, -18.90478515625, -17.8017578125, -16.69873046875, -15.595703125, -14.49267578125, -13.3896484375, -12.28662109375, -11.18359375, -10.08056640625, -8.9775390625, -7.87451171875, -6.771484375, -5.66845703125, -4.5654296875, -3.46240234375, -2.359375, -1.25634765625, -0.1533203125, 0.94970703125, 2.052734375, 3.15576171875, 4.2587890625, 5.36181640625, 6.46484375, 7.56787109375, 8.6708984375, 9.77392578125, 10.876953125, 11.97998046875, 13.0830078125, 14.18603515625, 15.2890625, 16.39208984375, 17.4951171875, 18.59814453125, 19.701171875, 20.80419921875, 21.9072265625, 23.01025390625, 24.11328125, 25.21630859375, 26.3193359375, 27.42236328125, 28.525390625, 29.62841796875, 30.7314453125, 31.83447265625, 32.9375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 8.0, 11.0, 18.0, 20.0, 23.0, 25.0, 21.0, 23.0, 29.0, 41.0, 42.0, 38.0, 46.0, 53.0, 41.0, 54.0, 44.0, 55.0, 49.0, 32.0, 28.0, 32.0, 29.0, 29.0, 19.0, 26.0, 22.0, 24.0, 20.0, 17.0, 7.0, 11.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.029296875, -2.92852783203125, -2.8277587890625, -2.72698974609375, -2.626220703125, -2.52545166015625, -2.4246826171875, -2.32391357421875, -2.22314453125, -2.12237548828125, -2.0216064453125, -1.92083740234375, -1.820068359375, -1.71929931640625, -1.6185302734375, -1.51776123046875, -1.4169921875, -1.31622314453125, -1.2154541015625, -1.11468505859375, -1.013916015625, -0.91314697265625, -0.8123779296875, -0.71160888671875, -0.61083984375, -0.51007080078125, -0.4093017578125, -0.30853271484375, -0.207763671875, -0.10699462890625, -0.0062255859375, 0.09454345703125, 0.1953125, 0.29608154296875, 0.3968505859375, 0.49761962890625, 0.598388671875, 0.69915771484375, 0.7999267578125, 0.90069580078125, 1.00146484375, 1.10223388671875, 1.2030029296875, 1.30377197265625, 1.404541015625, 1.50531005859375, 1.6060791015625, 1.70684814453125, 1.8076171875, 1.90838623046875, 2.0091552734375, 2.10992431640625, 2.210693359375, 2.31146240234375, 2.4122314453125, 2.51300048828125, 2.61376953125, 2.71453857421875, 2.8153076171875, 2.91607666015625, 3.016845703125, 3.11761474609375, 3.2183837890625, 3.31915283203125, 3.419921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 15.0, 33.0, 75.0, 386.0, 6521.0, 1039963.0, 1302.0, 167.0, 48.0, 13.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-397.75, -388.11328125, -378.4765625, -368.83984375, -359.203125, -349.56640625, -339.9296875, -330.29296875, -320.65625, -311.01953125, -301.3828125, -291.74609375, -282.109375, -272.47265625, -262.8359375, -253.19921875, -243.5625, -233.92578125, -224.2890625, -214.65234375, -205.015625, -195.37890625, -185.7421875, -176.10546875, -166.46875, -156.83203125, -147.1953125, -137.55859375, -127.921875, -118.28515625, -108.6484375, -99.01171875, -89.375, -79.73828125, -70.1015625, -60.46484375, -50.828125, -41.19140625, -31.5546875, -21.91796875, -12.28125, -2.64453125, 6.9921875, 16.62890625, 26.265625, 35.90234375, 45.5390625, 55.17578125, 64.8125, 74.44921875, 84.0859375, 93.72265625, 103.359375, 112.99609375, 122.6328125, 132.26953125, 141.90625, 151.54296875, 161.1796875, 170.81640625, 180.453125, 190.08984375, 199.7265625, 209.36328125, 219.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 9.0, 15.0, 28.0, 69.0, 152.0, 295.0, 220.0, 77.0, 43.0, 27.0, 14.0, 14.0, 8.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007638931274414062, -0.000738188624382019, -0.0007124841213226318, -0.0006867796182632446, -0.0006610751152038574, -0.0006353706121444702, -0.000609666109085083, -0.0005839616060256958, -0.0005582571029663086, -0.0005325525999069214, -0.0005068480968475342, -0.00048114359378814697, -0.00045543909072875977, -0.00042973458766937256, -0.00040403008460998535, -0.00037832558155059814, -0.00035262107849121094, -0.00032691657543182373, -0.0003012120723724365, -0.0002755075693130493, -0.0002498030662536621, -0.0002240985631942749, -0.0001983940601348877, -0.0001726895570755005, -0.00014698505401611328, -0.00012128055095672607, -9.557604789733887e-05, -6.987154483795166e-05, -4.416704177856445e-05, -1.8462538719177246e-05, 7.241964340209961e-06, 3.294646739959717e-05, 5.8650970458984375e-05, 8.435547351837158e-05, 0.00011005997657775879, 0.000135764479637146, 0.0001614689826965332, 0.0001871734857559204, 0.00021287798881530762, 0.00023858249187469482, 0.00026428699493408203, 0.00028999149799346924, 0.00031569600105285645, 0.00034140050411224365, 0.00036710500717163086, 0.00039280951023101807, 0.0004185140132904053, 0.0004442185163497925, 0.0004699230194091797, 0.0004956275224685669, 0.0005213320255279541, 0.0005470365285873413, 0.0005727410316467285, 0.0005984455347061157, 0.0006241500377655029, 0.0006498545408248901, 0.0006755590438842773, 0.0007012635469436646, 0.0007269680500030518, 0.000752672553062439, 0.0007783770561218262, 0.0008040815591812134, 0.0008297860622406006, 0.0008554905652999878, 0.000881195068359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 4.0, 4.0, 10.0, 21.0, 34.0, 59.0, 83.0, 149.0, 240.0, 485.0, 853.0, 1742.0, 3948.0, 11079.0, 78522.0, 915925.0, 23559.0, 6407.0, 2589.0, 1174.0, 691.0, 390.0, 215.0, 134.0, 104.0, 44.0, 31.0, 19.0, 11.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-54.90625, -53.5078125, -52.109375, -50.7109375, -49.3125, -47.9140625, -46.515625, -45.1171875, -43.71875, -42.3203125, -40.921875, -39.5234375, -38.125, -36.7265625, -35.328125, -33.9296875, -32.53125, -31.1328125, -29.734375, -28.3359375, -26.9375, -25.5390625, -24.140625, -22.7421875, -21.34375, -19.9453125, -18.546875, -17.1484375, -15.75, -14.3515625, -12.953125, -11.5546875, -10.15625, -8.7578125, -7.359375, -5.9609375, -4.5625, -3.1640625, -1.765625, -0.3671875, 1.03125, 2.4296875, 3.828125, 5.2265625, 6.625, 8.0234375, 9.421875, 10.8203125, 12.21875, 13.6171875, 15.015625, 16.4140625, 17.8125, 19.2109375, 20.609375, 22.0078125, 23.40625, 24.8046875, 26.203125, 27.6015625, 29.0, 30.3984375, 31.796875, 33.1953125, 34.59375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 4.0, 7.0, 13.0, 8.0, 26.0, 54.0, 120.0, 486.0, 143.0, 54.0, 22.0, 10.0, 10.0, 12.0, 2.0, 2.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.163818359375, -17.45263671875, -16.741455078125, -16.0302734375, -15.319091796875, -14.60791015625, -13.896728515625, -13.185546875, -12.474365234375, -11.76318359375, -11.052001953125, -10.3408203125, -9.629638671875, -8.91845703125, -8.207275390625, -7.49609375, -6.784912109375, -6.07373046875, -5.362548828125, -4.6513671875, -3.940185546875, -3.22900390625, -2.517822265625, -1.806640625, -1.095458984375, -0.38427734375, 0.326904296875, 1.0380859375, 1.749267578125, 2.46044921875, 3.171630859375, 3.8828125, 4.593994140625, 5.30517578125, 6.016357421875, 6.7275390625, 7.438720703125, 8.14990234375, 8.861083984375, 9.572265625, 10.283447265625, 10.99462890625, 11.705810546875, 12.4169921875, 13.128173828125, 13.83935546875, 14.550537109375, 15.26171875, 15.972900390625, 16.68408203125, 17.395263671875, 18.1064453125, 18.817626953125, 19.52880859375, 20.239990234375, 20.951171875, 21.662353515625, 22.37353515625, 23.084716796875, 23.7958984375, 24.507080078125, 25.21826171875, 25.929443359375, 26.640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 34.0, 288.0, 596.0, 74.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.26786804199219, -103.86064147949219, -92.45341491699219, -81.04619598388672, -69.63896942138672, -58.23174285888672, -46.82452392578125, -35.41729736328125, -24.01007080078125, -12.602846145629883, -1.1956214904785156, 10.211601257324219, 21.61882781982422, 33.02605438232422, 44.43327331542969, 55.84049987792969, 67.24772644042969, 78.65495300292969, 90.06217956542969, 101.46939849853516, 112.87662506103516, 124.28385162353516, 135.69107055664062, 147.09829711914062, 158.50552368164062, 169.91275024414062, 181.31997680664062, 192.72720336914062, 204.13442993164062, 215.54165649414062, 226.94886779785156, 238.35609436035156, 249.7633056640625, 261.1705322265625, 272.5777587890625, 283.9849853515625, 295.3922119140625, 306.7994384765625, 318.2066650390625, 329.6138916015625, 341.0211181640625, 352.4283447265625, 363.8355712890625, 375.2427978515625, 386.6500244140625, 398.0572509765625, 409.4644775390625, 420.8717041015625, 432.2789001464844, 443.6861267089844, 455.0933532714844, 466.5005798339844, 477.9078063964844, 489.3150329589844, 500.72222900390625, 512.1294555664062, 523.5366821289062, 534.9439086914062, 546.3511352539062, 557.7583618164062, 569.1655883789062, 580.5728149414062, 591.9800415039062, 603.3872680664062, 614.7944946289062]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 2.0, 8.0, 15.0, 12.0, 18.0, 28.0, 35.0, 40.0, 45.0, 66.0, 50.0, 69.0, 69.0, 57.0, 83.0, 73.0, 52.0, 49.0, 33.0, 43.0, 25.0, 27.0, 23.0, 17.0, 12.0, 10.0, 5.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.27056121826172, -44.96403503417969, -43.657508850097656, -42.35097885131836, -41.04445266723633, -39.7379264831543, -38.431396484375, -37.12487030029297, -35.81834411621094, -34.511817932128906, -33.205291748046875, -31.898761749267578, -30.592235565185547, -29.285709381103516, -27.97918128967285, -26.672653198242188, -25.366127014160156, -24.059600830078125, -22.75307273864746, -21.446544647216797, -20.140018463134766, -18.833492279052734, -17.52696418762207, -16.220436096191406, -14.913909912109375, -13.607382774353027, -12.30085563659668, -10.994328498840332, -9.687801361083984, -8.381274223327637, -7.074747085571289, -5.768219947814941, -4.461692810058594, -3.155165672302246, -1.8486385345458984, -0.5421113967895508, 0.7644157409667969, 2.0709428787231445, 3.377470016479492, 4.68399715423584, 5.9905242919921875, 7.297051429748535, 8.603578567504883, 9.91010570526123, 11.216632843017578, 12.523159980773926, 13.829687118530273, 15.136214256286621, 16.44274139404297, 17.749267578125, 19.055795669555664, 20.362323760986328, 21.66884994506836, 22.97537612915039, 24.281904220581055, 25.58843231201172, 26.89495849609375, 28.20148468017578, 29.508012771606445, 30.81454086303711, 32.12106704711914, 33.42759323120117, 34.73412322998047, 36.0406494140625, 37.34717559814453]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 2.0, 8.0, 0.0, 12.0, 6.0, 0.0, 10.0, 4.0, 13.0, 25.0, 30.0, 12.0, 26.0, 56.0, 243.0, 4181962.0, 11473.0, 198.0, 48.0, 28.0, 24.0, 16.0, 22.0, 12.0, 10.0, 8.0, 6.0, 8.0, 6.0, 0.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-527.5, -504.4609375, -481.421875, -458.3828125, -435.34375, -412.3046875, -389.265625, -366.2265625, -343.1875, -320.1484375, -297.109375, -274.0703125, -251.03125, -227.9921875, -204.953125, -181.9140625, -158.875, -135.8359375, -112.796875, -89.7578125, -66.71875, -43.6796875, -20.640625, 2.3984375, 25.4375, 48.4765625, 71.515625, 94.5546875, 117.59375, 140.6328125, 163.671875, 186.7109375, 209.75, 232.7890625, 255.828125, 278.8671875, 301.90625, 324.9453125, 347.984375, 371.0234375, 394.0625, 417.1015625, 440.140625, 463.1796875, 486.21875, 509.2578125, 532.296875, 555.3359375, 578.375, 601.4140625, 624.453125, 647.4921875, 670.53125, 693.5703125, 716.609375, 739.6484375, 762.6875, 785.7265625, 808.765625, 831.8046875, 854.84375, 877.8828125, 900.921875, 923.9609375, 947.0]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 9.0, 18.0, 26.0, 29.0, 47.0, 66.0, 66.0, 71.0, 102.0, 95.0, 114.0, 88.0, 84.0, 45.0, 41.0, 33.0, 22.0, 11.0, 11.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.442901611328125, -1.40338134765625, -1.363861083984375, -1.3243408203125, -1.284820556640625, -1.24530029296875, -1.205780029296875, -1.166259765625, -1.126739501953125, -1.08721923828125, -1.047698974609375, -1.0081787109375, -0.968658447265625, -0.92913818359375, -0.889617919921875, -0.85009765625, -0.810577392578125, -0.77105712890625, -0.731536865234375, -0.6920166015625, -0.652496337890625, -0.61297607421875, -0.573455810546875, -0.533935546875, -0.494415283203125, -0.45489501953125, -0.415374755859375, -0.3758544921875, -0.336334228515625, -0.29681396484375, -0.257293701171875, -0.2177734375, -0.178253173828125, -0.13873291015625, -0.099212646484375, -0.0596923828125, -0.020172119140625, 0.01934814453125, 0.058868408203125, 0.098388671875, 0.137908935546875, 0.17742919921875, 0.216949462890625, 0.2564697265625, 0.295989990234375, 0.33551025390625, 0.375030517578125, 0.41455078125, 0.454071044921875, 0.49359130859375, 0.533111572265625, 0.5726318359375, 0.612152099609375, 0.65167236328125, 0.691192626953125, 0.730712890625, 0.770233154296875, 0.80975341796875, 0.849273681640625, 0.8887939453125, 0.928314208984375, 0.96783447265625, 1.007354736328125, 1.046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 94.0, 853.0, 4193204.0, 121.0, 13.0, 4.0], "bins": [-2226.0, -2189.087890625, -2152.17578125, -2115.263671875, -2078.3515625, -2041.439453125, -2004.52734375, -1967.615234375, -1930.703125, -1893.791015625, -1856.87890625, -1819.966796875, -1783.0546875, -1746.142578125, -1709.23046875, -1672.318359375, -1635.40625, -1598.494140625, -1561.58203125, -1524.669921875, -1487.7578125, -1450.845703125, -1413.93359375, -1377.021484375, -1340.109375, -1303.197265625, -1266.28515625, -1229.373046875, -1192.4609375, -1155.548828125, -1118.63671875, -1081.724609375, -1044.8125, -1007.900390625, -970.98828125, -934.076171875, -897.1640625, -860.251953125, -823.33984375, -786.427734375, -749.515625, -712.603515625, -675.69140625, -638.779296875, -601.8671875, -564.955078125, -528.04296875, -491.130859375, -454.21875, -417.306640625, -380.39453125, -343.482421875, -306.5703125, -269.658203125, -232.74609375, -195.833984375, -158.921875, -122.009765625, -85.09765625, -48.185546875, -11.2734375, 25.638671875, 62.55078125, 99.462890625, 136.375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 16.0, 28.0, 44.0, 115.0, 406.0, 3032.0, 296.0, 66.0, 33.0, 19.0, 7.0, 8.0, 3.0, 4.0, 1.0], "bins": [-12.84375, -12.608154296875, -12.37255859375, -12.136962890625, -11.9013671875, -11.665771484375, -11.43017578125, -11.194580078125, -10.958984375, -10.723388671875, -10.48779296875, -10.252197265625, -10.0166015625, -9.781005859375, -9.54541015625, -9.309814453125, -9.07421875, -8.838623046875, -8.60302734375, -8.367431640625, -8.1318359375, -7.896240234375, -7.66064453125, -7.425048828125, -7.189453125, -6.953857421875, -6.71826171875, -6.482666015625, -6.2470703125, -6.011474609375, -5.77587890625, -5.540283203125, -5.3046875, -5.069091796875, -4.83349609375, -4.597900390625, -4.3623046875, -4.126708984375, -3.89111328125, -3.655517578125, -3.419921875, -3.184326171875, -2.94873046875, -2.713134765625, -2.4775390625, -2.241943359375, -2.00634765625, -1.770751953125, -1.53515625, -1.299560546875, -1.06396484375, -0.828369140625, -0.5927734375, -0.357177734375, -0.12158203125, 0.114013671875, 0.349609375, 0.585205078125, 0.82080078125, 1.056396484375, 1.2919921875, 1.527587890625, 1.76318359375, 1.998779296875, 2.234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1013.0, 7.0], "bins": [-5447.3291015625, -5360.4169921875, -5273.5048828125, -5186.5927734375, -5099.6806640625, -5012.7685546875, -4925.8564453125, -4838.9443359375, -4752.0322265625, -4665.1201171875, -4578.2080078125, -4491.2958984375, -4404.3837890625, -4317.4716796875, -4230.5595703125, -4143.6474609375, -4056.73486328125, -3969.82275390625, -3882.91064453125, -3795.99853515625, -3709.08642578125, -3622.174072265625, -3535.261962890625, -3448.349853515625, -3361.437744140625, -3274.525634765625, -3187.613525390625, -3100.701416015625, -3013.7890625, -2926.876953125, -2839.96484375, -2753.052734375, -2666.140869140625, -2579.228759765625, -2492.316650390625, -2405.404541015625, -2318.4921875, -2231.580078125, -2144.66796875, -2057.755859375, -1970.8436279296875, -1883.9315185546875, -1797.019287109375, -1710.107177734375, -1623.195068359375, -1536.282958984375, -1449.370849609375, -1362.4586181640625, -1275.5465087890625, -1188.6343994140625, -1101.72216796875, -1014.81005859375, -927.89794921875, -840.98583984375, -754.0736694335938, -667.1614990234375, -580.2493896484375, -493.3372497558594, -406.42510986328125, -319.5129699707031, -232.600830078125, -145.68869018554688, -58.77655029296875, 28.1356201171875, 115.04772186279297]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 11.0, 37.0, 72.0, 151.0, 214.0, 236.0, 153.0, 74.0, 40.0, 15.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-270.3216552734375, -264.8896179199219, -259.45758056640625, -254.02554321289062, -248.59352111816406, -243.16148376464844, -237.7294464111328, -232.2974090576172, -226.86538696289062, -221.433349609375, -216.00131225585938, -210.56927490234375, -205.1372528076172, -199.70521545410156, -194.27317810058594, -188.8411407470703, -183.4091033935547, -177.97706604003906, -172.54502868652344, -167.11300659179688, -161.68096923828125, -156.24893188476562, -150.81689453125, -145.38485717773438, -139.95281982421875, -134.52078247070312, -129.0887451171875, -123.6567153930664, -118.22468566894531, -112.79264831542969, -107.36061096191406, -101.92857360839844, -96.4965591430664, -91.06452178955078, -85.63249206542969, -80.20045471191406, -74.76841735839844, -69.33638763427734, -63.90435028076172, -58.47231674194336, -53.040283203125, -47.60824966430664, -42.17621612548828, -36.744178771972656, -31.312145233154297, -25.880111694335938, -20.448074340820312, -15.016040802001953, -9.584007263183594, -4.151972770690918, 1.2800617218017578, 6.71209716796875, 12.14413070678711, 17.57616424560547, 23.008201599121094, 28.440235137939453, 33.87226867675781, 39.30430221557617, 44.73633575439453, 50.168373107910156, 55.600406646728516, 61.032440185546875, 66.4644775390625, 71.89651489257812, 77.32854461669922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 8.0, 4.0, 9.0, 12.0, 7.0, 8.0, 12.0, 26.0, 23.0, 28.0, 28.0, 31.0, 44.0, 66.0, 72.0, 156.0, 1075.0, 280996.0, 763930.0, 1490.0, 167.0, 68.0, 51.0, 42.0, 31.0, 21.0, 29.0, 24.0, 16.0, 17.0, 11.0, 10.0, 7.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-214.125, -207.4453125, -200.765625, -194.0859375, -187.40625, -180.7265625, -174.046875, -167.3671875, -160.6875, -154.0078125, -147.328125, -140.6484375, -133.96875, -127.2890625, -120.609375, -113.9296875, -107.25, -100.5703125, -93.890625, -87.2109375, -80.53125, -73.8515625, -67.171875, -60.4921875, -53.8125, -47.1328125, -40.453125, -33.7734375, -27.09375, -20.4140625, -13.734375, -7.0546875, -0.375, 6.3046875, 12.984375, 19.6640625, 26.34375, 33.0234375, 39.703125, 46.3828125, 53.0625, 59.7421875, 66.421875, 73.1015625, 79.78125, 86.4609375, 93.140625, 99.8203125, 106.5, 113.1796875, 119.859375, 126.5390625, 133.21875, 139.8984375, 146.578125, 153.2578125, 159.9375, 166.6171875, 173.296875, 179.9765625, 186.65625, 193.3359375, 200.015625, 206.6953125, 213.375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 30.0, 153.0, 335.0, 304.0, 148.0, 35.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.792236328125, -34.14697265625, -33.501708984375, -32.8564453125, -32.211181640625, -31.56591796875, -30.920654296875, -30.275390625, -29.630126953125, -28.98486328125, -28.339599609375, -27.6943359375, -27.049072265625, -26.40380859375, -25.758544921875, -25.11328125, -24.468017578125, -23.82275390625, -23.177490234375, -22.5322265625, -21.886962890625, -21.24169921875, -20.596435546875, -19.951171875, -19.305908203125, -18.66064453125, -18.015380859375, -17.3701171875, -16.724853515625, -16.07958984375, -15.434326171875, -14.7890625, -14.143798828125, -13.49853515625, -12.853271484375, -12.2080078125, -11.562744140625, -10.91748046875, -10.272216796875, -9.626953125, -8.981689453125, -8.33642578125, -7.691162109375, -7.0458984375, -6.400634765625, -5.75537109375, -5.110107421875, -4.46484375, -3.819580078125, -3.17431640625, -2.529052734375, -1.8837890625, -1.238525390625, -0.59326171875, 0.052001953125, 0.697265625, 1.342529296875, 1.98779296875, 2.633056640625, 3.2783203125, 3.923583984375, 4.56884765625, 5.214111328125, 5.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 5.0, 7.0, 13.0, 19.0, 22.0, 17.0, 25.0, 36.0, 47.0, 81.0, 150.0, 354.0, 1151.0, 10549.0, 575117.0, 449389.0, 9652.0, 1152.0, 324.0, 147.0, 73.0, 61.0, 25.0, 22.0, 20.0, 22.0, 14.0, 8.0, 11.0, 3.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.875, -125.232421875, -120.58984375, -115.947265625, -111.3046875, -106.662109375, -102.01953125, -97.376953125, -92.734375, -88.091796875, -83.44921875, -78.806640625, -74.1640625, -69.521484375, -64.87890625, -60.236328125, -55.59375, -50.951171875, -46.30859375, -41.666015625, -37.0234375, -32.380859375, -27.73828125, -23.095703125, -18.453125, -13.810546875, -9.16796875, -4.525390625, 0.1171875, 4.759765625, 9.40234375, 14.044921875, 18.6875, 23.330078125, 27.97265625, 32.615234375, 37.2578125, 41.900390625, 46.54296875, 51.185546875, 55.828125, 60.470703125, 65.11328125, 69.755859375, 74.3984375, 79.041015625, 83.68359375, 88.326171875, 92.96875, 97.611328125, 102.25390625, 106.896484375, 111.5390625, 116.181640625, 120.82421875, 125.466796875, 130.109375, 134.751953125, 139.39453125, 144.037109375, 148.6796875, 153.322265625, 157.96484375, 162.607421875, 167.25]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 10.0, 9.0, 23.0, 20.0, 19.0, 28.0, 29.0, 33.0, 33.0, 43.0, 50.0, 49.0, 54.0, 71.0, 61.0, 80.0, 46.0, 51.0, 39.0, 38.0, 36.0, 26.0, 29.0, 18.0, 11.0, 19.0, 18.0, 5.0, 11.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.46875, -30.302734375, -29.13671875, -27.970703125, -26.8046875, -25.638671875, -24.47265625, -23.306640625, -22.140625, -20.974609375, -19.80859375, -18.642578125, -17.4765625, -16.310546875, -15.14453125, -13.978515625, -12.8125, -11.646484375, -10.48046875, -9.314453125, -8.1484375, -6.982421875, -5.81640625, -4.650390625, -3.484375, -2.318359375, -1.15234375, 0.013671875, 1.1796875, 2.345703125, 3.51171875, 4.677734375, 5.84375, 7.009765625, 8.17578125, 9.341796875, 10.5078125, 11.673828125, 12.83984375, 14.005859375, 15.171875, 16.337890625, 17.50390625, 18.669921875, 19.8359375, 21.001953125, 22.16796875, 23.333984375, 24.5, 25.666015625, 26.83203125, 27.998046875, 29.1640625, 30.330078125, 31.49609375, 32.662109375, 33.828125, 34.994140625, 36.16015625, 37.326171875, 38.4921875, 39.658203125, 40.82421875, 41.990234375, 43.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 11.0, 8.0, 22.0, 35.0, 70.0, 142.0, 309.0, 1058.0, 5573.0, 1002753.0, 35118.0, 2471.0, 569.0, 209.0, 95.0, 51.0, 21.0, 7.0, 13.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.75, -200.12109375, -190.4921875, -180.86328125, -171.234375, -161.60546875, -151.9765625, -142.34765625, -132.71875, -123.08984375, -113.4609375, -103.83203125, -94.203125, -84.57421875, -74.9453125, -65.31640625, -55.6875, -46.05859375, -36.4296875, -26.80078125, -17.171875, -7.54296875, 2.0859375, 11.71484375, 21.34375, 30.97265625, 40.6015625, 50.23046875, 59.859375, 69.48828125, 79.1171875, 88.74609375, 98.375, 108.00390625, 117.6328125, 127.26171875, 136.890625, 146.51953125, 156.1484375, 165.77734375, 175.40625, 185.03515625, 194.6640625, 204.29296875, 213.921875, 223.55078125, 233.1796875, 242.80859375, 252.4375, 262.06640625, 271.6953125, 281.32421875, 290.953125, 300.58203125, 310.2109375, 319.83984375, 329.46875, 339.09765625, 348.7265625, 358.35546875, 367.984375, 377.61328125, 387.2421875, 396.87109375, 406.5]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 9.0, 5.0, 19.0, 19.0, 19.0, 33.0, 37.0, 64.0, 73.0, 103.0, 126.0, 137.0, 90.0, 71.0, 52.0, 41.0, 28.0, 19.0, 15.0, 12.0, 9.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00238800048828125, -0.0022989511489868164, -0.002209901809692383, -0.0021208524703979492, -0.0020318031311035156, -0.001942753791809082, -0.0018537044525146484, -0.0017646551132202148, -0.0016756057739257812, -0.0015865564346313477, -0.001497507095336914, -0.0014084577560424805, -0.0013194084167480469, -0.0012303590774536133, -0.0011413097381591797, -0.001052260398864746, -0.0009632110595703125, -0.0008741617202758789, -0.0007851123809814453, -0.0006960630416870117, -0.0006070137023925781, -0.0005179643630981445, -0.00042891502380371094, -0.00033986568450927734, -0.00025081634521484375, -0.00016176700592041016, -7.271766662597656e-05, 1.633167266845703e-05, 0.00010538101196289062, 0.00019443035125732422, 0.0002834796905517578, 0.0003725290298461914, 0.000461578369140625, 0.0005506277084350586, 0.0006396770477294922, 0.0007287263870239258, 0.0008177757263183594, 0.000906825065612793, 0.0009958744049072266, 0.0010849237442016602, 0.0011739730834960938, 0.0012630224227905273, 0.001352071762084961, 0.0014411211013793945, 0.0015301704406738281, 0.0016192197799682617, 0.0017082691192626953, 0.001797318458557129, 0.0018863677978515625, 0.001975417137145996, 0.0020644664764404297, 0.0021535158157348633, 0.002242565155029297, 0.0023316144943237305, 0.002420663833618164, 0.0025097131729125977, 0.0025987625122070312, 0.002687811851501465, 0.0027768611907958984, 0.002865910530090332, 0.0029549598693847656, 0.0030440092086791992, 0.003133058547973633, 0.0032221078872680664, 0.0033111572265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 18.0, 14.0, 35.0, 82.0, 481.0, 4000.0, 1030560.0, 12066.0, 1026.0, 149.0, 43.0, 25.0, 20.0, 4.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-456.5, -443.33984375, -430.1796875, -417.01953125, -403.859375, -390.69921875, -377.5390625, -364.37890625, -351.21875, -338.05859375, -324.8984375, -311.73828125, -298.578125, -285.41796875, -272.2578125, -259.09765625, -245.9375, -232.77734375, -219.6171875, -206.45703125, -193.296875, -180.13671875, -166.9765625, -153.81640625, -140.65625, -127.49609375, -114.3359375, -101.17578125, -88.015625, -74.85546875, -61.6953125, -48.53515625, -35.375, -22.21484375, -9.0546875, 4.10546875, 17.265625, 30.42578125, 43.5859375, 56.74609375, 69.90625, 83.06640625, 96.2265625, 109.38671875, 122.546875, 135.70703125, 148.8671875, 162.02734375, 175.1875, 188.34765625, 201.5078125, 214.66796875, 227.828125, 240.98828125, 254.1484375, 267.30859375, 280.46875, 293.62890625, 306.7890625, 319.94921875, 333.109375, 346.26953125, 359.4296875, 372.58984375, 385.75]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 8.0, 15.0, 42.0, 147.0, 544.0, 149.0, 35.0, 13.0, 11.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-100.8125, -97.888671875, -94.96484375, -92.041015625, -89.1171875, -86.193359375, -83.26953125, -80.345703125, -77.421875, -74.498046875, -71.57421875, -68.650390625, -65.7265625, -62.802734375, -59.87890625, -56.955078125, -54.03125, -51.107421875, -48.18359375, -45.259765625, -42.3359375, -39.412109375, -36.48828125, -33.564453125, -30.640625, -27.716796875, -24.79296875, -21.869140625, -18.9453125, -16.021484375, -13.09765625, -10.173828125, -7.25, -4.326171875, -1.40234375, 1.521484375, 4.4453125, 7.369140625, 10.29296875, 13.216796875, 16.140625, 19.064453125, 21.98828125, 24.912109375, 27.8359375, 30.759765625, 33.68359375, 36.607421875, 39.53125, 42.455078125, 45.37890625, 48.302734375, 51.2265625, 54.150390625, 57.07421875, 59.998046875, 62.921875, 65.845703125, 68.76953125, 71.693359375, 74.6171875, 77.541015625, 80.46484375, 83.388671875, 86.3125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 11.0, 311.0, 610.0, 50.0, 15.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-386.14691162109375, -331.39495849609375, -276.64300537109375, -221.89105224609375, -167.13909912109375, -112.38714599609375, -57.63519287109375, -2.88323974609375, 51.86871337890625, 106.62066650390625, 161.37261962890625, 216.12457275390625, 270.87652587890625, 325.62847900390625, 380.38043212890625, 435.13238525390625, 489.88433837890625, 544.6362915039062, 599.3882446289062, 654.1401977539062, 708.8921508789062, 763.6441040039062, 818.3960571289062, 873.1480102539062, 927.8999633789062, 982.6519165039062, 1037.40380859375, 1092.15576171875, 1146.90771484375, 1201.65966796875, 1256.41162109375, 1311.16357421875, 1365.91552734375, 1420.66748046875, 1475.41943359375, 1530.17138671875, 1584.92333984375, 1639.67529296875, 1694.42724609375, 1749.17919921875, 1803.93115234375, 1858.68310546875, 1913.43505859375, 1968.18701171875, 2022.93896484375, 2077.69091796875, 2132.44287109375, 2187.19482421875, 2241.94677734375, 2296.69873046875, 2351.45068359375, 2406.20263671875, 2460.95458984375, 2515.70654296875, 2570.45849609375, 2625.21044921875, 2679.96240234375, 2734.71435546875, 2789.46630859375, 2844.21826171875, 2898.97021484375, 2953.72216796875, 3008.47412109375, 3063.22607421875, 3117.97802734375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 14.0, 31.0, 31.0, 44.0, 60.0, 98.0, 92.0, 97.0, 100.0, 88.0, 94.0, 73.0, 58.0, 47.0, 34.0, 14.0, 12.0, 10.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-522.893798828125, -507.7615661621094, -492.6293640136719, -477.49713134765625, -462.36492919921875, -447.2326965332031, -432.1004638671875, -416.96826171875, -401.8360595703125, -386.7038269042969, -371.5716247558594, -356.43939208984375, -341.30718994140625, -326.1749572753906, -311.042724609375, -295.9105224609375, -280.7782897949219, -265.64605712890625, -250.51385498046875, -235.38162231445312, -220.24942016601562, -205.1171875, -189.98497009277344, -174.85275268554688, -159.7205352783203, -144.58831787109375, -129.4561004638672, -114.3238754272461, -99.19165802001953, -84.05944061279297, -68.92721557617188, -53.79499816894531, -38.662811279296875, -23.53059196472168, -8.398372650146484, 6.733848571777344, 21.866065979003906, 36.99828338623047, 52.13050842285156, 67.26272583007812, 82.39494323730469, 97.52716064453125, 112.65937805175781, 127.7916030883789, 142.923828125, 158.0560302734375, 173.18826293945312, 188.3204803466797, 203.45269775390625, 218.5849151611328, 233.71713256835938, 248.849365234375, 263.9815673828125, 279.1138000488281, 294.24603271484375, 309.37823486328125, 324.51043701171875, 339.6426696777344, 354.7748718261719, 369.9071044921875, 385.039306640625, 400.1715393066406, 415.30377197265625, 430.43597412109375, 445.5682067871094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 11.0, 40.0, 108.0, 527.0, 4815.0, 4187837.0, 713.0, 184.0, 35.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-1503.0, -1475.30078125, -1447.6015625, -1419.90234375, -1392.203125, -1364.50390625, -1336.8046875, -1309.10546875, -1281.40625, -1253.70703125, -1226.0078125, -1198.30859375, -1170.609375, -1142.91015625, -1115.2109375, -1087.51171875, -1059.8125, -1032.11328125, -1004.4140625, -976.71484375, -949.015625, -921.31640625, -893.6171875, -865.91796875, -838.21875, -810.51953125, -782.8203125, -755.12109375, -727.421875, -699.72265625, -672.0234375, -644.32421875, -616.625, -588.92578125, -561.2265625, -533.52734375, -505.828125, -478.12890625, -450.4296875, -422.73046875, -395.03125, -367.33203125, -339.6328125, -311.93359375, -284.234375, -256.53515625, -228.8359375, -201.13671875, -173.4375, -145.73828125, -118.0390625, -90.33984375, -62.640625, -34.94140625, -7.2421875, 20.45703125, 48.15625, 75.85546875, 103.5546875, 131.25390625, 158.953125, 186.65234375, 214.3515625, 242.05078125, 269.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 13.0, 24.0, 119.0, 235.0, 253.0, 208.0, 109.0, 38.0, 14.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.5, -36.79803466796875, -36.0960693359375, -35.39410400390625, -34.692138671875, -33.99017333984375, -33.2882080078125, -32.58624267578125, -31.88427734375, -31.18231201171875, -30.4803466796875, -29.77838134765625, -29.076416015625, -28.37445068359375, -27.6724853515625, -26.97052001953125, -26.2685546875, -25.56658935546875, -24.8646240234375, -24.16265869140625, -23.460693359375, -22.75872802734375, -22.0567626953125, -21.35479736328125, -20.65283203125, -19.95086669921875, -19.2489013671875, -18.54693603515625, -17.844970703125, -17.14300537109375, -16.4410400390625, -15.73907470703125, -15.037109375, -14.33514404296875, -13.6331787109375, -12.93121337890625, -12.229248046875, -11.52728271484375, -10.8253173828125, -10.12335205078125, -9.42138671875, -8.71942138671875, -8.0174560546875, -7.31549072265625, -6.613525390625, -5.91156005859375, -5.2095947265625, -4.50762939453125, -3.8056640625, -3.10369873046875, -2.4017333984375, -1.69976806640625, -0.997802734375, -0.29583740234375, 0.4061279296875, 1.10809326171875, 1.81005859375, 2.51202392578125, 3.2139892578125, 3.91595458984375, 4.617919921875, 5.31988525390625, 6.0218505859375, 6.72381591796875, 7.42578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 17.0, 91.0, 218.0, 380.0, 1836.0, 4191208.0, 284.0, 162.0, 68.0, 14.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3990.0, -3910.484375, -3830.96875, -3751.453125, -3671.9375, -3592.421875, -3512.90625, -3433.390625, -3353.875, -3274.359375, -3194.84375, -3115.328125, -3035.8125, -2956.296875, -2876.78125, -2797.265625, -2717.75, -2638.234375, -2558.71875, -2479.203125, -2399.6875, -2320.171875, -2240.65625, -2161.140625, -2081.625, -2002.109375, -1922.59375, -1843.078125, -1763.5625, -1684.046875, -1604.53125, -1525.015625, -1445.5, -1365.984375, -1286.46875, -1206.953125, -1127.4375, -1047.921875, -968.40625, -888.890625, -809.375, -729.859375, -650.34375, -570.828125, -491.3125, -411.796875, -332.28125, -252.765625, -173.25, -93.734375, -14.21875, 65.296875, 144.8125, 224.328125, 303.84375, 383.359375, 462.875, 542.390625, 621.90625, 701.421875, 780.9375, 860.453125, 939.96875, 1019.484375, 1099.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 20.0, 146.0, 3836.0, 74.0, 9.0, 3.0, 2.0], "bins": [-268.5, -263.98583984375, -259.4716796875, -254.95751953125, -250.443359375, -245.92919921875, -241.4150390625, -236.90087890625, -232.38671875, -227.87255859375, -223.3583984375, -218.84423828125, -214.330078125, -209.81591796875, -205.3017578125, -200.78759765625, -196.2734375, -191.75927734375, -187.2451171875, -182.73095703125, -178.216796875, -173.70263671875, -169.1884765625, -164.67431640625, -160.16015625, -155.64599609375, -151.1318359375, -146.61767578125, -142.103515625, -137.58935546875, -133.0751953125, -128.56103515625, -124.046875, -119.53271484375, -115.0185546875, -110.50439453125, -105.990234375, -101.47607421875, -96.9619140625, -92.44775390625, -87.93359375, -83.41943359375, -78.9052734375, -74.39111328125, -69.876953125, -65.36279296875, -60.8486328125, -56.33447265625, -51.8203125, -47.30615234375, -42.7919921875, -38.27783203125, -33.763671875, -29.24951171875, -24.7353515625, -20.22119140625, -15.70703125, -11.19287109375, -6.6787109375, -2.16455078125, 2.349609375, 6.86376953125, 11.3779296875, 15.89208984375, 20.40625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 92.0, 863.0, 44.0, 4.0, 3.0], "bins": [-4584.515625, -4508.68115234375, -4432.84716796875, -4357.0126953125, -4281.1787109375, -4205.34423828125, -4129.509765625, -4053.67578125, -3977.841552734375, -3902.00732421875, -3826.173095703125, -3750.3388671875, -3674.50439453125, -3598.670166015625, -3522.8359375, -3447.001708984375, -3371.16748046875, -3295.333251953125, -3219.4990234375, -3143.66455078125, -3067.830322265625, -2991.99609375, -2916.161865234375, -2840.32763671875, -2764.4931640625, -2688.658935546875, -2612.82470703125, -2536.990234375, -2461.156005859375, -2385.32177734375, -2309.487548828125, -2233.6533203125, -2157.81884765625, -2081.984619140625, -2006.1502685546875, -1930.3160400390625, -1854.4818115234375, -1778.6474609375, -1702.813232421875, -1626.97900390625, -1551.144775390625, -1475.310546875, -1399.4761962890625, -1323.6419677734375, -1247.8077392578125, -1171.973388671875, -1096.13916015625, -1020.304931640625, -944.4706420898438, -868.6363525390625, -792.8021240234375, -716.9678344726562, -641.133544921875, -565.29931640625, -489.46502685546875, -413.63079833984375, -337.7965087890625, -261.9622497558594, -186.1279754638672, -110.293701171875, -34.459442138671875, 41.37481689453125, 117.2091064453125, 193.0433349609375, 268.87762451171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 16.0, 31.0, 57.0, 96.0, 153.0, 176.0, 164.0, 121.0, 85.0, 53.0, 26.0, 12.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-705.514892578125, -679.2584838867188, -653.0021362304688, -626.7457275390625, -600.4893188476562, -574.2329711914062, -547.9765625, -521.72021484375, -495.46380615234375, -469.2074279785156, -442.9510192871094, -416.69464111328125, -390.4382629394531, -364.181884765625, -337.92547607421875, -311.6690979003906, -285.4126892089844, -259.15631103515625, -232.89991760253906, -206.64352416992188, -180.38714599609375, -154.13075256347656, -127.87435913085938, -101.61798095703125, -75.36158752441406, -49.105201721191406, -22.848812103271484, 3.4075775146484375, 29.663963317871094, 55.92034912109375, 82.17674255371094, 108.43312072753906, 134.68951416015625, 160.94590759277344, 187.20228576660156, 213.45867919921875, 239.71505737304688, 265.971435546875, 292.22784423828125, 318.4842224121094, 344.7406005859375, 370.9969787597656, 397.2533874511719, 423.509765625, 449.7661437988281, 476.02252197265625, 502.2789306640625, 528.5352783203125, 554.791748046875, 581.0481567382812, 607.3045043945312, 633.5609130859375, 659.8173217773438, 686.0736694335938, 712.330078125, 738.58642578125, 764.8428344726562, 791.0992431640625, 817.3555908203125, 843.6119995117188, 869.868408203125, 896.124755859375, 922.3811645507812, 948.6375732421875, 974.8939208984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 10.0, 12.0, 16.0, 9.0, 22.0, 35.0, 46.0, 67.0, 97.0, 205.0, 457.0, 1229.0, 5117.0, 62071.0, 911937.0, 59836.0, 5098.0, 1314.0, 453.0, 195.0, 107.0, 61.0, 42.0, 41.0, 23.0, 16.0, 12.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-296.0, -286.6015625, -277.203125, -267.8046875, -258.40625, -249.0078125, -239.609375, -230.2109375, -220.8125, -211.4140625, -202.015625, -192.6171875, -183.21875, -173.8203125, -164.421875, -155.0234375, -145.625, -136.2265625, -126.828125, -117.4296875, -108.03125, -98.6328125, -89.234375, -79.8359375, -70.4375, -61.0390625, -51.640625, -42.2421875, -32.84375, -23.4453125, -14.046875, -4.6484375, 4.75, 14.1484375, 23.546875, 32.9453125, 42.34375, 51.7421875, 61.140625, 70.5390625, 79.9375, 89.3359375, 98.734375, 108.1328125, 117.53125, 126.9296875, 136.328125, 145.7265625, 155.125, 164.5234375, 173.921875, 183.3203125, 192.71875, 202.1171875, 211.515625, 220.9140625, 230.3125, 239.7109375, 249.109375, 258.5078125, 267.90625, 277.3046875, 286.703125, 296.1015625, 305.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 21.0, 48.0, 67.0, 100.0, 132.0, 171.0, 150.0, 114.0, 85.0, 55.0, 29.0, 13.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -50.194091796875, -49.04443359375, -47.894775390625, -46.7451171875, -45.595458984375, -44.44580078125, -43.296142578125, -42.146484375, -40.996826171875, -39.84716796875, -38.697509765625, -37.5478515625, -36.398193359375, -35.24853515625, -34.098876953125, -32.94921875, -31.799560546875, -30.64990234375, -29.500244140625, -28.3505859375, -27.200927734375, -26.05126953125, -24.901611328125, -23.751953125, -22.602294921875, -21.45263671875, -20.302978515625, -19.1533203125, -18.003662109375, -16.85400390625, -15.704345703125, -14.5546875, -13.405029296875, -12.25537109375, -11.105712890625, -9.9560546875, -8.806396484375, -7.65673828125, -6.507080078125, -5.357421875, -4.207763671875, -3.05810546875, -1.908447265625, -0.7587890625, 0.390869140625, 1.54052734375, 2.690185546875, 3.83984375, 4.989501953125, 6.13916015625, 7.288818359375, 8.4384765625, 9.588134765625, 10.73779296875, 11.887451171875, 13.037109375, 14.186767578125, 15.33642578125, 16.486083984375, 17.6357421875, 18.785400390625, 19.93505859375, 21.084716796875, 22.234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 12.0, 10.0, 19.0, 22.0, 29.0, 40.0, 82.0, 154.0, 314.0, 996.0, 5738.0, 220476.0, 807275.0, 11144.0, 1349.0, 415.0, 183.0, 85.0, 52.0, 44.0, 25.0, 18.0, 10.0, 10.0, 6.0, 2.0, 6.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.5, -296.072265625, -287.64453125, -279.216796875, -270.7890625, -262.361328125, -253.93359375, -245.505859375, -237.078125, -228.650390625, -220.22265625, -211.794921875, -203.3671875, -194.939453125, -186.51171875, -178.083984375, -169.65625, -161.228515625, -152.80078125, -144.373046875, -135.9453125, -127.517578125, -119.08984375, -110.662109375, -102.234375, -93.806640625, -85.37890625, -76.951171875, -68.5234375, -60.095703125, -51.66796875, -43.240234375, -34.8125, -26.384765625, -17.95703125, -9.529296875, -1.1015625, 7.326171875, 15.75390625, 24.181640625, 32.609375, 41.037109375, 49.46484375, 57.892578125, 66.3203125, 74.748046875, 83.17578125, 91.603515625, 100.03125, 108.458984375, 116.88671875, 125.314453125, 133.7421875, 142.169921875, 150.59765625, 159.025390625, 167.453125, 175.880859375, 184.30859375, 192.736328125, 201.1640625, 209.591796875, 218.01953125, 226.447265625, 234.875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 7.0, 9.0, 13.0, 18.0, 26.0, 25.0, 37.0, 36.0, 49.0, 64.0, 65.0, 67.0, 86.0, 67.0, 66.0, 64.0, 46.0, 38.0, 38.0, 38.0, 35.0, 20.0, 14.0, 11.0, 10.0, 6.0, 5.0, 4.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-90.625, -88.171875, -85.71875, -83.265625, -80.8125, -78.359375, -75.90625, -73.453125, -71.0, -68.546875, -66.09375, -63.640625, -61.1875, -58.734375, -56.28125, -53.828125, -51.375, -48.921875, -46.46875, -44.015625, -41.5625, -39.109375, -36.65625, -34.203125, -31.75, -29.296875, -26.84375, -24.390625, -21.9375, -19.484375, -17.03125, -14.578125, -12.125, -9.671875, -7.21875, -4.765625, -2.3125, 0.140625, 2.59375, 5.046875, 7.5, 9.953125, 12.40625, 14.859375, 17.3125, 19.765625, 22.21875, 24.671875, 27.125, 29.578125, 32.03125, 34.484375, 36.9375, 39.390625, 41.84375, 44.296875, 46.75, 49.203125, 51.65625, 54.109375, 56.5625, 59.015625, 61.46875, 63.921875, 66.375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 14.0, 18.0, 28.0, 49.0, 73.0, 125.0, 268.0, 640.0, 2181.0, 14580.0, 808907.0, 211367.0, 7702.0, 1522.0, 525.0, 225.0, 102.0, 72.0, 36.0, 25.0, 18.0, 15.0, 11.0, 7.0, 11.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-156.0, -151.9853515625, -147.970703125, -143.9560546875, -139.94140625, -135.9267578125, -131.912109375, -127.8974609375, -123.8828125, -119.8681640625, -115.853515625, -111.8388671875, -107.82421875, -103.8095703125, -99.794921875, -95.7802734375, -91.765625, -87.7509765625, -83.736328125, -79.7216796875, -75.70703125, -71.6923828125, -67.677734375, -63.6630859375, -59.6484375, -55.6337890625, -51.619140625, -47.6044921875, -43.58984375, -39.5751953125, -35.560546875, -31.5458984375, -27.53125, -23.5166015625, -19.501953125, -15.4873046875, -11.47265625, -7.4580078125, -3.443359375, 0.5712890625, 4.5859375, 8.6005859375, 12.615234375, 16.6298828125, 20.64453125, 24.6591796875, 28.673828125, 32.6884765625, 36.703125, 40.7177734375, 44.732421875, 48.7470703125, 52.76171875, 56.7763671875, 60.791015625, 64.8056640625, 68.8203125, 72.8349609375, 76.849609375, 80.8642578125, 84.87890625, 88.8935546875, 92.908203125, 96.9228515625, 100.9375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 6.0, 7.0, 4.0, 7.0, 20.0, 14.0, 17.0, 27.0, 58.0, 61.0, 90.0, 111.0, 124.0, 119.0, 91.0, 62.0, 47.0, 42.0, 20.0, 25.0, 14.0, 11.0, 8.0, 4.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038967132568359375, -0.003754168748855591, -0.003611624240875244, -0.0034690797328948975, -0.0033265352249145508, -0.003183990716934204, -0.0030414462089538574, -0.0028989017009735107, -0.002756357192993164, -0.0026138126850128174, -0.0024712681770324707, -0.002328723669052124, -0.0021861791610717773, -0.0020436346530914307, -0.001901090145111084, -0.0017585456371307373, -0.0016160011291503906, -0.001473456621170044, -0.0013309121131896973, -0.0011883676052093506, -0.001045823097229004, -0.0009032785892486572, -0.0007607340812683105, -0.0006181895732879639, -0.0004756450653076172, -0.0003331005573272705, -0.00019055604934692383, -4.801154136657715e-05, 9.453296661376953e-05, 0.0002370774745941162, 0.0003796219825744629, 0.0005221664905548096, 0.0006647109985351562, 0.0008072555065155029, 0.0009498000144958496, 0.0010923445224761963, 0.001234889030456543, 0.0013774335384368896, 0.0015199780464172363, 0.001662522554397583, 0.0018050670623779297, 0.0019476115703582764, 0.002090156078338623, 0.0022327005863189697, 0.0023752450942993164, 0.002517789602279663, 0.0026603341102600098, 0.0028028786182403564, 0.002945423126220703, 0.00308796763420105, 0.0032305121421813965, 0.003373056650161743, 0.00351560115814209, 0.0036581456661224365, 0.003800690174102783, 0.00394323468208313, 0.0040857791900634766, 0.004228323698043823, 0.00437086820602417, 0.004513412714004517, 0.004655957221984863, 0.00479850172996521, 0.004941046237945557, 0.005083590745925903, 0.00522613525390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 10.0, 10.0, 18.0, 32.0, 55.0, 80.0, 181.0, 437.0, 1897.0, 20198.0, 955979.0, 65342.0, 3193.0, 618.0, 207.0, 114.0, 42.0, 38.0, 26.0, 19.0, 12.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.0, -120.2021484375, -116.404296875, -112.6064453125, -108.80859375, -105.0107421875, -101.212890625, -97.4150390625, -93.6171875, -89.8193359375, -86.021484375, -82.2236328125, -78.42578125, -74.6279296875, -70.830078125, -67.0322265625, -63.234375, -59.4365234375, -55.638671875, -51.8408203125, -48.04296875, -44.2451171875, -40.447265625, -36.6494140625, -32.8515625, -29.0537109375, -25.255859375, -21.4580078125, -17.66015625, -13.8623046875, -10.064453125, -6.2666015625, -2.46875, 1.3291015625, 5.126953125, 8.9248046875, 12.72265625, 16.5205078125, 20.318359375, 24.1162109375, 27.9140625, 31.7119140625, 35.509765625, 39.3076171875, 43.10546875, 46.9033203125, 50.701171875, 54.4990234375, 58.296875, 62.0947265625, 65.892578125, 69.6904296875, 73.48828125, 77.2861328125, 81.083984375, 84.8818359375, 88.6796875, 92.4775390625, 96.275390625, 100.0732421875, 103.87109375, 107.6689453125, 111.466796875, 115.2646484375, 119.0625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 3.0, 5.0, 11.0, 15.0, 17.0, 29.0, 27.0, 65.0, 88.0, 104.0, 113.0, 151.0, 118.0, 69.0, 51.0, 34.0, 17.0, 18.0, 15.0, 11.0, 7.0, 8.0, 6.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.66748046875, -35.5537109375, -34.43994140625, -33.326171875, -32.21240234375, -31.0986328125, -29.98486328125, -28.87109375, -27.75732421875, -26.6435546875, -25.52978515625, -24.416015625, -23.30224609375, -22.1884765625, -21.07470703125, -19.9609375, -18.84716796875, -17.7333984375, -16.61962890625, -15.505859375, -14.39208984375, -13.2783203125, -12.16455078125, -11.05078125, -9.93701171875, -8.8232421875, -7.70947265625, -6.595703125, -5.48193359375, -4.3681640625, -3.25439453125, -2.140625, -1.02685546875, 0.0869140625, 1.20068359375, 2.314453125, 3.42822265625, 4.5419921875, 5.65576171875, 6.76953125, 7.88330078125, 8.9970703125, 10.11083984375, 11.224609375, 12.33837890625, 13.4521484375, 14.56591796875, 15.6796875, 16.79345703125, 17.9072265625, 19.02099609375, 20.134765625, 21.24853515625, 22.3623046875, 23.47607421875, 24.58984375, 25.70361328125, 26.8173828125, 27.93115234375, 29.044921875, 30.15869140625, 31.2724609375, 32.38623046875, 33.5]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 10.0, 42.0, 511.0, 386.0, 39.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.887451171875, -297.334716796875, -234.781982421875, -172.22923278808594, -109.67649841308594, -47.123748779296875, 15.428985595703125, 77.98171997070312, 140.53445434570312, 203.08718872070312, 265.6399230957031, 328.19268798828125, 390.74542236328125, 453.29815673828125, 515.8508911132812, 578.4036254882812, 640.9563598632812, 703.5090942382812, 766.0618286132812, 828.6145629882812, 891.1672973632812, 953.7200927734375, 1016.2728271484375, 1078.8255615234375, 1141.3782958984375, 1203.9310302734375, 1266.4837646484375, 1329.0364990234375, 1391.5892333984375, 1454.1419677734375, 1516.6947021484375, 1579.2474365234375, 1641.8001708984375, 1704.3529052734375, 1766.9056396484375, 1829.4583740234375, 1892.0111083984375, 1954.5638427734375, 2017.1165771484375, 2079.66943359375, 2142.22216796875, 2204.77490234375, 2267.32763671875, 2329.88037109375, 2392.43310546875, 2454.98583984375, 2517.53857421875, 2580.09130859375, 2642.64404296875, 2705.19677734375, 2767.74951171875, 2830.30224609375, 2892.85498046875, 2955.40771484375, 3017.96044921875, 3080.51318359375, 3143.06591796875, 3205.61865234375, 3268.17138671875, 3330.72412109375, 3393.27685546875, 3455.82958984375, 3518.38232421875, 3580.93505859375, 3643.48779296875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 7.0, 7.0, 10.0, 14.0, 18.0, 25.0, 33.0, 49.0, 60.0, 72.0, 65.0, 71.0, 68.0, 63.0, 68.0, 70.0, 63.0, 48.0, 45.0, 35.0, 33.0, 29.0, 9.0, 14.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-674.919921875, -657.9329833984375, -640.946044921875, -623.9590454101562, -606.9721069335938, -589.9851684570312, -572.9981689453125, -556.01123046875, -539.0242919921875, -522.037353515625, -505.0503845214844, -488.06341552734375, -471.07647705078125, -454.08953857421875, -437.1025695800781, -420.1156005859375, -403.128662109375, -386.1417236328125, -369.1547546386719, -352.16778564453125, -335.18084716796875, -318.19390869140625, -301.2069396972656, -284.219970703125, -267.2330322265625, -250.24607849121094, -233.25912475585938, -216.2721710205078, -199.28521728515625, -182.2982635498047, -165.31130981445312, -148.32435607910156, -131.33746337890625, -114.35050964355469, -97.36355590820312, -80.37660217285156, -63.3896484375, -46.40269470214844, -29.415740966796875, -12.428787231445312, 4.55816650390625, 21.545120239257812, 38.532073974609375, 55.51902770996094, 72.5059814453125, 89.49293518066406, 106.47988891601562, 123.46684265136719, 140.45379638671875, 157.4407501220703, 174.42770385742188, 191.41465759277344, 208.401611328125, 225.38856506347656, 242.37551879882812, 259.36248779296875, 276.34942626953125, 293.33636474609375, 310.3233337402344, 327.310302734375, 344.2972412109375, 361.2841796875, 378.2711486816406, 395.25811767578125, 412.24505615234375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 27.0, 51.0, 98.0, 226.0, 620.0, 6402.0, 4177150.0, 9194.0, 302.0, 104.0, 55.0, 20.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1128.0, -1106.537109375, -1085.07421875, -1063.611328125, -1042.1484375, -1020.685546875, -999.22265625, -977.759765625, -956.296875, -934.833984375, -913.37109375, -891.908203125, -870.4453125, -848.982421875, -827.51953125, -806.056640625, -784.59375, -763.130859375, -741.66796875, -720.205078125, -698.7421875, -677.279296875, -655.81640625, -634.353515625, -612.890625, -591.427734375, -569.96484375, -548.501953125, -527.0390625, -505.576171875, -484.11328125, -462.650390625, -441.1875, -419.724609375, -398.26171875, -376.798828125, -355.3359375, -333.873046875, -312.41015625, -290.947265625, -269.484375, -248.021484375, -226.55859375, -205.095703125, -183.6328125, -162.169921875, -140.70703125, -119.244140625, -97.78125, -76.318359375, -54.85546875, -33.392578125, -11.9296875, 9.533203125, 30.99609375, 52.458984375, 73.921875, 95.384765625, 116.84765625, 138.310546875, 159.7734375, 181.236328125, 202.69921875, 224.162109375, 245.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 11.0, 21.0, 24.0, 67.0, 85.0, 101.0, 127.0, 146.0, 158.0, 87.0, 72.0, 58.0, 22.0, 10.0, 12.0, 1.0, 5.0, 2.0, 3.0], "bins": [-52.875, -51.8634033203125, -50.851806640625, -49.8402099609375, -48.82861328125, -47.8170166015625, -46.805419921875, -45.7938232421875, -44.7822265625, -43.7706298828125, -42.759033203125, -41.7474365234375, -40.73583984375, -39.7242431640625, -38.712646484375, -37.7010498046875, -36.689453125, -35.6778564453125, -34.666259765625, -33.6546630859375, -32.64306640625, -31.6314697265625, -30.619873046875, -29.6082763671875, -28.5966796875, -27.5850830078125, -26.573486328125, -25.5618896484375, -24.55029296875, -23.5386962890625, -22.527099609375, -21.5155029296875, -20.50390625, -19.4923095703125, -18.480712890625, -17.4691162109375, -16.45751953125, -15.4459228515625, -14.434326171875, -13.4227294921875, -12.4111328125, -11.3995361328125, -10.387939453125, -9.3763427734375, -8.36474609375, -7.3531494140625, -6.341552734375, -5.3299560546875, -4.318359375, -3.3067626953125, -2.295166015625, -1.2835693359375, -0.27197265625, 0.7396240234375, 1.751220703125, 2.7628173828125, 3.7744140625, 4.7860107421875, 5.797607421875, 6.8092041015625, 7.82080078125, 8.8323974609375, 9.843994140625, 10.8555908203125, 11.8671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 11.0, 33.0, 96.0, 421.0, 4309.0, 4188626.0, 650.0, 102.0, 21.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2888.0, -2831.6875, -2775.375, -2719.0625, -2662.75, -2606.4375, -2550.125, -2493.8125, -2437.5, -2381.1875, -2324.875, -2268.5625, -2212.25, -2155.9375, -2099.625, -2043.3125, -1987.0, -1930.6875, -1874.375, -1818.0625, -1761.75, -1705.4375, -1649.125, -1592.8125, -1536.5, -1480.1875, -1423.875, -1367.5625, -1311.25, -1254.9375, -1198.625, -1142.3125, -1086.0, -1029.6875, -973.375, -917.0625, -860.75, -804.4375, -748.125, -691.8125, -635.5, -579.1875, -522.875, -466.5625, -410.25, -353.9375, -297.625, -241.3125, -185.0, -128.6875, -72.375, -16.0625, 40.25, 96.5625, 152.875, 209.1875, 265.5, 321.8125, 378.125, 434.4375, 490.75, 547.0625, 603.375, 659.6875, 716.0]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 17.0, 57.0, 204.0, 3387.0, 343.0, 51.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.5, -181.91162109375, -178.3232421875, -174.73486328125, -171.146484375, -167.55810546875, -163.9697265625, -160.38134765625, -156.79296875, -153.20458984375, -149.6162109375, -146.02783203125, -142.439453125, -138.85107421875, -135.2626953125, -131.67431640625, -128.0859375, -124.49755859375, -120.9091796875, -117.32080078125, -113.732421875, -110.14404296875, -106.5556640625, -102.96728515625, -99.37890625, -95.79052734375, -92.2021484375, -88.61376953125, -85.025390625, -81.43701171875, -77.8486328125, -74.26025390625, -70.671875, -67.08349609375, -63.4951171875, -59.90673828125, -56.318359375, -52.72998046875, -49.1416015625, -45.55322265625, -41.96484375, -38.37646484375, -34.7880859375, -31.19970703125, -27.611328125, -24.02294921875, -20.4345703125, -16.84619140625, -13.2578125, -9.66943359375, -6.0810546875, -2.49267578125, 1.095703125, 4.68408203125, 8.2724609375, 11.86083984375, 15.44921875, 19.03759765625, 22.6259765625, 26.21435546875, 29.802734375, 33.39111328125, 36.9794921875, 40.56787109375, 44.15625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 20.0, 261.0, 690.0, 25.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1611.473388671875, -1559.8580322265625, -1508.2427978515625, -1456.62744140625, -1405.0120849609375, -1353.396728515625, -1301.781494140625, -1250.1661376953125, -1198.55078125, -1146.9354248046875, -1095.3201904296875, -1043.704833984375, -992.0894775390625, -940.4741821289062, -888.85888671875, -837.2435302734375, -785.6282958984375, -734.0130004882812, -682.3976440429688, -630.7823486328125, -579.1669921875, -527.5516967773438, -475.9364013671875, -424.3210754394531, -372.70574951171875, -321.0904235839844, -269.47509765625, -217.85980224609375, -166.24447631835938, -114.629150390625, -63.01385498046875, -11.398529052734375, 40.2166748046875, 91.83199310302734, 143.4473114013672, 195.0626220703125, 246.67794799804688, 298.29327392578125, 349.9085693359375, 401.5238952636719, 453.13922119140625, 504.7545471191406, 556.369873046875, 607.9851684570312, 659.6004638671875, 711.2158203125, 762.8311157226562, 814.4464111328125, 866.061767578125, 917.6770629882812, 969.2924194335938, 1020.90771484375, 1072.5230712890625, 1124.138427734375, 1175.753662109375, 1227.3690185546875, 1278.984375, 1330.5997314453125, 1382.2149658203125, 1433.830322265625, 1485.4456787109375, 1537.06103515625, 1588.67626953125, 1640.2916259765625, 1691.9068603515625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 18.0, 28.0, 41.0, 64.0, 86.0, 102.0, 115.0, 111.0, 117.0, 104.0, 72.0, 47.0, 33.0, 32.0, 8.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-518.6447143554688, -504.4065246582031, -490.1683349609375, -475.9301452636719, -461.69195556640625, -447.4537658691406, -433.215576171875, -418.9773864746094, -404.73919677734375, -390.5010070800781, -376.2628173828125, -362.0246276855469, -347.78643798828125, -333.5482482910156, -319.31005859375, -305.0718688964844, -290.83367919921875, -276.5954895019531, -262.3572998046875, -248.11911010742188, -233.88092041015625, -219.64273071289062, -205.404541015625, -191.16635131835938, -176.92816162109375, -162.68997192382812, -148.4517822265625, -134.21359252929688, -119.97540283203125, -105.73721313476562, -91.4990234375, -77.26083374023438, -63.02264404296875, -48.784454345703125, -34.5462646484375, -20.308074951171875, -6.06988525390625, 8.168304443359375, 22.406494140625, 36.644683837890625, 50.88287353515625, 65.12106323242188, 79.3592529296875, 93.59744262695312, 107.83563232421875, 122.07382202148438, 136.31201171875, 150.55020141601562, 164.78839111328125, 179.02658081054688, 193.2647705078125, 207.50296020507812, 221.74114990234375, 235.97933959960938, 250.217529296875, 264.4557189941406, 278.69390869140625, 292.9320983886719, 307.1702880859375, 321.4084777832031, 335.64666748046875, 349.8848571777344, 364.123046875, 378.3612365722656, 392.59942626953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 13.0, 10.0, 15.0, 15.0, 30.0, 29.0, 43.0, 60.0, 74.0, 116.0, 151.0, 296.0, 514.0, 1127.0, 3427.0, 14292.0, 92097.0, 748962.0, 158497.0, 21057.0, 4701.0, 1398.0, 636.0, 320.0, 191.0, 123.0, 92.0, 69.0, 38.0, 24.0, 39.0, 19.0, 15.0, 11.0, 9.0, 10.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.75, -147.412109375, -142.07421875, -136.736328125, -131.3984375, -126.060546875, -120.72265625, -115.384765625, -110.046875, -104.708984375, -99.37109375, -94.033203125, -88.6953125, -83.357421875, -78.01953125, -72.681640625, -67.34375, -62.005859375, -56.66796875, -51.330078125, -45.9921875, -40.654296875, -35.31640625, -29.978515625, -24.640625, -19.302734375, -13.96484375, -8.626953125, -3.2890625, 2.048828125, 7.38671875, 12.724609375, 18.0625, 23.400390625, 28.73828125, 34.076171875, 39.4140625, 44.751953125, 50.08984375, 55.427734375, 60.765625, 66.103515625, 71.44140625, 76.779296875, 82.1171875, 87.455078125, 92.79296875, 98.130859375, 103.46875, 108.806640625, 114.14453125, 119.482421875, 124.8203125, 130.158203125, 135.49609375, 140.833984375, 146.171875, 151.509765625, 156.84765625, 162.185546875, 167.5234375, 172.861328125, 178.19921875, 183.537109375, 188.875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 14.0, 25.0, 27.0, 47.0, 55.0, 103.0, 94.0, 127.0, 115.0, 127.0, 80.0, 65.0, 57.0, 33.0, 11.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.59375, -51.39599609375, -50.1982421875, -49.00048828125, -47.802734375, -46.60498046875, -45.4072265625, -44.20947265625, -43.01171875, -41.81396484375, -40.6162109375, -39.41845703125, -38.220703125, -37.02294921875, -35.8251953125, -34.62744140625, -33.4296875, -32.23193359375, -31.0341796875, -29.83642578125, -28.638671875, -27.44091796875, -26.2431640625, -25.04541015625, -23.84765625, -22.64990234375, -21.4521484375, -20.25439453125, -19.056640625, -17.85888671875, -16.6611328125, -15.46337890625, -14.265625, -13.06787109375, -11.8701171875, -10.67236328125, -9.474609375, -8.27685546875, -7.0791015625, -5.88134765625, -4.68359375, -3.48583984375, -2.2880859375, -1.09033203125, 0.107421875, 1.30517578125, 2.5029296875, 3.70068359375, 4.8984375, 6.09619140625, 7.2939453125, 8.49169921875, 9.689453125, 10.88720703125, 12.0849609375, 13.28271484375, 14.48046875, 15.67822265625, 16.8759765625, 18.07373046875, 19.271484375, 20.46923828125, 21.6669921875, 22.86474609375, 24.0625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 15.0, 16.0, 21.0, 25.0, 33.0, 62.0, 85.0, 155.0, 234.0, 479.0, 1108.0, 3509.0, 20793.0, 444114.0, 547965.0, 23783.0, 3789.0, 1144.0, 500.0, 253.0, 158.0, 99.0, 61.0, 40.0, 30.0, 20.0, 14.0, 11.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.0, -162.970703125, -156.94140625, -150.912109375, -144.8828125, -138.853515625, -132.82421875, -126.794921875, -120.765625, -114.736328125, -108.70703125, -102.677734375, -96.6484375, -90.619140625, -84.58984375, -78.560546875, -72.53125, -66.501953125, -60.47265625, -54.443359375, -48.4140625, -42.384765625, -36.35546875, -30.326171875, -24.296875, -18.267578125, -12.23828125, -6.208984375, -0.1796875, 5.849609375, 11.87890625, 17.908203125, 23.9375, 29.966796875, 35.99609375, 42.025390625, 48.0546875, 54.083984375, 60.11328125, 66.142578125, 72.171875, 78.201171875, 84.23046875, 90.259765625, 96.2890625, 102.318359375, 108.34765625, 114.376953125, 120.40625, 126.435546875, 132.46484375, 138.494140625, 144.5234375, 150.552734375, 156.58203125, 162.611328125, 168.640625, 174.669921875, 180.69921875, 186.728515625, 192.7578125, 198.787109375, 204.81640625, 210.845703125, 216.875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 1.0, 10.0, 15.0, 12.0, 13.0, 17.0, 25.0, 24.0, 31.0, 46.0, 49.0, 46.0, 67.0, 65.0, 67.0, 58.0, 56.0, 73.0, 42.0, 40.0, 49.0, 36.0, 34.0, 31.0, 24.0, 12.0, 18.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.0, -80.056640625, -77.11328125, -74.169921875, -71.2265625, -68.283203125, -65.33984375, -62.396484375, -59.453125, -56.509765625, -53.56640625, -50.623046875, -47.6796875, -44.736328125, -41.79296875, -38.849609375, -35.90625, -32.962890625, -30.01953125, -27.076171875, -24.1328125, -21.189453125, -18.24609375, -15.302734375, -12.359375, -9.416015625, -6.47265625, -3.529296875, -0.5859375, 2.357421875, 5.30078125, 8.244140625, 11.1875, 14.130859375, 17.07421875, 20.017578125, 22.9609375, 25.904296875, 28.84765625, 31.791015625, 34.734375, 37.677734375, 40.62109375, 43.564453125, 46.5078125, 49.451171875, 52.39453125, 55.337890625, 58.28125, 61.224609375, 64.16796875, 67.111328125, 70.0546875, 72.998046875, 75.94140625, 78.884765625, 81.828125, 84.771484375, 87.71484375, 90.658203125, 93.6015625, 96.544921875, 99.48828125, 102.431640625, 105.375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 21.0, 26.0, 42.0, 79.0, 192.0, 460.0, 1541.0, 8290.0, 137134.0, 864191.0, 31381.0, 3687.0, 897.0, 306.0, 137.0, 59.0, 41.0, 20.0, 12.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.5, -97.201171875, -94.90234375, -92.603515625, -90.3046875, -88.005859375, -85.70703125, -83.408203125, -81.109375, -78.810546875, -76.51171875, -74.212890625, -71.9140625, -69.615234375, -67.31640625, -65.017578125, -62.71875, -60.419921875, -58.12109375, -55.822265625, -53.5234375, -51.224609375, -48.92578125, -46.626953125, -44.328125, -42.029296875, -39.73046875, -37.431640625, -35.1328125, -32.833984375, -30.53515625, -28.236328125, -25.9375, -23.638671875, -21.33984375, -19.041015625, -16.7421875, -14.443359375, -12.14453125, -9.845703125, -7.546875, -5.248046875, -2.94921875, -0.650390625, 1.6484375, 3.947265625, 6.24609375, 8.544921875, 10.84375, 13.142578125, 15.44140625, 17.740234375, 20.0390625, 22.337890625, 24.63671875, 26.935546875, 29.234375, 31.533203125, 33.83203125, 36.130859375, 38.4296875, 40.728515625, 43.02734375, 45.326171875, 47.625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 10.0, 13.0, 9.0, 19.0, 27.0, 27.0, 41.0, 58.0, 55.0, 85.0, 76.0, 92.0, 86.0, 83.0, 62.0, 56.0, 40.0, 46.0, 25.0, 14.0, 14.0, 17.0, 9.0, 7.0, 7.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003284454345703125, -0.0031896233558654785, -0.003094792366027832, -0.0029999613761901855, -0.002905130386352539, -0.0028102993965148926, -0.002715468406677246, -0.0026206374168395996, -0.002525806427001953, -0.0024309754371643066, -0.00233614444732666, -0.0022413134574890137, -0.002146482467651367, -0.0020516514778137207, -0.0019568204879760742, -0.0018619894981384277, -0.0017671585083007812, -0.0016723275184631348, -0.0015774965286254883, -0.0014826655387878418, -0.0013878345489501953, -0.0012930035591125488, -0.0011981725692749023, -0.0011033415794372559, -0.0010085105895996094, -0.0009136795997619629, -0.0008188486099243164, -0.0007240176200866699, -0.0006291866302490234, -0.000534355640411377, -0.00043952465057373047, -0.000344693660736084, -0.0002498626708984375, -0.00015503168106079102, -6.020069122314453e-05, 3.463029861450195e-05, 0.00012946128845214844, 0.00022429227828979492, 0.0003191232681274414, 0.0004139542579650879, 0.0005087852478027344, 0.0006036162376403809, 0.0006984472274780273, 0.0007932782173156738, 0.0008881092071533203, 0.0009829401969909668, 0.0010777711868286133, 0.0011726021766662598, 0.0012674331665039062, 0.0013622641563415527, 0.0014570951461791992, 0.0015519261360168457, 0.0016467571258544922, 0.0017415881156921387, 0.0018364191055297852, 0.0019312500953674316, 0.002026081085205078, 0.0021209120750427246, 0.002215743064880371, 0.0023105740547180176, 0.002405405044555664, 0.0025002360343933105, 0.002595067024230957, 0.0026898980140686035, 0.00278472900390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 12.0, 10.0, 7.0, 8.0, 21.0, 22.0, 41.0, 54.0, 80.0, 128.0, 242.0, 525.0, 1347.0, 4320.0, 22936.0, 410232.0, 572126.0, 28658.0, 5022.0, 1470.0, 603.0, 275.0, 134.0, 79.0, 41.0, 50.0, 29.0, 17.0, 12.0, 11.0, 6.0, 2.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.8349609375, -44.201171875, -42.5673828125, -40.93359375, -39.2998046875, -37.666015625, -36.0322265625, -34.3984375, -32.7646484375, -31.130859375, -29.4970703125, -27.86328125, -26.2294921875, -24.595703125, -22.9619140625, -21.328125, -19.6943359375, -18.060546875, -16.4267578125, -14.79296875, -13.1591796875, -11.525390625, -9.8916015625, -8.2578125, -6.6240234375, -4.990234375, -3.3564453125, -1.72265625, -0.0888671875, 1.544921875, 3.1787109375, 4.8125, 6.4462890625, 8.080078125, 9.7138671875, 11.34765625, 12.9814453125, 14.615234375, 16.2490234375, 17.8828125, 19.5166015625, 21.150390625, 22.7841796875, 24.41796875, 26.0517578125, 27.685546875, 29.3193359375, 30.953125, 32.5869140625, 34.220703125, 35.8544921875, 37.48828125, 39.1220703125, 40.755859375, 42.3896484375, 44.0234375, 45.6572265625, 47.291015625, 48.9248046875, 50.55859375, 52.1923828125, 53.826171875, 55.4599609375, 57.09375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 9.0, 14.0, 11.0, 11.0, 16.0, 19.0, 25.0, 47.0, 61.0, 69.0, 92.0, 108.0, 103.0, 94.0, 77.0, 56.0, 41.0, 25.0, 26.0, 17.0, 13.0, 17.0, 8.0, 3.0, 6.0, 2.0, 3.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.015625, -23.2109375, -22.40625, -21.6015625, -20.796875, -19.9921875, -19.1875, -18.3828125, -17.578125, -16.7734375, -15.96875, -15.1640625, -14.359375, -13.5546875, -12.75, -11.9453125, -11.140625, -10.3359375, -9.53125, -8.7265625, -7.921875, -7.1171875, -6.3125, -5.5078125, -4.703125, -3.8984375, -3.09375, -2.2890625, -1.484375, -0.6796875, 0.125, 0.9296875, 1.734375, 2.5390625, 3.34375, 4.1484375, 4.953125, 5.7578125, 6.5625, 7.3671875, 8.171875, 8.9765625, 9.78125, 10.5859375, 11.390625, 12.1953125, 13.0, 13.8046875, 14.609375, 15.4140625, 16.21875, 17.0234375, 17.828125, 18.6328125, 19.4375, 20.2421875, 21.046875, 21.8515625, 22.65625, 23.4609375, 24.265625, 25.0703125, 25.875, 26.6796875, 27.484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 12.0, 77.0, 240.0, 437.0, 142.0, 53.0, 19.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-880.3253173828125, -842.2881469726562, -804.2509765625, -766.2138061523438, -728.1766357421875, -690.1395263671875, -652.1023559570312, -614.065185546875, -576.0280151367188, -537.9908447265625, -499.95367431640625, -461.9165344238281, -423.8793640136719, -385.8421936035156, -347.8050537109375, -309.76788330078125, -271.730712890625, -233.69354248046875, -195.65638732910156, -157.61923217773438, -119.58206176757812, -81.54489135742188, -43.50773620605469, -5.4705810546875, 32.56658935546875, 70.60375213623047, 108.64091491699219, 146.67807006835938, 184.71524047851562, 222.75241088867188, 260.78955078125, 298.82672119140625, 336.86376953125, 374.90093994140625, 412.9381103515625, 450.9752502441406, 489.0124206542969, 527.049560546875, 565.0867309570312, 603.1239013671875, 641.1610717773438, 679.1982421875, 717.2354125976562, 755.2725830078125, 793.3096923828125, 831.346923828125, 869.384033203125, 907.4212036132812, 945.4583740234375, 983.4955444335938, 1021.53271484375, 1059.56982421875, 1097.6070556640625, 1135.6441650390625, 1173.681396484375, 1211.718505859375, 1249.755615234375, 1287.792724609375, 1325.8299560546875, 1363.8670654296875, 1401.904296875, 1439.94140625, 1477.9786376953125, 1516.0157470703125, 1554.052978515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 24.0, 11.0, 24.0, 32.0, 56.0, 65.0, 44.0, 71.0, 66.0, 72.0, 64.0, 79.0, 76.0, 62.0, 52.0, 45.0, 33.0, 24.0, 16.0, 16.0, 18.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-536.2186279296875, -516.4986572265625, -496.7786560058594, -477.05865478515625, -457.33868408203125, -437.61871337890625, -417.8987121582031, -398.1787109375, -378.458740234375, -358.73876953125, -339.0187683105469, -319.29876708984375, -299.57879638671875, -279.85882568359375, -260.1388244628906, -240.41883850097656, -220.6988525390625, -200.97886657714844, -181.25888061523438, -161.5388946533203, -141.81890869140625, -122.09892272949219, -102.37893676757812, -82.65895080566406, -62.93896484375, -43.21897888183594, -23.498992919921875, -3.7790069580078125, 15.94097900390625, 35.66096496582031, 55.380950927734375, 75.10093688964844, 94.82098388671875, 114.54096984863281, 134.26095581054688, 153.98094177246094, 173.700927734375, 193.42091369628906, 213.14089965820312, 232.8608856201172, 252.58087158203125, 272.30084228515625, 292.0208435058594, 311.7408447265625, 331.4608154296875, 351.1807861328125, 370.9007873535156, 390.62078857421875, 410.34075927734375, 430.06072998046875, 449.7807312011719, 469.500732421875, 489.220703125, 508.940673828125, 528.66064453125, 548.3806762695312, 568.1006469726562, 587.8206176757812, 607.5406494140625, 627.2606201171875, 646.9805908203125, 666.7005615234375, 686.4205322265625, 706.1405639648438, 725.8605346679688]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 9.0, 12.0, 12.0, 34.0, 54.0, 93.0, 188.0, 418.0, 1088.0, 5166.0, 292746.0, 3885330.0, 7530.0, 1027.0, 317.0, 129.0, 58.0, 28.0, 11.0, 11.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-507.0, -495.7578125, -484.515625, -473.2734375, -462.03125, -450.7890625, -439.546875, -428.3046875, -417.0625, -405.8203125, -394.578125, -383.3359375, -372.09375, -360.8515625, -349.609375, -338.3671875, -327.125, -315.8828125, -304.640625, -293.3984375, -282.15625, -270.9140625, -259.671875, -248.4296875, -237.1875, -225.9453125, -214.703125, -203.4609375, -192.21875, -180.9765625, -169.734375, -158.4921875, -147.25, -136.0078125, -124.765625, -113.5234375, -102.28125, -91.0390625, -79.796875, -68.5546875, -57.3125, -46.0703125, -34.828125, -23.5859375, -12.34375, -1.1015625, 10.140625, 21.3828125, 32.625, 43.8671875, 55.109375, 66.3515625, 77.59375, 88.8359375, 100.078125, 111.3203125, 122.5625, 133.8046875, 145.046875, 156.2890625, 167.53125, 178.7734375, 190.015625, 201.2578125, 212.5]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 7.0, 22.0, 35.0, 53.0, 60.0, 98.0, 104.0, 120.0, 109.0, 115.0, 78.0, 62.0, 57.0, 37.0, 20.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.375, -50.1787109375, -48.982421875, -47.7861328125, -46.58984375, -45.3935546875, -44.197265625, -43.0009765625, -41.8046875, -40.6083984375, -39.412109375, -38.2158203125, -37.01953125, -35.8232421875, -34.626953125, -33.4306640625, -32.234375, -31.0380859375, -29.841796875, -28.6455078125, -27.44921875, -26.2529296875, -25.056640625, -23.8603515625, -22.6640625, -21.4677734375, -20.271484375, -19.0751953125, -17.87890625, -16.6826171875, -15.486328125, -14.2900390625, -13.09375, -11.8974609375, -10.701171875, -9.5048828125, -8.30859375, -7.1123046875, -5.916015625, -4.7197265625, -3.5234375, -2.3271484375, -1.130859375, 0.0654296875, 1.26171875, 2.4580078125, 3.654296875, 4.8505859375, 6.046875, 7.2431640625, 8.439453125, 9.6357421875, 10.83203125, 12.0283203125, 13.224609375, 14.4208984375, 15.6171875, 16.8134765625, 18.009765625, 19.2060546875, 20.40234375, 21.5986328125, 22.794921875, 23.9912109375, 25.1875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 12.0, 39.0, 65.0, 156.0, 1046.0, 4192110.0, 500.0, 143.0, 95.0, 46.0, 40.0, 17.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-876.0, -815.09375, -754.1875, -693.28125, -632.375, -571.46875, -510.5625, -449.65625, -388.75, -327.84375, -266.9375, -206.03125, -145.125, -84.21875, -23.3125, 37.59375, 98.5, 159.40625, 220.3125, 281.21875, 342.125, 403.03125, 463.9375, 524.84375, 585.75, 646.65625, 707.5625, 768.46875, 829.375, 890.28125, 951.1875, 1012.09375, 1073.0, 1133.90625, 1194.8125, 1255.71875, 1316.625, 1377.53125, 1438.4375, 1499.34375, 1560.25, 1621.15625, 1682.0625, 1742.96875, 1803.875, 1864.78125, 1925.6875, 1986.59375, 2047.5, 2108.40625, 2169.3125, 2230.21875, 2291.125, 2352.03125, 2412.9375, 2473.84375, 2534.75, 2595.65625, 2656.5625, 2717.46875, 2778.375, 2839.28125, 2900.1875, 2961.09375, 3022.0]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 28.0, 571.0, 3431.0, 50.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.625, -89.275390625, -81.92578125, -74.576171875, -67.2265625, -59.876953125, -52.52734375, -45.177734375, -37.828125, -30.478515625, -23.12890625, -15.779296875, -8.4296875, -1.080078125, 6.26953125, 13.619140625, 20.96875, 28.318359375, 35.66796875, 43.017578125, 50.3671875, 57.716796875, 65.06640625, 72.416015625, 79.765625, 87.115234375, 94.46484375, 101.814453125, 109.1640625, 116.513671875, 123.86328125, 131.212890625, 138.5625, 145.912109375, 153.26171875, 160.611328125, 167.9609375, 175.310546875, 182.66015625, 190.009765625, 197.359375, 204.708984375, 212.05859375, 219.408203125, 226.7578125, 234.107421875, 241.45703125, 248.806640625, 256.15625, 263.505859375, 270.85546875, 278.205078125, 285.5546875, 292.904296875, 300.25390625, 307.603515625, 314.953125, 322.302734375, 329.65234375, 337.001953125, 344.3515625, 351.701171875, 359.05078125, 366.400390625, 373.75]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 916.0, 80.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3067.76220703125, -2971.279296875, -2874.796142578125, -2778.313232421875, -2681.830078125, -2585.34716796875, -2488.8642578125, -2392.381103515625, -2295.89794921875, -2199.4150390625, -2102.931884765625, -2006.448974609375, -1909.9658203125, -1813.48291015625, -1716.9998779296875, -1620.516845703125, -1524.033935546875, -1427.5509033203125, -1331.06787109375, -1234.5849609375, -1138.101806640625, -1041.618896484375, -945.1358642578125, -848.65283203125, -752.1697998046875, -655.686767578125, -559.2037353515625, -462.72076416015625, -366.23773193359375, -269.75469970703125, -173.271728515625, -76.7886962890625, 19.6943359375, 116.17735290527344, 212.66036987304688, 309.14337158203125, 405.62640380859375, 502.10943603515625, 598.5924072265625, 695.075439453125, 791.5584716796875, 888.04150390625, 984.5245361328125, 1081.007568359375, 1177.490478515625, 1273.9736328125, 1370.45654296875, 1466.9395751953125, 1563.422607421875, 1659.9056396484375, 1756.388671875, 1852.87158203125, 1949.354736328125, 2045.837646484375, 2142.32080078125, 2238.8037109375, 2335.28662109375, 2431.76953125, 2528.252685546875, 2624.735595703125, 2721.21875, 2817.70166015625, 2914.1845703125, 3010.667724609375, 3107.15087890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 12.0, 36.0, 62.0, 109.0, 157.0, 200.0, 187.0, 110.0, 73.0, 37.0, 13.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-675.1411743164062, -657.6409301757812, -640.1406860351562, -622.6404418945312, -605.1402587890625, -587.6400146484375, -570.1397705078125, -552.6395263671875, -535.1392822265625, -517.6390380859375, -500.1387939453125, -482.6385803222656, -465.1383361816406, -447.6380920410156, -430.13787841796875, -412.63763427734375, -395.13739013671875, -377.63714599609375, -360.13690185546875, -342.6366882324219, -325.1364440917969, -307.6361999511719, -290.135986328125, -272.6357421875, -255.135498046875, -237.63525390625, -220.13502502441406, -202.63479614257812, -185.13455200195312, -167.63430786132812, -150.1340789794922, -132.63385009765625, -115.1336669921875, -97.63343048095703, -80.13319396972656, -62.632957458496094, -45.132720947265625, -27.632484436035156, -10.132247924804688, 7.367988586425781, 24.86822509765625, 42.36846160888672, 59.86869812011719, 77.36893463134766, 94.86917114257812, 112.3694076538086, 129.86964416503906, 147.369873046875, 164.8701171875, 182.370361328125, 199.87059020996094, 217.37081909179688, 234.87106323242188, 252.37130737304688, 269.87152099609375, 287.37176513671875, 304.87200927734375, 322.37225341796875, 339.87249755859375, 357.3727111816406, 374.8729553222656, 392.3731994628906, 409.8734130859375, 427.3736572265625, 444.8739013671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 11.0, 5.0, 19.0, 25.0, 28.0, 45.0, 58.0, 93.0, 182.0, 333.0, 693.0, 1778.0, 5225.0, 20928.0, 127102.0, 695084.0, 162376.0, 24945.0, 6070.0, 1913.0, 738.0, 364.0, 193.0, 107.0, 62.0, 41.0, 37.0, 21.0, 14.0, 11.0, 8.0, 3.0, 8.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.625, -113.8974609375, -110.169921875, -106.4423828125, -102.71484375, -98.9873046875, -95.259765625, -91.5322265625, -87.8046875, -84.0771484375, -80.349609375, -76.6220703125, -72.89453125, -69.1669921875, -65.439453125, -61.7119140625, -57.984375, -54.2568359375, -50.529296875, -46.8017578125, -43.07421875, -39.3466796875, -35.619140625, -31.8916015625, -28.1640625, -24.4365234375, -20.708984375, -16.9814453125, -13.25390625, -9.5263671875, -5.798828125, -2.0712890625, 1.65625, 5.3837890625, 9.111328125, 12.8388671875, 16.56640625, 20.2939453125, 24.021484375, 27.7490234375, 31.4765625, 35.2041015625, 38.931640625, 42.6591796875, 46.38671875, 50.1142578125, 53.841796875, 57.5693359375, 61.296875, 65.0244140625, 68.751953125, 72.4794921875, 76.20703125, 79.9345703125, 83.662109375, 87.3896484375, 91.1171875, 94.8447265625, 98.572265625, 102.2998046875, 106.02734375, 109.7548828125, 113.482421875, 117.2099609375, 120.9375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 17.0, 19.0, 23.0, 30.0, 45.0, 50.0, 62.0, 66.0, 74.0, 111.0, 90.0, 67.0, 78.0, 62.0, 53.0, 42.0, 37.0, 14.0, 21.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.1875, -32.394287109375, -31.60107421875, -30.807861328125, -30.0146484375, -29.221435546875, -28.42822265625, -27.635009765625, -26.841796875, -26.048583984375, -25.25537109375, -24.462158203125, -23.6689453125, -22.875732421875, -22.08251953125, -21.289306640625, -20.49609375, -19.702880859375, -18.90966796875, -18.116455078125, -17.3232421875, -16.530029296875, -15.73681640625, -14.943603515625, -14.150390625, -13.357177734375, -12.56396484375, -11.770751953125, -10.9775390625, -10.184326171875, -9.39111328125, -8.597900390625, -7.8046875, -7.011474609375, -6.21826171875, -5.425048828125, -4.6318359375, -3.838623046875, -3.04541015625, -2.252197265625, -1.458984375, -0.665771484375, 0.12744140625, 0.920654296875, 1.7138671875, 2.507080078125, 3.30029296875, 4.093505859375, 4.88671875, 5.679931640625, 6.47314453125, 7.266357421875, 8.0595703125, 8.852783203125, 9.64599609375, 10.439208984375, 11.232421875, 12.025634765625, 12.81884765625, 13.612060546875, 14.4052734375, 15.198486328125, 15.99169921875, 16.784912109375, 17.578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 8.0, 15.0, 17.0, 33.0, 43.0, 42.0, 68.0, 118.0, 172.0, 290.0, 520.0, 914.0, 2220.0, 7923.0, 60765.0, 803143.0, 153020.0, 13374.0, 3075.0, 1202.0, 580.0, 371.0, 205.0, 120.0, 80.0, 78.0, 35.0, 32.0, 22.0, 13.0, 9.0, 5.0, 5.0, 8.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-175.625, -170.833984375, -166.04296875, -161.251953125, -156.4609375, -151.669921875, -146.87890625, -142.087890625, -137.296875, -132.505859375, -127.71484375, -122.923828125, -118.1328125, -113.341796875, -108.55078125, -103.759765625, -98.96875, -94.177734375, -89.38671875, -84.595703125, -79.8046875, -75.013671875, -70.22265625, -65.431640625, -60.640625, -55.849609375, -51.05859375, -46.267578125, -41.4765625, -36.685546875, -31.89453125, -27.103515625, -22.3125, -17.521484375, -12.73046875, -7.939453125, -3.1484375, 1.642578125, 6.43359375, 11.224609375, 16.015625, 20.806640625, 25.59765625, 30.388671875, 35.1796875, 39.970703125, 44.76171875, 49.552734375, 54.34375, 59.134765625, 63.92578125, 68.716796875, 73.5078125, 78.298828125, 83.08984375, 87.880859375, 92.671875, 97.462890625, 102.25390625, 107.044921875, 111.8359375, 116.626953125, 121.41796875, 126.208984375, 131.0]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 12.0, 13.0, 23.0, 25.0, 32.0, 42.0, 37.0, 50.0, 58.0, 71.0, 52.0, 57.0, 59.0, 67.0, 52.0, 57.0, 48.0, 50.0, 39.0, 27.0, 18.0, 22.0, 8.0, 9.0, 15.0, 9.0, 8.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-108.625, -105.75, -102.875, -100.0, -97.125, -94.25, -91.375, -88.5, -85.625, -82.75, -79.875, -77.0, -74.125, -71.25, -68.375, -65.5, -62.625, -59.75, -56.875, -54.0, -51.125, -48.25, -45.375, -42.5, -39.625, -36.75, -33.875, -31.0, -28.125, -25.25, -22.375, -19.5, -16.625, -13.75, -10.875, -8.0, -5.125, -2.25, 0.625, 3.5, 6.375, 9.25, 12.125, 15.0, 17.875, 20.75, 23.625, 26.5, 29.375, 32.25, 35.125, 38.0, 40.875, 43.75, 46.625, 49.5, 52.375, 55.25, 58.125, 61.0, 63.875, 66.75, 69.625, 72.5, 75.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 10.0, 15.0, 37.0, 35.0, 79.0, 162.0, 345.0, 1393.0, 11240.0, 904149.0, 125313.0, 4411.0, 782.0, 272.0, 121.0, 70.0, 41.0, 31.0, 15.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.875, -111.853515625, -107.83203125, -103.810546875, -99.7890625, -95.767578125, -91.74609375, -87.724609375, -83.703125, -79.681640625, -75.66015625, -71.638671875, -67.6171875, -63.595703125, -59.57421875, -55.552734375, -51.53125, -47.509765625, -43.48828125, -39.466796875, -35.4453125, -31.423828125, -27.40234375, -23.380859375, -19.359375, -15.337890625, -11.31640625, -7.294921875, -3.2734375, 0.748046875, 4.76953125, 8.791015625, 12.8125, 16.833984375, 20.85546875, 24.876953125, 28.8984375, 32.919921875, 36.94140625, 40.962890625, 44.984375, 49.005859375, 53.02734375, 57.048828125, 61.0703125, 65.091796875, 69.11328125, 73.134765625, 77.15625, 81.177734375, 85.19921875, 89.220703125, 93.2421875, 97.263671875, 101.28515625, 105.306640625, 109.328125, 113.349609375, 117.37109375, 121.392578125, 125.4140625, 129.435546875, 133.45703125, 137.478515625, 141.5]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 7.0, 11.0, 11.0, 14.0, 31.0, 40.0, 42.0, 66.0, 110.0, 103.0, 108.0, 121.0, 88.0, 59.0, 54.0, 33.0, 26.0, 19.0, 9.0, 12.0, 9.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00470733642578125, -0.004578739404678345, -0.0044501423835754395, -0.004321545362472534, -0.004192948341369629, -0.004064351320266724, -0.003935754299163818, -0.003807157278060913, -0.003678560256958008, -0.0035499632358551025, -0.0034213662147521973, -0.003292769193649292, -0.0031641721725463867, -0.0030355751514434814, -0.002906978130340576, -0.002778381109237671, -0.0026497840881347656, -0.0025211870670318604, -0.002392590045928955, -0.00226399302482605, -0.0021353960037231445, -0.0020067989826202393, -0.001878201961517334, -0.0017496049404144287, -0.0016210079193115234, -0.0014924108982086182, -0.0013638138771057129, -0.0012352168560028076, -0.0011066198348999023, -0.000978022813796997, -0.0008494257926940918, -0.0007208287715911865, -0.0005922317504882812, -0.000463634729385376, -0.0003350377082824707, -0.00020644068717956543, -7.784366607666016e-05, 5.075335502624512e-05, 0.0001793503761291504, 0.00030794739723205566, 0.00043654441833496094, 0.0005651414394378662, 0.0006937384605407715, 0.0008223354816436768, 0.000950932502746582, 0.0010795295238494873, 0.0012081265449523926, 0.0013367235660552979, 0.0014653205871582031, 0.0015939176082611084, 0.0017225146293640137, 0.001851111650466919, 0.0019797086715698242, 0.0021083056926727295, 0.0022369027137756348, 0.00236549973487854, 0.0024940967559814453, 0.0026226937770843506, 0.002751290798187256, 0.002879887819290161, 0.0030084848403930664, 0.0031370818614959717, 0.003265678882598877, 0.0033942759037017822, 0.0035228729248046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 11.0, 15.0, 18.0, 31.0, 63.0, 99.0, 227.0, 538.0, 1982.0, 16702.0, 952542.0, 71099.0, 3816.0, 831.0, 263.0, 115.0, 63.0, 53.0, 25.0, 15.0, 14.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-107.9375, -105.0732421875, -102.208984375, -99.3447265625, -96.48046875, -93.6162109375, -90.751953125, -87.8876953125, -85.0234375, -82.1591796875, -79.294921875, -76.4306640625, -73.56640625, -70.7021484375, -67.837890625, -64.9736328125, -62.109375, -59.2451171875, -56.380859375, -53.5166015625, -50.65234375, -47.7880859375, -44.923828125, -42.0595703125, -39.1953125, -36.3310546875, -33.466796875, -30.6025390625, -27.73828125, -24.8740234375, -22.009765625, -19.1455078125, -16.28125, -13.4169921875, -10.552734375, -7.6884765625, -4.82421875, -1.9599609375, 0.904296875, 3.7685546875, 6.6328125, 9.4970703125, 12.361328125, 15.2255859375, 18.08984375, 20.9541015625, 23.818359375, 26.6826171875, 29.546875, 32.4111328125, 35.275390625, 38.1396484375, 41.00390625, 43.8681640625, 46.732421875, 49.5966796875, 52.4609375, 55.3251953125, 58.189453125, 61.0537109375, 63.91796875, 66.7822265625, 69.646484375, 72.5107421875, 75.375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 8.0, 4.0, 20.0, 26.0, 53.0, 94.0, 149.0, 215.0, 170.0, 128.0, 54.0, 33.0, 7.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-69.25, -67.54443359375, -65.8388671875, -64.13330078125, -62.427734375, -60.72216796875, -59.0166015625, -57.31103515625, -55.60546875, -53.89990234375, -52.1943359375, -50.48876953125, -48.783203125, -47.07763671875, -45.3720703125, -43.66650390625, -41.9609375, -40.25537109375, -38.5498046875, -36.84423828125, -35.138671875, -33.43310546875, -31.7275390625, -30.02197265625, -28.31640625, -26.61083984375, -24.9052734375, -23.19970703125, -21.494140625, -19.78857421875, -18.0830078125, -16.37744140625, -14.671875, -12.96630859375, -11.2607421875, -9.55517578125, -7.849609375, -6.14404296875, -4.4384765625, -2.73291015625, -1.02734375, 0.67822265625, 2.3837890625, 4.08935546875, 5.794921875, 7.50048828125, 9.2060546875, 10.91162109375, 12.6171875, 14.32275390625, 16.0283203125, 17.73388671875, 19.439453125, 21.14501953125, 22.8505859375, 24.55615234375, 26.26171875, 27.96728515625, 29.6728515625, 31.37841796875, 33.083984375, 34.78955078125, 36.4951171875, 38.20068359375, 39.90625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 30.0, 103.0, 322.0, 361.0, 116.0, 39.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1742.66015625, -1704.87646484375, -1667.0927734375, -1629.30908203125, -1591.525390625, -1553.74169921875, -1515.9580078125, -1478.17431640625, -1440.390625, -1402.60693359375, -1364.8232421875, -1327.03955078125, -1289.255859375, -1251.47216796875, -1213.6884765625, -1175.90478515625, -1138.12109375, -1100.33740234375, -1062.5537109375, -1024.77001953125, -986.986328125, -949.20263671875, -911.4189453125, -873.63525390625, -835.8515625, -798.06787109375, -760.2841796875, -722.50048828125, -684.716796875, -646.93310546875, -609.1494140625, -571.36572265625, -533.5820922851562, -495.79840087890625, -458.01470947265625, -420.23101806640625, -382.44732666015625, -344.66363525390625, -306.87994384765625, -269.09625244140625, -231.31256103515625, -193.52886962890625, -155.74517822265625, -117.96148681640625, -80.17779541015625, -42.39410400390625, -4.61041259765625, 33.17327880859375, 70.95697021484375, 108.74066162109375, 146.52435302734375, 184.30804443359375, 222.09173583984375, 259.87542724609375, 297.65911865234375, 335.44281005859375, 373.22650146484375, 411.01019287109375, 448.79388427734375, 486.57757568359375, 524.3612670898438, 562.1449584960938, 599.9286499023438, 637.7123413085938, 675.4960327148438]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 2.0, 9.0, 5.0, 8.0, 15.0, 11.0, 21.0, 34.0, 36.0, 30.0, 32.0, 51.0, 53.0, 54.0, 53.0, 53.0, 54.0, 50.0, 60.0, 56.0, 46.0, 44.0, 45.0, 39.0, 36.0, 26.0, 18.0, 13.0, 11.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.62591552734375, -417.2890930175781, -401.9522705078125, -386.61541748046875, -371.2785949707031, -355.9417724609375, -340.6049499511719, -325.26812744140625, -309.9312744140625, -294.5944519042969, -279.25762939453125, -263.9207763671875, -248.58395385742188, -233.24713134765625, -217.91030883789062, -202.573486328125, -187.23666381835938, -171.89984130859375, -156.56300354003906, -141.22618103027344, -125.88935089111328, -110.55252075195312, -95.2156982421875, -79.87886810302734, -64.54203796386719, -49.20520782470703, -33.86838150024414, -18.53155517578125, -3.1947250366210938, 12.142105102539062, 27.478927612304688, 42.815757751464844, 58.152587890625, 73.48941802978516, 88.82624816894531, 104.16307067871094, 119.4999008178711, 134.83673095703125, 150.17355346679688, 165.5103759765625, 180.8472137451172, 196.1840362548828, 211.5208740234375, 226.85769653320312, 242.19451904296875, 257.5313720703125, 272.8681640625, 288.20501708984375, 303.5418395996094, 318.878662109375, 334.2154846191406, 349.55230712890625, 364.88916015625, 380.2259826660156, 395.56280517578125, 410.8996276855469, 426.2364501953125, 441.5732727050781, 456.91009521484375, 472.2469482421875, 487.5837707519531, 502.92059326171875, 518.2574462890625, 533.59423828125, 548.9310913085938]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 12.0, 13.0, 23.0, 33.0, 53.0, 92.0, 143.0, 232.0, 437.0, 1019.0, 2925.0, 11564.0, 103484.0, 3975721.0, 84603.0, 10036.0, 2437.0, 756.0, 335.0, 162.0, 68.0, 60.0, 21.0, 22.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0], "bins": [-283.0, -276.9091796875, -270.818359375, -264.7275390625, -258.63671875, -252.5458984375, -246.455078125, -240.3642578125, -234.2734375, -228.1826171875, -222.091796875, -216.0009765625, -209.91015625, -203.8193359375, -197.728515625, -191.6376953125, -185.546875, -179.4560546875, -173.365234375, -167.2744140625, -161.18359375, -155.0927734375, -149.001953125, -142.9111328125, -136.8203125, -130.7294921875, -124.638671875, -118.5478515625, -112.45703125, -106.3662109375, -100.275390625, -94.1845703125, -88.09375, -82.0029296875, -75.912109375, -69.8212890625, -63.73046875, -57.6396484375, -51.548828125, -45.4580078125, -39.3671875, -33.2763671875, -27.185546875, -21.0947265625, -15.00390625, -8.9130859375, -2.822265625, 3.2685546875, 9.359375, 15.4501953125, 21.541015625, 27.6318359375, 33.72265625, 39.8134765625, 45.904296875, 51.9951171875, 58.0859375, 64.1767578125, 70.267578125, 76.3583984375, 82.44921875, 88.5400390625, 94.630859375, 100.7216796875, 106.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 10.0, 14.0, 29.0, 21.0, 25.0, 31.0, 54.0, 68.0, 68.0, 61.0, 75.0, 75.0, 80.0, 65.0, 70.0, 48.0, 34.0, 43.0, 38.0, 25.0, 15.0, 14.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.765625, -30.053955078125, -29.34228515625, -28.630615234375, -27.9189453125, -27.207275390625, -26.49560546875, -25.783935546875, -25.072265625, -24.360595703125, -23.64892578125, -22.937255859375, -22.2255859375, -21.513916015625, -20.80224609375, -20.090576171875, -19.37890625, -18.667236328125, -17.95556640625, -17.243896484375, -16.5322265625, -15.820556640625, -15.10888671875, -14.397216796875, -13.685546875, -12.973876953125, -12.26220703125, -11.550537109375, -10.8388671875, -10.127197265625, -9.41552734375, -8.703857421875, -7.9921875, -7.280517578125, -6.56884765625, -5.857177734375, -5.1455078125, -4.433837890625, -3.72216796875, -3.010498046875, -2.298828125, -1.587158203125, -0.87548828125, -0.163818359375, 0.5478515625, 1.259521484375, 1.97119140625, 2.682861328125, 3.39453125, 4.106201171875, 4.81787109375, 5.529541015625, 6.2412109375, 6.952880859375, 7.66455078125, 8.376220703125, 9.087890625, 9.799560546875, 10.51123046875, 11.222900390625, 11.9345703125, 12.646240234375, 13.35791015625, 14.069580078125, 14.78125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 5.0, 10.0, 15.0, 26.0, 32.0, 49.0, 108.0, 214.0, 480.0, 1248.0, 3867.0, 17764.0, 1024281.0, 3115028.0, 23092.0, 5132.0, 1681.0, 615.0, 268.0, 133.0, 69.0, 51.0, 26.0, 28.0, 11.0, 9.0, 6.0, 6.0, 9.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.375, -152.921875, -147.46875, -142.015625, -136.5625, -131.109375, -125.65625, -120.203125, -114.75, -109.296875, -103.84375, -98.390625, -92.9375, -87.484375, -82.03125, -76.578125, -71.125, -65.671875, -60.21875, -54.765625, -49.3125, -43.859375, -38.40625, -32.953125, -27.5, -22.046875, -16.59375, -11.140625, -5.6875, -0.234375, 5.21875, 10.671875, 16.125, 21.578125, 27.03125, 32.484375, 37.9375, 43.390625, 48.84375, 54.296875, 59.75, 65.203125, 70.65625, 76.109375, 81.5625, 87.015625, 92.46875, 97.921875, 103.375, 108.828125, 114.28125, 119.734375, 125.1875, 130.640625, 136.09375, 141.546875, 147.0, 152.453125, 157.90625, 163.359375, 168.8125, 174.265625, 179.71875, 185.171875, 190.625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 13.0, 11.0, 16.0, 35.0, 57.0, 113.0, 258.0, 1047.0, 1866.0, 336.0, 122.0, 61.0, 32.0, 23.0, 16.0, 9.0, 2.0, 9.0, 6.0, 2.0, 5.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.9375, -45.326171875, -43.71484375, -42.103515625, -40.4921875, -38.880859375, -37.26953125, -35.658203125, -34.046875, -32.435546875, -30.82421875, -29.212890625, -27.6015625, -25.990234375, -24.37890625, -22.767578125, -21.15625, -19.544921875, -17.93359375, -16.322265625, -14.7109375, -13.099609375, -11.48828125, -9.876953125, -8.265625, -6.654296875, -5.04296875, -3.431640625, -1.8203125, -0.208984375, 1.40234375, 3.013671875, 4.625, 6.236328125, 7.84765625, 9.458984375, 11.0703125, 12.681640625, 14.29296875, 15.904296875, 17.515625, 19.126953125, 20.73828125, 22.349609375, 23.9609375, 25.572265625, 27.18359375, 28.794921875, 30.40625, 32.017578125, 33.62890625, 35.240234375, 36.8515625, 38.462890625, 40.07421875, 41.685546875, 43.296875, 44.908203125, 46.51953125, 48.130859375, 49.7421875, 51.353515625, 52.96484375, 54.576171875, 56.1875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 35.0, 95.0, 393.0, 331.0, 89.0, 26.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-287.711181640625, -269.74853515625, -251.78590393066406, -233.82327270507812, -215.86062622070312, -197.89797973632812, -179.9353485107422, -161.97271728515625, -144.01007080078125, -126.04743194580078, -108.08479309082031, -90.12215423583984, -72.15951538085938, -54.196876525878906, -36.23423767089844, -18.27159881591797, -0.3089599609375, 17.65367889404297, 35.61631774902344, 53.578956604003906, 71.54159545898438, 89.50423431396484, 107.46687316894531, 125.42951202392578, 143.39215087890625, 161.35479736328125, 179.3174285888672, 197.28005981445312, 215.24270629882812, 233.20535278320312, 251.16798400878906, 269.130615234375, 287.09326171875, 305.055908203125, 323.0185546875, 340.9811706542969, 358.9438171386719, 376.9064636230469, 394.86907958984375, 412.83172607421875, 430.79437255859375, 448.75701904296875, 466.71966552734375, 484.6822814941406, 502.6449279785156, 520.6075439453125, 538.5701904296875, 556.5328369140625, 574.4954833984375, 592.4581298828125, 610.4207763671875, 628.3834228515625, 646.3460693359375, 664.3086547851562, 682.2713012695312, 700.2339477539062, 718.1965942382812, 736.1592407226562, 754.1218872070312, 772.0845336914062, 790.047119140625, 808.009765625, 825.972412109375, 843.93505859375, 861.897705078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 17.0, 20.0, 29.0, 31.0, 36.0, 43.0, 52.0, 56.0, 64.0, 69.0, 56.0, 64.0, 67.0, 49.0, 53.0, 54.0, 43.0, 41.0, 35.0, 28.0, 18.0, 17.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-206.3984375, -200.08758544921875, -193.77671813964844, -187.4658660888672, -181.15499877929688, -174.84414672851562, -168.53329467773438, -162.22242736816406, -155.91156005859375, -149.6007080078125, -143.2898406982422, -136.97898864746094, -130.66812133789062, -124.35726928710938, -118.0464096069336, -111.73554992675781, -105.42469787597656, -99.11383819580078, -92.802978515625, -86.49212646484375, -80.18125915527344, -73.87040710449219, -67.5595474243164, -61.248687744140625, -54.937828063964844, -48.62696838378906, -42.31610870361328, -36.005252838134766, -29.694393157958984, -23.383533477783203, -17.072677612304688, -10.761817932128906, -4.4509429931640625, 1.8599157333374023, 8.170774459838867, 14.481632232666016, 20.792491912841797, 27.103351593017578, 33.414207458496094, 39.725067138671875, 46.035926818847656, 52.34678649902344, 58.65764617919922, 64.968505859375, 71.27935791015625, 77.59022521972656, 83.90107727050781, 90.2119369506836, 96.52279663085938, 102.83365631103516, 109.14451599121094, 115.45536804199219, 121.7662353515625, 128.07708740234375, 134.387939453125, 140.6988067626953, 147.00967407226562, 153.32052612304688, 159.6313934326172, 165.94224548339844, 172.25311279296875, 178.56396484375, 184.87481689453125, 191.18568420410156, 197.4965362548828]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 6.0, 8.0, 4.0, 12.0, 11.0, 28.0, 23.0, 38.0, 61.0, 89.0, 138.0, 227.0, 393.0, 681.0, 1519.0, 3670.0, 9988.0, 32014.0, 139868.0, 559678.0, 230433.0, 47241.0, 13596.0, 4846.0, 1989.0, 823.0, 476.0, 252.0, 151.0, 92.0, 54.0, 48.0, 29.0, 18.0, 13.0, 14.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0625, -70.51171875, -67.9609375, -65.41015625, -62.859375, -60.30859375, -57.7578125, -55.20703125, -52.65625, -50.10546875, -47.5546875, -45.00390625, -42.453125, -39.90234375, -37.3515625, -34.80078125, -32.25, -29.69921875, -27.1484375, -24.59765625, -22.046875, -19.49609375, -16.9453125, -14.39453125, -11.84375, -9.29296875, -6.7421875, -4.19140625, -1.640625, 0.91015625, 3.4609375, 6.01171875, 8.5625, 11.11328125, 13.6640625, 16.21484375, 18.765625, 21.31640625, 23.8671875, 26.41796875, 28.96875, 31.51953125, 34.0703125, 36.62109375, 39.171875, 41.72265625, 44.2734375, 46.82421875, 49.375, 51.92578125, 54.4765625, 57.02734375, 59.578125, 62.12890625, 64.6796875, 67.23046875, 69.78125, 72.33203125, 74.8828125, 77.43359375, 79.984375, 82.53515625, 85.0859375, 87.63671875, 90.1875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 12.0, 11.0, 28.0, 20.0, 42.0, 44.0, 52.0, 53.0, 71.0, 66.0, 73.0, 68.0, 78.0, 63.0, 50.0, 59.0, 43.0, 48.0, 22.0, 28.0, 15.0, 10.0, 11.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.88720703125, -21.2431640625, -20.59912109375, -19.955078125, -19.31103515625, -18.6669921875, -18.02294921875, -17.37890625, -16.73486328125, -16.0908203125, -15.44677734375, -14.802734375, -14.15869140625, -13.5146484375, -12.87060546875, -12.2265625, -11.58251953125, -10.9384765625, -10.29443359375, -9.650390625, -9.00634765625, -8.3623046875, -7.71826171875, -7.07421875, -6.43017578125, -5.7861328125, -5.14208984375, -4.498046875, -3.85400390625, -3.2099609375, -2.56591796875, -1.921875, -1.27783203125, -0.6337890625, 0.01025390625, 0.654296875, 1.29833984375, 1.9423828125, 2.58642578125, 3.23046875, 3.87451171875, 4.5185546875, 5.16259765625, 5.806640625, 6.45068359375, 7.0947265625, 7.73876953125, 8.3828125, 9.02685546875, 9.6708984375, 10.31494140625, 10.958984375, 11.60302734375, 12.2470703125, 12.89111328125, 13.53515625, 14.17919921875, 14.8232421875, 15.46728515625, 16.111328125, 16.75537109375, 17.3994140625, 18.04345703125, 18.6875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 8.0, 20.0, 16.0, 25.0, 46.0, 70.0, 100.0, 130.0, 186.0, 288.0, 460.0, 755.0, 1437.0, 3342.0, 10557.0, 46638.0, 309824.0, 559661.0, 88247.0, 17452.0, 4836.0, 1871.0, 951.0, 563.0, 340.0, 232.0, 139.0, 106.0, 90.0, 41.0, 34.0, 20.0, 12.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.1875, -78.583984375, -75.98046875, -73.376953125, -70.7734375, -68.169921875, -65.56640625, -62.962890625, -60.359375, -57.755859375, -55.15234375, -52.548828125, -49.9453125, -47.341796875, -44.73828125, -42.134765625, -39.53125, -36.927734375, -34.32421875, -31.720703125, -29.1171875, -26.513671875, -23.91015625, -21.306640625, -18.703125, -16.099609375, -13.49609375, -10.892578125, -8.2890625, -5.685546875, -3.08203125, -0.478515625, 2.125, 4.728515625, 7.33203125, 9.935546875, 12.5390625, 15.142578125, 17.74609375, 20.349609375, 22.953125, 25.556640625, 28.16015625, 30.763671875, 33.3671875, 35.970703125, 38.57421875, 41.177734375, 43.78125, 46.384765625, 48.98828125, 51.591796875, 54.1953125, 56.798828125, 59.40234375, 62.005859375, 64.609375, 67.212890625, 69.81640625, 72.419921875, 75.0234375, 77.626953125, 80.23046875, 82.833984375, 85.4375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 10.0, 7.0, 9.0, 19.0, 23.0, 16.0, 22.0, 26.0, 37.0, 52.0, 36.0, 39.0, 40.0, 53.0, 51.0, 52.0, 48.0, 41.0, 51.0, 43.0, 38.0, 37.0, 46.0, 22.0, 33.0, 23.0, 15.0, 16.0, 17.0, 21.0, 14.0, 11.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-77.3125, -75.224609375, -73.13671875, -71.048828125, -68.9609375, -66.873046875, -64.78515625, -62.697265625, -60.609375, -58.521484375, -56.43359375, -54.345703125, -52.2578125, -50.169921875, -48.08203125, -45.994140625, -43.90625, -41.818359375, -39.73046875, -37.642578125, -35.5546875, -33.466796875, -31.37890625, -29.291015625, -27.203125, -25.115234375, -23.02734375, -20.939453125, -18.8515625, -16.763671875, -14.67578125, -12.587890625, -10.5, -8.412109375, -6.32421875, -4.236328125, -2.1484375, -0.060546875, 2.02734375, 4.115234375, 6.203125, 8.291015625, 10.37890625, 12.466796875, 14.5546875, 16.642578125, 18.73046875, 20.818359375, 22.90625, 24.994140625, 27.08203125, 29.169921875, 31.2578125, 33.345703125, 35.43359375, 37.521484375, 39.609375, 41.697265625, 43.78515625, 45.873046875, 47.9609375, 50.048828125, 52.13671875, 54.224609375, 56.3125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 6.0, 16.0, 17.0, 28.0, 37.0, 61.0, 96.0, 154.0, 261.0, 453.0, 874.0, 2055.0, 6008.0, 28296.0, 966604.0, 32755.0, 6543.0, 2188.0, 909.0, 472.0, 274.0, 163.0, 93.0, 63.0, 30.0, 19.0, 14.0, 12.0, 12.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-151.875, -147.4765625, -143.078125, -138.6796875, -134.28125, -129.8828125, -125.484375, -121.0859375, -116.6875, -112.2890625, -107.890625, -103.4921875, -99.09375, -94.6953125, -90.296875, -85.8984375, -81.5, -77.1015625, -72.703125, -68.3046875, -63.90625, -59.5078125, -55.109375, -50.7109375, -46.3125, -41.9140625, -37.515625, -33.1171875, -28.71875, -24.3203125, -19.921875, -15.5234375, -11.125, -6.7265625, -2.328125, 2.0703125, 6.46875, 10.8671875, 15.265625, 19.6640625, 24.0625, 28.4609375, 32.859375, 37.2578125, 41.65625, 46.0546875, 50.453125, 54.8515625, 59.25, 63.6484375, 68.046875, 72.4453125, 76.84375, 81.2421875, 85.640625, 90.0390625, 94.4375, 98.8359375, 103.234375, 107.6328125, 112.03125, 116.4296875, 120.828125, 125.2265625, 129.625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 19.0, 21.0, 36.0, 68.0, 91.0, 115.0, 123.0, 126.0, 143.0, 85.0, 53.0, 45.0, 16.0, 13.0, 3.0, 7.0, 3.0, 2.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00388336181640625, -0.0037270188331604004, -0.0035706758499145508, -0.003414332866668701, -0.0032579898834228516, -0.003101646900177002, -0.0029453039169311523, -0.0027889609336853027, -0.002632617950439453, -0.0024762749671936035, -0.002319931983947754, -0.0021635890007019043, -0.0020072460174560547, -0.001850903034210205, -0.0016945600509643555, -0.0015382170677185059, -0.0013818740844726562, -0.0012255311012268066, -0.001069188117980957, -0.0009128451347351074, -0.0007565021514892578, -0.0006001591682434082, -0.0004438161849975586, -0.000287473201751709, -0.00013113021850585938, 2.5212764739990234e-05, 0.00018155574798583984, 0.00033789873123168945, 0.0004942417144775391, 0.0006505846977233887, 0.0008069276809692383, 0.0009632706642150879, 0.0011196136474609375, 0.0012759566307067871, 0.0014322996139526367, 0.0015886425971984863, 0.001744985580444336, 0.0019013285636901855, 0.002057671546936035, 0.0022140145301818848, 0.0023703575134277344, 0.002526700496673584, 0.0026830434799194336, 0.002839386463165283, 0.002995729446411133, 0.0031520724296569824, 0.003308415412902832, 0.0034647583961486816, 0.0036211013793945312, 0.003777444362640381, 0.0039337873458862305, 0.00409013032913208, 0.00424647331237793, 0.004402816295623779, 0.004559159278869629, 0.0047155022621154785, 0.004871845245361328, 0.005028188228607178, 0.005184531211853027, 0.005340874195098877, 0.0054972171783447266, 0.005653560161590576, 0.005809903144836426, 0.005966246128082275, 0.006122589111328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 13.0, 24.0, 29.0, 32.0, 40.0, 64.0, 80.0, 131.0, 257.0, 418.0, 633.0, 1130.0, 2305.0, 5462.0, 23879.0, 946851.0, 53178.0, 7676.0, 2793.0, 1378.0, 817.0, 479.0, 271.0, 170.0, 112.0, 77.0, 56.0, 34.0, 29.0, 20.0, 15.0, 12.0, 10.0, 7.0, 4.0, 1.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-118.0625, -114.4462890625, -110.830078125, -107.2138671875, -103.59765625, -99.9814453125, -96.365234375, -92.7490234375, -89.1328125, -85.5166015625, -81.900390625, -78.2841796875, -74.66796875, -71.0517578125, -67.435546875, -63.8193359375, -60.203125, -56.5869140625, -52.970703125, -49.3544921875, -45.73828125, -42.1220703125, -38.505859375, -34.8896484375, -31.2734375, -27.6572265625, -24.041015625, -20.4248046875, -16.80859375, -13.1923828125, -9.576171875, -5.9599609375, -2.34375, 1.2724609375, 4.888671875, 8.5048828125, 12.12109375, 15.7373046875, 19.353515625, 22.9697265625, 26.5859375, 30.2021484375, 33.818359375, 37.4345703125, 41.05078125, 44.6669921875, 48.283203125, 51.8994140625, 55.515625, 59.1318359375, 62.748046875, 66.3642578125, 69.98046875, 73.5966796875, 77.212890625, 80.8291015625, 84.4453125, 88.0615234375, 91.677734375, 95.2939453125, 98.91015625, 102.5263671875, 106.142578125, 109.7587890625, 113.375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 4.0, 11.0, 13.0, 14.0, 28.0, 97.0, 222.0, 305.0, 163.0, 44.0, 24.0, 13.0, 10.0, 6.0, 1.0, 5.0, 4.0, 2.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.625, -68.365234375, -66.10546875, -63.845703125, -61.5859375, -59.326171875, -57.06640625, -54.806640625, -52.546875, -50.287109375, -48.02734375, -45.767578125, -43.5078125, -41.248046875, -38.98828125, -36.728515625, -34.46875, -32.208984375, -29.94921875, -27.689453125, -25.4296875, -23.169921875, -20.91015625, -18.650390625, -16.390625, -14.130859375, -11.87109375, -9.611328125, -7.3515625, -5.091796875, -2.83203125, -0.572265625, 1.6875, 3.947265625, 6.20703125, 8.466796875, 10.7265625, 12.986328125, 15.24609375, 17.505859375, 19.765625, 22.025390625, 24.28515625, 26.544921875, 28.8046875, 31.064453125, 33.32421875, 35.583984375, 37.84375, 40.103515625, 42.36328125, 44.623046875, 46.8828125, 49.142578125, 51.40234375, 53.662109375, 55.921875, 58.181640625, 60.44140625, 62.701171875, 64.9609375, 67.220703125, 69.48046875, 71.740234375, 74.0]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 13.0, 15.0, 46.0, 140.0, 372.0, 297.0, 90.0, 22.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1907.246826171875, -1863.828125, -1820.4093017578125, -1776.9906005859375, -1733.57177734375, -1690.153076171875, -1646.7342529296875, -1603.3155517578125, -1559.896728515625, -1516.47802734375, -1473.0592041015625, -1429.6405029296875, -1386.2216796875, -1342.802978515625, -1299.3841552734375, -1255.9654541015625, -1212.546630859375, -1169.1279296875, -1125.7091064453125, -1082.2904052734375, -1038.87158203125, -995.4528198242188, -952.0340576171875, -908.6153564453125, -865.1966552734375, -821.7778930664062, -778.359130859375, -734.9403686523438, -691.5216064453125, -648.1028442382812, -604.68408203125, -561.265380859375, -517.8465576171875, -474.42779541015625, -431.009033203125, -387.59027099609375, -344.1715087890625, -300.75274658203125, -257.3340148925781, -213.91525268554688, -170.49649047851562, -127.07772827148438, -83.65897369384766, -40.24021911621094, 3.1785430908203125, 46.59730529785156, 90.01605224609375, 133.434814453125, 176.85357666015625, 220.2723388671875, 263.69110107421875, 307.10986328125, 350.52862548828125, 393.9473876953125, 437.3661193847656, 480.7848815917969, 524.20361328125, 567.6223754882812, 611.0411376953125, 654.4598999023438, 697.878662109375, 741.2974243164062, 784.7161865234375, 828.1348876953125, 871.5537109375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 9.0, 10.0, 8.0, 14.0, 14.0, 21.0, 24.0, 21.0, 23.0, 32.0, 32.0, 39.0, 47.0, 46.0, 45.0, 36.0, 37.0, 40.0, 39.0, 36.0, 40.0, 34.0, 33.0, 32.0, 39.0, 29.0, 17.0, 24.0, 31.0, 15.0, 22.0, 10.0, 16.0, 14.0, 18.0, 11.0, 4.0, 6.0, 2.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-368.9228515625, -357.8231506347656, -346.72344970703125, -335.623779296875, -324.5240783691406, -313.42437744140625, -302.3246765136719, -291.2249755859375, -280.1252746582031, -269.02557373046875, -257.9258728027344, -246.82618713378906, -235.7264862060547, -224.62680053710938, -213.527099609375, -202.42739868164062, -191.3277130126953, -180.22801208496094, -169.12832641601562, -158.02862548828125, -146.92892456054688, -135.8292236328125, -124.72953796386719, -113.62983703613281, -102.53014373779297, -91.43045043945312, -80.33074951171875, -69.2310562133789, -58.1313591003418, -47.03166198730469, -35.931968688964844, -24.83226776123047, -13.732574462890625, -2.632878303527832, 8.466817855834961, 19.566513061523438, 30.666210174560547, 41.765907287597656, 52.8656005859375, 63.965301513671875, 75.06499481201172, 86.16468811035156, 97.26438903808594, 108.36408233642578, 119.46377563476562, 130.5634765625, 141.66317749023438, 152.76287841796875, 163.86256408691406, 174.96226501464844, 186.06195068359375, 197.16165161132812, 208.2613525390625, 219.36105346679688, 230.4607391357422, 241.56044006347656, 252.66012573242188, 263.75982666015625, 274.8595275878906, 285.959228515625, 297.05889892578125, 308.1585998535156, 319.25830078125, 330.3580017089844, 341.45770263671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 10.0, 6.0, 10.0, 14.0, 32.0, 36.0, 70.0, 80.0, 153.0, 277.0, 505.0, 1012.0, 2111.0, 5377.0, 16846.0, 84617.0, 3696800.0, 338117.0, 34194.0, 8634.0, 2821.0, 1221.0, 602.0, 291.0, 168.0, 105.0, 52.0, 44.0, 16.0, 17.0, 12.0, 6.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.0625, -76.572265625, -74.08203125, -71.591796875, -69.1015625, -66.611328125, -64.12109375, -61.630859375, -59.140625, -56.650390625, -54.16015625, -51.669921875, -49.1796875, -46.689453125, -44.19921875, -41.708984375, -39.21875, -36.728515625, -34.23828125, -31.748046875, -29.2578125, -26.767578125, -24.27734375, -21.787109375, -19.296875, -16.806640625, -14.31640625, -11.826171875, -9.3359375, -6.845703125, -4.35546875, -1.865234375, 0.625, 3.115234375, 5.60546875, 8.095703125, 10.5859375, 13.076171875, 15.56640625, 18.056640625, 20.546875, 23.037109375, 25.52734375, 28.017578125, 30.5078125, 32.998046875, 35.48828125, 37.978515625, 40.46875, 42.958984375, 45.44921875, 47.939453125, 50.4296875, 52.919921875, 55.41015625, 57.900390625, 60.390625, 62.880859375, 65.37109375, 67.861328125, 70.3515625, 72.841796875, 75.33203125, 77.822265625, 80.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 8.0, 11.0, 12.0, 14.0, 10.0, 17.0, 22.0, 31.0, 19.0, 42.0, 45.0, 41.0, 35.0, 59.0, 69.0, 63.0, 52.0, 52.0, 52.0, 52.0, 49.0, 36.0, 39.0, 27.0, 32.0, 23.0, 21.0, 21.0, 11.0, 12.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.7265625, -17.1875, -16.6484375, -16.109375, -15.5703125, -15.03125, -14.4921875, -13.953125, -13.4140625, -12.875, -12.3359375, -11.796875, -11.2578125, -10.71875, -10.1796875, -9.640625, -9.1015625, -8.5625, -8.0234375, -7.484375, -6.9453125, -6.40625, -5.8671875, -5.328125, -4.7890625, -4.25, -3.7109375, -3.171875, -2.6328125, -2.09375, -1.5546875, -1.015625, -0.4765625, 0.0625, 0.6015625, 1.140625, 1.6796875, 2.21875, 2.7578125, 3.296875, 3.8359375, 4.375, 4.9140625, 5.453125, 5.9921875, 6.53125, 7.0703125, 7.609375, 8.1484375, 8.6875, 9.2265625, 9.765625, 10.3046875, 10.84375, 11.3828125, 11.921875, 12.4609375, 13.0, 13.5390625, 14.078125, 14.6171875, 15.15625, 15.6953125, 16.234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 15.0, 13.0, 25.0, 14.0, 33.0, 40.0, 60.0, 82.0, 112.0, 218.0, 360.0, 944.0, 3032.0, 15410.0, 227492.0, 3865131.0, 68951.0, 8683.0, 2006.0, 729.0, 382.0, 192.0, 109.0, 83.0, 49.0, 35.0, 26.0, 14.0, 11.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.375, -90.294921875, -87.21484375, -84.134765625, -81.0546875, -77.974609375, -74.89453125, -71.814453125, -68.734375, -65.654296875, -62.57421875, -59.494140625, -56.4140625, -53.333984375, -50.25390625, -47.173828125, -44.09375, -41.013671875, -37.93359375, -34.853515625, -31.7734375, -28.693359375, -25.61328125, -22.533203125, -19.453125, -16.373046875, -13.29296875, -10.212890625, -7.1328125, -4.052734375, -0.97265625, 2.107421875, 5.1875, 8.267578125, 11.34765625, 14.427734375, 17.5078125, 20.587890625, 23.66796875, 26.748046875, 29.828125, 32.908203125, 35.98828125, 39.068359375, 42.1484375, 45.228515625, 48.30859375, 51.388671875, 54.46875, 57.548828125, 60.62890625, 63.708984375, 66.7890625, 69.869140625, 72.94921875, 76.029296875, 79.109375, 82.189453125, 85.26953125, 88.349609375, 91.4296875, 94.509765625, 97.58984375, 100.669921875, 103.75]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 4.0, 16.0, 24.0, 54.0, 97.0, 247.0, 2065.0, 1042.0, 259.0, 109.0, 60.0, 26.0, 22.0, 14.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.15625, -36.91943359375, -35.6826171875, -34.44580078125, -33.208984375, -31.97216796875, -30.7353515625, -29.49853515625, -28.26171875, -27.02490234375, -25.7880859375, -24.55126953125, -23.314453125, -22.07763671875, -20.8408203125, -19.60400390625, -18.3671875, -17.13037109375, -15.8935546875, -14.65673828125, -13.419921875, -12.18310546875, -10.9462890625, -9.70947265625, -8.47265625, -7.23583984375, -5.9990234375, -4.76220703125, -3.525390625, -2.28857421875, -1.0517578125, 0.18505859375, 1.421875, 2.65869140625, 3.8955078125, 5.13232421875, 6.369140625, 7.60595703125, 8.8427734375, 10.07958984375, 11.31640625, 12.55322265625, 13.7900390625, 15.02685546875, 16.263671875, 17.50048828125, 18.7373046875, 19.97412109375, 21.2109375, 22.44775390625, 23.6845703125, 24.92138671875, 26.158203125, 27.39501953125, 28.6318359375, 29.86865234375, 31.10546875, 32.34228515625, 33.5791015625, 34.81591796875, 36.052734375, 37.28955078125, 38.5263671875, 39.76318359375, 41.0]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 44.0, 409.0, 417.0, 89.0, 22.0, 12.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-444.410400390625, -425.7106018066406, -407.01080322265625, -388.31097412109375, -369.6111755371094, -350.911376953125, -332.2115478515625, -313.5117492675781, -294.81195068359375, -276.1121520996094, -257.412353515625, -238.7125244140625, -220.01272583007812, -201.31292724609375, -182.6131134033203, -163.91329956054688, -145.2135009765625, -126.5136947631836, -107.81388854980469, -89.11408233642578, -70.41427612304688, -51.71446990966797, -33.01466369628906, -14.314849853515625, 4.38494873046875, 23.084754943847656, 41.78456115722656, 60.48436737060547, 79.18417358398438, 97.88397979736328, 116.58378601074219, 135.28359985351562, 153.98333740234375, 172.68313598632812, 191.38294982910156, 210.082763671875, 228.78256225585938, 247.48236083984375, 266.18218994140625, 284.8819885253906, 303.581787109375, 322.2815856933594, 340.98138427734375, 359.68121337890625, 378.3810119628906, 397.080810546875, 415.7806396484375, 434.4804382324219, 453.18023681640625, 471.8800354003906, 490.579833984375, 509.2796630859375, 527.9794921875, 546.6792602539062, 565.3790893554688, 584.078857421875, 602.7786865234375, 621.478515625, 640.1782836914062, 658.8781127929688, 677.577880859375, 696.2777099609375, 714.9775390625, 733.6773681640625, 752.3771362304688]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 7.0, 8.0, 9.0, 9.0, 7.0, 17.0, 19.0, 18.0, 23.0, 28.0, 23.0, 30.0, 36.0, 43.0, 35.0, 34.0, 46.0, 41.0, 29.0, 34.0, 37.0, 45.0, 33.0, 30.0, 35.0, 44.0, 34.0, 30.0, 23.0, 30.0, 22.0, 28.0, 18.0, 12.0, 19.0, 13.0, 12.0, 12.0, 6.0, 3.0, 5.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-87.89079284667969, -85.0030288696289, -82.11527252197266, -79.22750854492188, -76.33975219726562, -73.45198822021484, -70.56422424316406, -67.67646789550781, -64.78870391845703, -61.900943756103516, -59.01318359375, -56.12541961669922, -53.2376594543457, -50.34989929199219, -47.462135314941406, -44.57437515258789, -41.686614990234375, -38.79885482788086, -35.911094665527344, -33.02333068847656, -30.135570526123047, -27.24781036376953, -24.360048294067383, -21.472286224365234, -18.58452606201172, -15.696764945983887, -12.809003829956055, -9.921242713928223, -7.033481597900391, -4.145720481872559, -1.2579593658447266, 1.6298027038574219, 4.5175628662109375, 7.4053239822387695, 10.293085098266602, 13.180846214294434, 16.068607330322266, 18.95636749267578, 21.84412956237793, 24.731891632080078, 27.619651794433594, 30.50741195678711, 33.395172119140625, 36.282936096191406, 39.17069625854492, 42.05845642089844, 44.94622039794922, 47.833980560302734, 50.72174072265625, 53.609500885009766, 56.49726104736328, 59.38502502441406, 62.27278518676758, 65.1605453491211, 68.04830932617188, 70.93606567382812, 73.8238296508789, 76.71159362792969, 79.59934997558594, 82.48711395263672, 85.3748779296875, 88.26263427734375, 91.15039825439453, 94.03816223144531, 96.92591857910156]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 20.0, 20.0, 25.0, 35.0, 43.0, 74.0, 124.0, 176.0, 247.0, 439.0, 800.0, 1387.0, 2576.0, 4884.0, 10446.0, 23478.0, 58832.0, 169852.0, 396982.0, 240063.0, 80841.0, 30687.0, 13051.0, 6118.0, 3154.0, 1710.0, 900.0, 556.0, 350.0, 229.0, 132.0, 99.0, 48.0, 38.0, 29.0, 20.0, 15.0, 14.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.0625, -55.201171875, -53.33984375, -51.478515625, -49.6171875, -47.755859375, -45.89453125, -44.033203125, -42.171875, -40.310546875, -38.44921875, -36.587890625, -34.7265625, -32.865234375, -31.00390625, -29.142578125, -27.28125, -25.419921875, -23.55859375, -21.697265625, -19.8359375, -17.974609375, -16.11328125, -14.251953125, -12.390625, -10.529296875, -8.66796875, -6.806640625, -4.9453125, -3.083984375, -1.22265625, 0.638671875, 2.5, 4.361328125, 6.22265625, 8.083984375, 9.9453125, 11.806640625, 13.66796875, 15.529296875, 17.390625, 19.251953125, 21.11328125, 22.974609375, 24.8359375, 26.697265625, 28.55859375, 30.419921875, 32.28125, 34.142578125, 36.00390625, 37.865234375, 39.7265625, 41.587890625, 43.44921875, 45.310546875, 47.171875, 49.033203125, 50.89453125, 52.755859375, 54.6171875, 56.478515625, 58.33984375, 60.201171875, 62.0625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 8.0, 16.0, 13.0, 21.0, 28.0, 26.0, 27.0, 38.0, 45.0, 47.0, 56.0, 71.0, 64.0, 61.0, 60.0, 52.0, 40.0, 53.0, 46.0, 39.0, 35.0, 28.0, 31.0, 21.0, 15.0, 11.0, 11.0, 5.0, 2.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.421875, -18.8712158203125, -18.320556640625, -17.7698974609375, -17.21923828125, -16.6685791015625, -16.117919921875, -15.5672607421875, -15.0166015625, -14.4659423828125, -13.915283203125, -13.3646240234375, -12.81396484375, -12.2633056640625, -11.712646484375, -11.1619873046875, -10.611328125, -10.0606689453125, -9.510009765625, -8.9593505859375, -8.40869140625, -7.8580322265625, -7.307373046875, -6.7567138671875, -6.2060546875, -5.6553955078125, -5.104736328125, -4.5540771484375, -4.00341796875, -3.4527587890625, -2.902099609375, -2.3514404296875, -1.80078125, -1.2501220703125, -0.699462890625, -0.1488037109375, 0.40185546875, 0.9525146484375, 1.503173828125, 2.0538330078125, 2.6044921875, 3.1551513671875, 3.705810546875, 4.2564697265625, 4.80712890625, 5.3577880859375, 5.908447265625, 6.4591064453125, 7.009765625, 7.5604248046875, 8.111083984375, 8.6617431640625, 9.21240234375, 9.7630615234375, 10.313720703125, 10.8643798828125, 11.4150390625, 11.9656982421875, 12.516357421875, 13.0670166015625, 13.61767578125, 14.1683349609375, 14.718994140625, 15.2696533203125, 15.8203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 9.0, 10.0, 13.0, 19.0, 26.0, 31.0, 49.0, 70.0, 101.0, 117.0, 131.0, 200.0, 288.0, 442.0, 634.0, 1163.0, 2550.0, 7259.0, 30900.0, 214365.0, 637868.0, 122042.0, 19998.0, 5224.0, 2059.0, 987.0, 595.0, 375.0, 268.0, 220.0, 131.0, 84.0, 74.0, 54.0, 48.0, 45.0, 19.0, 17.0, 12.0, 10.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-102.25, -99.185546875, -96.12109375, -93.056640625, -89.9921875, -86.927734375, -83.86328125, -80.798828125, -77.734375, -74.669921875, -71.60546875, -68.541015625, -65.4765625, -62.412109375, -59.34765625, -56.283203125, -53.21875, -50.154296875, -47.08984375, -44.025390625, -40.9609375, -37.896484375, -34.83203125, -31.767578125, -28.703125, -25.638671875, -22.57421875, -19.509765625, -16.4453125, -13.380859375, -10.31640625, -7.251953125, -4.1875, -1.123046875, 1.94140625, 5.005859375, 8.0703125, 11.134765625, 14.19921875, 17.263671875, 20.328125, 23.392578125, 26.45703125, 29.521484375, 32.5859375, 35.650390625, 38.71484375, 41.779296875, 44.84375, 47.908203125, 50.97265625, 54.037109375, 57.1015625, 60.166015625, 63.23046875, 66.294921875, 69.359375, 72.423828125, 75.48828125, 78.552734375, 81.6171875, 84.681640625, 87.74609375, 90.810546875, 93.875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 13.0, 7.0, 17.0, 13.0, 29.0, 32.0, 28.0, 35.0, 45.0, 28.0, 32.0, 34.0, 44.0, 56.0, 40.0, 48.0, 54.0, 39.0, 34.0, 39.0, 46.0, 27.0, 35.0, 24.0, 33.0, 22.0, 18.0, 23.0, 15.0, 14.0, 11.0, 9.0, 7.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-71.0625, -69.005859375, -66.94921875, -64.892578125, -62.8359375, -60.779296875, -58.72265625, -56.666015625, -54.609375, -52.552734375, -50.49609375, -48.439453125, -46.3828125, -44.326171875, -42.26953125, -40.212890625, -38.15625, -36.099609375, -34.04296875, -31.986328125, -29.9296875, -27.873046875, -25.81640625, -23.759765625, -21.703125, -19.646484375, -17.58984375, -15.533203125, -13.4765625, -11.419921875, -9.36328125, -7.306640625, -5.25, -3.193359375, -1.13671875, 0.919921875, 2.9765625, 5.033203125, 7.08984375, 9.146484375, 11.203125, 13.259765625, 15.31640625, 17.373046875, 19.4296875, 21.486328125, 23.54296875, 25.599609375, 27.65625, 29.712890625, 31.76953125, 33.826171875, 35.8828125, 37.939453125, 39.99609375, 42.052734375, 44.109375, 46.166015625, 48.22265625, 50.279296875, 52.3359375, 54.392578125, 56.44921875, 58.505859375, 60.5625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 8.0, 6.0, 16.0, 14.0, 21.0, 28.0, 43.0, 66.0, 97.0, 149.0, 251.0, 532.0, 1030.0, 2347.0, 6248.0, 19604.0, 117735.0, 797957.0, 77617.0, 15470.0, 5274.0, 2047.0, 849.0, 463.0, 244.0, 137.0, 101.0, 71.0, 39.0, 27.0, 12.0, 13.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-73.75, -71.66748046875, -69.5849609375, -67.50244140625, -65.419921875, -63.33740234375, -61.2548828125, -59.17236328125, -57.08984375, -55.00732421875, -52.9248046875, -50.84228515625, -48.759765625, -46.67724609375, -44.5947265625, -42.51220703125, -40.4296875, -38.34716796875, -36.2646484375, -34.18212890625, -32.099609375, -30.01708984375, -27.9345703125, -25.85205078125, -23.76953125, -21.68701171875, -19.6044921875, -17.52197265625, -15.439453125, -13.35693359375, -11.2744140625, -9.19189453125, -7.109375, -5.02685546875, -2.9443359375, -0.86181640625, 1.220703125, 3.30322265625, 5.3857421875, 7.46826171875, 9.55078125, 11.63330078125, 13.7158203125, 15.79833984375, 17.880859375, 19.96337890625, 22.0458984375, 24.12841796875, 26.2109375, 28.29345703125, 30.3759765625, 32.45849609375, 34.541015625, 36.62353515625, 38.7060546875, 40.78857421875, 42.87109375, 44.95361328125, 47.0361328125, 49.11865234375, 51.201171875, 53.28369140625, 55.3662109375, 57.44873046875, 59.53125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 6.0, 9.0, 10.0, 8.0, 13.0, 25.0, 46.0, 52.0, 56.0, 62.0, 101.0, 105.0, 108.0, 91.0, 59.0, 56.0, 35.0, 45.0, 22.0, 10.0, 15.0, 8.0, 9.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.004180908203125, -0.004057109355926514, -0.003933310508728027, -0.003809511661529541, -0.0036857128143310547, -0.0035619139671325684, -0.003438115119934082, -0.0033143162727355957, -0.0031905174255371094, -0.003066718578338623, -0.0029429197311401367, -0.0028191208839416504, -0.002695322036743164, -0.0025715231895446777, -0.0024477243423461914, -0.002323925495147705, -0.0022001266479492188, -0.0020763278007507324, -0.001952528953552246, -0.0018287301063537598, -0.0017049312591552734, -0.0015811324119567871, -0.0014573335647583008, -0.0013335347175598145, -0.0012097358703613281, -0.0010859370231628418, -0.0009621381759643555, -0.0008383393287658691, -0.0007145404815673828, -0.0005907416343688965, -0.00046694278717041016, -0.00034314393997192383, -0.0002193450927734375, -9.554624557495117e-05, 2.8252601623535156e-05, 0.00015205144882202148, 0.0002758502960205078, 0.00039964914321899414, 0.0005234479904174805, 0.0006472468376159668, 0.0007710456848144531, 0.0008948445320129395, 0.0010186433792114258, 0.0011424422264099121, 0.0012662410736083984, 0.0013900399208068848, 0.001513838768005371, 0.0016376376152038574, 0.0017614364624023438, 0.00188523530960083, 0.0020090341567993164, 0.0021328330039978027, 0.002256631851196289, 0.0023804306983947754, 0.0025042295455932617, 0.002628028392791748, 0.0027518272399902344, 0.0028756260871887207, 0.002999424934387207, 0.0031232237815856934, 0.0032470226287841797, 0.003370821475982666, 0.0034946203231811523, 0.0036184191703796387, 0.003742218017578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 10.0, 7.0, 11.0, 21.0, 22.0, 44.0, 65.0, 114.0, 180.0, 450.0, 1263.0, 5866.0, 69209.0, 935269.0, 30582.0, 3771.0, 929.0, 336.0, 139.0, 102.0, 64.0, 29.0, 15.0, 17.0, 15.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.5625, -121.9091796875, -118.255859375, -114.6025390625, -110.94921875, -107.2958984375, -103.642578125, -99.9892578125, -96.3359375, -92.6826171875, -89.029296875, -85.3759765625, -81.72265625, -78.0693359375, -74.416015625, -70.7626953125, -67.109375, -63.4560546875, -59.802734375, -56.1494140625, -52.49609375, -48.8427734375, -45.189453125, -41.5361328125, -37.8828125, -34.2294921875, -30.576171875, -26.9228515625, -23.26953125, -19.6162109375, -15.962890625, -12.3095703125, -8.65625, -5.0029296875, -1.349609375, 2.3037109375, 5.95703125, 9.6103515625, 13.263671875, 16.9169921875, 20.5703125, 24.2236328125, 27.876953125, 31.5302734375, 35.18359375, 38.8369140625, 42.490234375, 46.1435546875, 49.796875, 53.4501953125, 57.103515625, 60.7568359375, 64.41015625, 68.0634765625, 71.716796875, 75.3701171875, 79.0234375, 82.6767578125, 86.330078125, 89.9833984375, 93.63671875, 97.2900390625, 100.943359375, 104.5966796875, 108.25]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 6.0, 15.0, 14.0, 26.0, 32.0, 79.0, 121.0, 201.0, 177.0, 122.0, 79.0, 27.0, 18.0, 15.0, 12.0, 12.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.0, -70.10009765625, -68.2001953125, -66.30029296875, -64.400390625, -62.50048828125, -60.6005859375, -58.70068359375, -56.80078125, -54.90087890625, -53.0009765625, -51.10107421875, -49.201171875, -47.30126953125, -45.4013671875, -43.50146484375, -41.6015625, -39.70166015625, -37.8017578125, -35.90185546875, -34.001953125, -32.10205078125, -30.2021484375, -28.30224609375, -26.40234375, -24.50244140625, -22.6025390625, -20.70263671875, -18.802734375, -16.90283203125, -15.0029296875, -13.10302734375, -11.203125, -9.30322265625, -7.4033203125, -5.50341796875, -3.603515625, -1.70361328125, 0.1962890625, 2.09619140625, 3.99609375, 5.89599609375, 7.7958984375, 9.69580078125, 11.595703125, 13.49560546875, 15.3955078125, 17.29541015625, 19.1953125, 21.09521484375, 22.9951171875, 24.89501953125, 26.794921875, 28.69482421875, 30.5947265625, 32.49462890625, 34.39453125, 36.29443359375, 38.1943359375, 40.09423828125, 41.994140625, 43.89404296875, 45.7939453125, 47.69384765625, 49.59375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 25.0, 118.0, 611.0, 225.0, 14.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3334.91552734375, -3246.25830078125, -3157.60107421875, -3068.94384765625, -2980.28662109375, -2891.62939453125, -2802.97216796875, -2714.31494140625, -2625.65771484375, -2537.00048828125, -2448.34326171875, -2359.68603515625, -2271.02880859375, -2182.37158203125, -2093.71435546875, -2005.0572509765625, -1916.400146484375, -1827.742919921875, -1739.085693359375, -1650.428466796875, -1561.771240234375, -1473.114013671875, -1384.4569091796875, -1295.7996826171875, -1207.1424560546875, -1118.4852294921875, -1029.8280029296875, -941.1708374023438, -852.5136108398438, -763.8563842773438, -675.19921875, -586.5419921875, -497.884521484375, -409.227294921875, -320.5700988769531, -231.91290283203125, -143.25567626953125, -54.59844970703125, 34.0587158203125, 122.7159423828125, 211.3731689453125, 300.0303955078125, 388.6875915527344, 477.34478759765625, 566.0020141601562, 654.6592407226562, 743.31640625, 831.9736328125, 920.630859375, 1009.2880859375, 1097.9453125, 1186.6025390625, 1275.259765625, 1363.9169921875, 1452.5740966796875, 1541.2313232421875, 1629.8885498046875, 1718.5457763671875, 1807.2030029296875, 1895.860107421875, 1984.517333984375, 2073.174560546875, 2161.831787109375, 2250.489013671875, 2339.146240234375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 3.0, 5.0, 9.0, 11.0, 20.0, 20.0, 13.0, 22.0, 18.0, 18.0, 30.0, 46.0, 37.0, 38.0, 61.0, 39.0, 52.0, 44.0, 51.0, 38.0, 41.0, 36.0, 45.0, 36.0, 41.0, 37.0, 31.0, 23.0, 20.0, 15.0, 18.0, 17.0, 18.0, 8.0, 6.0, 5.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.515380859375, -387.03643798828125, -373.5575256347656, -360.0785827636719, -346.5996398925781, -333.1207275390625, -319.64178466796875, -306.162841796875, -292.68389892578125, -279.2049560546875, -265.7260437011719, -252.24710083007812, -238.76815795898438, -225.2892303466797, -211.810302734375, -198.33135986328125, -184.85243225097656, -171.37350463867188, -157.89456176757812, -144.41563415527344, -130.9366912841797, -117.457763671875, -103.97882843017578, -90.49989318847656, -77.02095794677734, -63.542022705078125, -50.063087463378906, -36.58415603637695, -23.105220794677734, -9.626289367675781, 3.8526458740234375, 17.331581115722656, 30.810516357421875, 44.289451599121094, 57.76838684082031, 71.247314453125, 84.72625732421875, 98.20518493652344, 111.68412017822266, 125.16305541992188, 138.64199829101562, 152.1209259033203, 165.59986877441406, 179.07879638671875, 192.5577392578125, 206.0366668701172, 219.51559448242188, 232.99453735351562, 246.4734649658203, 259.952392578125, 273.43133544921875, 286.9102783203125, 300.3891906738281, 313.8681335449219, 327.3470764160156, 340.82598876953125, 354.304931640625, 367.78387451171875, 381.2627868652344, 394.7417297363281, 408.2206726074219, 421.6995849609375, 435.17852783203125, 448.657470703125, 462.13641357421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 13.0, 20.0, 43.0, 88.0, 141.0, 315.0, 638.0, 1769.0, 4570.0, 17028.0, 142159.0, 3902585.0, 104270.0, 14497.0, 3800.0, 1278.0, 524.0, 245.0, 134.0, 62.0, 37.0, 20.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.375, -95.6171875, -91.859375, -88.1015625, -84.34375, -80.5859375, -76.828125, -73.0703125, -69.3125, -65.5546875, -61.796875, -58.0390625, -54.28125, -50.5234375, -46.765625, -43.0078125, -39.25, -35.4921875, -31.734375, -27.9765625, -24.21875, -20.4609375, -16.703125, -12.9453125, -9.1875, -5.4296875, -1.671875, 2.0859375, 5.84375, 9.6015625, 13.359375, 17.1171875, 20.875, 24.6328125, 28.390625, 32.1484375, 35.90625, 39.6640625, 43.421875, 47.1796875, 50.9375, 54.6953125, 58.453125, 62.2109375, 65.96875, 69.7265625, 73.484375, 77.2421875, 81.0, 84.7578125, 88.515625, 92.2734375, 96.03125, 99.7890625, 103.546875, 107.3046875, 111.0625, 114.8203125, 118.578125, 122.3359375, 126.09375, 129.8515625, 133.609375, 137.3671875, 141.125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 11.0, 6.0, 8.0, 19.0, 18.0, 23.0, 21.0, 16.0, 24.0, 30.0, 42.0, 36.0, 36.0, 47.0, 39.0, 61.0, 46.0, 47.0, 48.0, 30.0, 49.0, 41.0, 28.0, 34.0, 29.0, 24.0, 38.0, 26.0, 15.0, 21.0, 22.0, 11.0, 8.0, 10.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.3046875, -14.7930908203125, -14.281494140625, -13.7698974609375, -13.25830078125, -12.7467041015625, -12.235107421875, -11.7235107421875, -11.2119140625, -10.7003173828125, -10.188720703125, -9.6771240234375, -9.16552734375, -8.6539306640625, -8.142333984375, -7.6307373046875, -7.119140625, -6.6075439453125, -6.095947265625, -5.5843505859375, -5.07275390625, -4.5611572265625, -4.049560546875, -3.5379638671875, -3.0263671875, -2.5147705078125, -2.003173828125, -1.4915771484375, -0.97998046875, -0.4683837890625, 0.043212890625, 0.5548095703125, 1.06640625, 1.5780029296875, 2.089599609375, 2.6011962890625, 3.11279296875, 3.6243896484375, 4.135986328125, 4.6475830078125, 5.1591796875, 5.6707763671875, 6.182373046875, 6.6939697265625, 7.20556640625, 7.7171630859375, 8.228759765625, 8.7403564453125, 9.251953125, 9.7635498046875, 10.275146484375, 10.7867431640625, 11.29833984375, 11.8099365234375, 12.321533203125, 12.8331298828125, 13.3447265625, 13.8563232421875, 14.367919921875, 14.8795166015625, 15.39111328125, 15.9027099609375, 16.414306640625, 16.9259033203125, 17.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 22.0, 21.0, 44.0, 72.0, 150.0, 298.0, 709.0, 1803.0, 5177.0, 22977.0, 381794.0, 3703236.0, 63205.0, 9682.0, 2994.0, 1121.0, 482.0, 216.0, 115.0, 57.0, 26.0, 20.0, 12.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.4375, -90.2412109375, -87.044921875, -83.8486328125, -80.65234375, -77.4560546875, -74.259765625, -71.0634765625, -67.8671875, -64.6708984375, -61.474609375, -58.2783203125, -55.08203125, -51.8857421875, -48.689453125, -45.4931640625, -42.296875, -39.1005859375, -35.904296875, -32.7080078125, -29.51171875, -26.3154296875, -23.119140625, -19.9228515625, -16.7265625, -13.5302734375, -10.333984375, -7.1376953125, -3.94140625, -0.7451171875, 2.451171875, 5.6474609375, 8.84375, 12.0400390625, 15.236328125, 18.4326171875, 21.62890625, 24.8251953125, 28.021484375, 31.2177734375, 34.4140625, 37.6103515625, 40.806640625, 44.0029296875, 47.19921875, 50.3955078125, 53.591796875, 56.7880859375, 59.984375, 63.1806640625, 66.376953125, 69.5732421875, 72.76953125, 75.9658203125, 79.162109375, 82.3583984375, 85.5546875, 88.7509765625, 91.947265625, 95.1435546875, 98.33984375, 101.5361328125, 104.732421875, 107.9287109375, 111.125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 16.0, 20.0, 31.0, 60.0, 94.0, 156.0, 445.0, 1958.0, 727.0, 229.0, 128.0, 63.0, 39.0, 22.0, 11.0, 12.0, 8.0, 7.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -27.879150390625, -26.64892578125, -25.418701171875, -24.1884765625, -22.958251953125, -21.72802734375, -20.497802734375, -19.267578125, -18.037353515625, -16.80712890625, -15.576904296875, -14.3466796875, -13.116455078125, -11.88623046875, -10.656005859375, -9.42578125, -8.195556640625, -6.96533203125, -5.735107421875, -4.5048828125, -3.274658203125, -2.04443359375, -0.814208984375, 0.416015625, 1.646240234375, 2.87646484375, 4.106689453125, 5.3369140625, 6.567138671875, 7.79736328125, 9.027587890625, 10.2578125, 11.488037109375, 12.71826171875, 13.948486328125, 15.1787109375, 16.408935546875, 17.63916015625, 18.869384765625, 20.099609375, 21.329833984375, 22.56005859375, 23.790283203125, 25.0205078125, 26.250732421875, 27.48095703125, 28.711181640625, 29.94140625, 31.171630859375, 32.40185546875, 33.632080078125, 34.8623046875, 36.092529296875, 37.32275390625, 38.552978515625, 39.783203125, 41.013427734375, 42.24365234375, 43.473876953125, 44.7041015625, 45.934326171875, 47.16455078125, 48.394775390625, 49.625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 35.0, 139.0, 306.0, 290.0, 142.0, 37.0, 19.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-218.39405822753906, -206.19766235351562, -194.0012664794922, -181.80487060546875, -169.60845947265625, -157.41207885742188, -145.21566772460938, -133.01927185058594, -120.8228759765625, -108.62648010253906, -96.43008422851562, -84.23368072509766, -72.03728485107422, -59.84088897705078, -47.64448547363281, -35.448089599609375, -23.251693725585938, -11.055295944213867, 1.1411018371582031, 13.337501525878906, 25.533897399902344, 37.73029327392578, 49.92669677734375, 62.12309265136719, 74.31948852539062, 86.51588439941406, 98.7122802734375, 110.90868377685547, 123.1050796508789, 135.30148315429688, 147.4978790283203, 159.69427490234375, 171.89068603515625, 184.0870819091797, 196.28347778320312, 208.47988891601562, 220.67626953125, 232.8726806640625, 245.06907653808594, 257.2654724121094, 269.46185302734375, 281.65826416015625, 293.8546447753906, 306.0510559082031, 318.2474365234375, 330.44384765625, 342.6402587890625, 354.8366394042969, 367.0330505371094, 379.2294616699219, 391.42584228515625, 403.62225341796875, 415.8186340332031, 428.0150451660156, 440.21142578125, 452.4078369140625, 464.604248046875, 476.8006591796875, 488.9970397949219, 501.1934509277344, 513.3898315429688, 525.5862426757812, 537.7826538085938, 549.97900390625, 562.1754150390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 5.0, 6.0, 12.0, 16.0, 20.0, 31.0, 21.0, 29.0, 50.0, 54.0, 55.0, 49.0, 51.0, 59.0, 47.0, 65.0, 62.0, 55.0, 43.0, 56.0, 35.0, 33.0, 27.0, 25.0, 18.0, 16.0, 15.0, 11.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.82026672363281, -110.4427719116211, -106.06526947021484, -101.68777465820312, -97.31027221679688, -92.93277740478516, -88.55528259277344, -84.17778015136719, -79.80028533935547, -75.42279052734375, -71.0452880859375, -66.66779327392578, -62.2902946472168, -57.91279602050781, -53.535301208496094, -49.15780258178711, -44.780303955078125, -40.40280532836914, -36.025306701660156, -31.647811889648438, -27.270313262939453, -22.89281463623047, -18.515317916870117, -14.137821197509766, -9.760322570800781, -5.382824897766113, -1.0053272247314453, 3.3721704483032227, 7.749668121337891, 12.127166748046875, 16.504663467407227, 20.882160186767578, 25.259658813476562, 29.637157440185547, 34.01465606689453, 38.39215087890625, 42.769649505615234, 47.14714813232422, 51.52464294433594, 55.90214157104492, 60.279640197753906, 64.65713500976562, 69.03463745117188, 73.4121322631836, 77.78962707519531, 82.16712951660156, 86.54462432861328, 90.922119140625, 95.29962158203125, 99.67711639404297, 104.05461883544922, 108.43211364746094, 112.80961608886719, 117.1871109008789, 121.56460571289062, 125.94210815429688, 130.31961059570312, 134.69711303710938, 139.07460021972656, 143.4521026611328, 147.82960510253906, 152.20709228515625, 156.5845947265625, 160.96209716796875, 165.33958435058594]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 9.0, 9.0, 14.0, 16.0, 20.0, 33.0, 59.0, 84.0, 120.0, 172.0, 277.0, 462.0, 726.0, 1386.0, 2513.0, 5551.0, 13148.0, 35223.0, 124288.0, 517001.0, 250837.0, 60333.0, 20012.0, 8162.0, 3735.0, 1841.0, 934.0, 546.0, 333.0, 228.0, 160.0, 103.0, 64.0, 46.0, 32.0, 21.0, 16.0, 6.0, 4.0, 10.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-87.5, -84.98046875, -82.4609375, -79.94140625, -77.421875, -74.90234375, -72.3828125, -69.86328125, -67.34375, -64.82421875, -62.3046875, -59.78515625, -57.265625, -54.74609375, -52.2265625, -49.70703125, -47.1875, -44.66796875, -42.1484375, -39.62890625, -37.109375, -34.58984375, -32.0703125, -29.55078125, -27.03125, -24.51171875, -21.9921875, -19.47265625, -16.953125, -14.43359375, -11.9140625, -9.39453125, -6.875, -4.35546875, -1.8359375, 0.68359375, 3.203125, 5.72265625, 8.2421875, 10.76171875, 13.28125, 15.80078125, 18.3203125, 20.83984375, 23.359375, 25.87890625, 28.3984375, 30.91796875, 33.4375, 35.95703125, 38.4765625, 40.99609375, 43.515625, 46.03515625, 48.5546875, 51.07421875, 53.59375, 56.11328125, 58.6328125, 61.15234375, 63.671875, 66.19140625, 68.7109375, 71.23046875, 73.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 16.0, 27.0, 19.0, 24.0, 35.0, 39.0, 43.0, 44.0, 43.0, 63.0, 58.0, 55.0, 55.0, 64.0, 45.0, 42.0, 56.0, 36.0, 36.0, 35.0, 16.0, 26.0, 18.0, 21.0, 15.0, 14.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.298583984375, -16.67529296875, -16.052001953125, -15.4287109375, -14.805419921875, -14.18212890625, -13.558837890625, -12.935546875, -12.312255859375, -11.68896484375, -11.065673828125, -10.4423828125, -9.819091796875, -9.19580078125, -8.572509765625, -7.94921875, -7.325927734375, -6.70263671875, -6.079345703125, -5.4560546875, -4.832763671875, -4.20947265625, -3.586181640625, -2.962890625, -2.339599609375, -1.71630859375, -1.093017578125, -0.4697265625, 0.153564453125, 0.77685546875, 1.400146484375, 2.0234375, 2.646728515625, 3.27001953125, 3.893310546875, 4.5166015625, 5.139892578125, 5.76318359375, 6.386474609375, 7.009765625, 7.633056640625, 8.25634765625, 8.879638671875, 9.5029296875, 10.126220703125, 10.74951171875, 11.372802734375, 11.99609375, 12.619384765625, 13.24267578125, 13.865966796875, 14.4892578125, 15.112548828125, 15.73583984375, 16.359130859375, 16.982421875, 17.605712890625, 18.22900390625, 18.852294921875, 19.4755859375, 20.098876953125, 20.72216796875, 21.345458984375, 21.96875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 5.0, 16.0, 19.0, 27.0, 36.0, 44.0, 57.0, 66.0, 100.0, 160.0, 255.0, 306.0, 495.0, 846.0, 1757.0, 4828.0, 22183.0, 200866.0, 729007.0, 70161.0, 10992.0, 3056.0, 1237.0, 647.0, 404.0, 276.0, 184.0, 142.0, 100.0, 68.0, 56.0, 35.0, 32.0, 21.0, 18.0, 15.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-148.0, -143.68359375, -139.3671875, -135.05078125, -130.734375, -126.41796875, -122.1015625, -117.78515625, -113.46875, -109.15234375, -104.8359375, -100.51953125, -96.203125, -91.88671875, -87.5703125, -83.25390625, -78.9375, -74.62109375, -70.3046875, -65.98828125, -61.671875, -57.35546875, -53.0390625, -48.72265625, -44.40625, -40.08984375, -35.7734375, -31.45703125, -27.140625, -22.82421875, -18.5078125, -14.19140625, -9.875, -5.55859375, -1.2421875, 3.07421875, 7.390625, 11.70703125, 16.0234375, 20.33984375, 24.65625, 28.97265625, 33.2890625, 37.60546875, 41.921875, 46.23828125, 50.5546875, 54.87109375, 59.1875, 63.50390625, 67.8203125, 72.13671875, 76.453125, 80.76953125, 85.0859375, 89.40234375, 93.71875, 98.03515625, 102.3515625, 106.66796875, 110.984375, 115.30078125, 119.6171875, 123.93359375, 128.25]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 8.0, 7.0, 9.0, 14.0, 9.0, 24.0, 17.0, 40.0, 31.0, 48.0, 45.0, 49.0, 61.0, 59.0, 43.0, 47.0, 49.0, 61.0, 43.0, 59.0, 42.0, 48.0, 29.0, 33.0, 29.0, 15.0, 20.0, 11.0, 18.0, 4.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-97.5, -94.572265625, -91.64453125, -88.716796875, -85.7890625, -82.861328125, -79.93359375, -77.005859375, -74.078125, -71.150390625, -68.22265625, -65.294921875, -62.3671875, -59.439453125, -56.51171875, -53.583984375, -50.65625, -47.728515625, -44.80078125, -41.873046875, -38.9453125, -36.017578125, -33.08984375, -30.162109375, -27.234375, -24.306640625, -21.37890625, -18.451171875, -15.5234375, -12.595703125, -9.66796875, -6.740234375, -3.8125, -0.884765625, 2.04296875, 4.970703125, 7.8984375, 10.826171875, 13.75390625, 16.681640625, 19.609375, 22.537109375, 25.46484375, 28.392578125, 31.3203125, 34.248046875, 37.17578125, 40.103515625, 43.03125, 45.958984375, 48.88671875, 51.814453125, 54.7421875, 57.669921875, 60.59765625, 63.525390625, 66.453125, 69.380859375, 72.30859375, 75.236328125, 78.1640625, 81.091796875, 84.01953125, 86.947265625, 89.875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 9.0, 10.0, 27.0, 32.0, 77.0, 142.0, 434.0, 1718.0, 19466.0, 1002752.0, 21312.0, 1793.0, 457.0, 156.0, 70.0, 36.0, 16.0, 15.0, 14.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.375, -221.330078125, -213.28515625, -205.240234375, -197.1953125, -189.150390625, -181.10546875, -173.060546875, -165.015625, -156.970703125, -148.92578125, -140.880859375, -132.8359375, -124.791015625, -116.74609375, -108.701171875, -100.65625, -92.611328125, -84.56640625, -76.521484375, -68.4765625, -60.431640625, -52.38671875, -44.341796875, -36.296875, -28.251953125, -20.20703125, -12.162109375, -4.1171875, 3.927734375, 11.97265625, 20.017578125, 28.0625, 36.107421875, 44.15234375, 52.197265625, 60.2421875, 68.287109375, 76.33203125, 84.376953125, 92.421875, 100.466796875, 108.51171875, 116.556640625, 124.6015625, 132.646484375, 140.69140625, 148.736328125, 156.78125, 164.826171875, 172.87109375, 180.916015625, 188.9609375, 197.005859375, 205.05078125, 213.095703125, 221.140625, 229.185546875, 237.23046875, 245.275390625, 253.3203125, 261.365234375, 269.41015625, 277.455078125, 285.5]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 29.0, 33.0, 126.0, 298.0, 297.0, 115.0, 46.0, 19.0, 6.0, 3.0, 7.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00786590576171875, -0.007452130317687988, -0.0070383548736572266, -0.006624579429626465, -0.006210803985595703, -0.005797028541564941, -0.00538325309753418, -0.004969477653503418, -0.004555702209472656, -0.0041419267654418945, -0.003728151321411133, -0.003314375877380371, -0.0029006004333496094, -0.0024868249893188477, -0.002073049545288086, -0.0016592741012573242, -0.0012454986572265625, -0.0008317232131958008, -0.00041794776916503906, -4.172325134277344e-06, 0.0004096031188964844, 0.0008233785629272461, 0.0012371540069580078, 0.0016509294509887695, 0.0020647048950195312, 0.002478480339050293, 0.0028922557830810547, 0.0033060312271118164, 0.003719806671142578, 0.00413358211517334, 0.0045473575592041016, 0.004961133003234863, 0.005374908447265625, 0.005788683891296387, 0.0062024593353271484, 0.00661623477935791, 0.007030010223388672, 0.007443785667419434, 0.007857561111450195, 0.008271336555480957, 0.008685111999511719, 0.00909888744354248, 0.009512662887573242, 0.009926438331604004, 0.010340213775634766, 0.010753989219665527, 0.011167764663696289, 0.01158154010772705, 0.011995315551757812, 0.012409090995788574, 0.012822866439819336, 0.013236641883850098, 0.01365041732788086, 0.014064192771911621, 0.014477968215942383, 0.014891743659973145, 0.015305519104003906, 0.015719294548034668, 0.01613306999206543, 0.01654684543609619, 0.016960620880126953, 0.017374396324157715, 0.017788171768188477, 0.01820194721221924, 0.01861572265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 6.0, 10.0, 19.0, 25.0, 58.0, 94.0, 248.0, 607.0, 2597.0, 63546.0, 971140.0, 8379.0, 1105.0, 366.0, 175.0, 68.0, 40.0, 21.0, 13.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-200.75, -193.642578125, -186.53515625, -179.427734375, -172.3203125, -165.212890625, -158.10546875, -150.998046875, -143.890625, -136.783203125, -129.67578125, -122.568359375, -115.4609375, -108.353515625, -101.24609375, -94.138671875, -87.03125, -79.923828125, -72.81640625, -65.708984375, -58.6015625, -51.494140625, -44.38671875, -37.279296875, -30.171875, -23.064453125, -15.95703125, -8.849609375, -1.7421875, 5.365234375, 12.47265625, 19.580078125, 26.6875, 33.794921875, 40.90234375, 48.009765625, 55.1171875, 62.224609375, 69.33203125, 76.439453125, 83.546875, 90.654296875, 97.76171875, 104.869140625, 111.9765625, 119.083984375, 126.19140625, 133.298828125, 140.40625, 147.513671875, 154.62109375, 161.728515625, 168.8359375, 175.943359375, 183.05078125, 190.158203125, 197.265625, 204.373046875, 211.48046875, 218.587890625, 225.6953125, 232.802734375, 239.91015625, 247.017578125, 254.125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 13.0, 29.0, 49.0, 125.0, 295.0, 261.0, 108.0, 47.0, 27.0, 16.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.6875, -104.1416015625, -99.595703125, -95.0498046875, -90.50390625, -85.9580078125, -81.412109375, -76.8662109375, -72.3203125, -67.7744140625, -63.228515625, -58.6826171875, -54.13671875, -49.5908203125, -45.044921875, -40.4990234375, -35.953125, -31.4072265625, -26.861328125, -22.3154296875, -17.76953125, -13.2236328125, -8.677734375, -4.1318359375, 0.4140625, 4.9599609375, 9.505859375, 14.0517578125, 18.59765625, 23.1435546875, 27.689453125, 32.2353515625, 36.78125, 41.3271484375, 45.873046875, 50.4189453125, 54.96484375, 59.5107421875, 64.056640625, 68.6025390625, 73.1484375, 77.6943359375, 82.240234375, 86.7861328125, 91.33203125, 95.8779296875, 100.423828125, 104.9697265625, 109.515625, 114.0615234375, 118.607421875, 123.1533203125, 127.69921875, 132.2451171875, 136.791015625, 141.3369140625, 145.8828125, 150.4287109375, 154.974609375, 159.5205078125, 164.06640625, 168.6123046875, 173.158203125, 177.7041015625, 182.25]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 14.0, 32.0, 110.0, 319.0, 321.0, 133.0, 41.0, 16.0, 10.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2501.990234375, -2452.849853515625, -2403.709228515625, -2354.56884765625, -2305.42822265625, -2256.287841796875, -2207.1474609375, -2158.0068359375, -2108.866455078125, -2059.72607421875, -2010.58544921875, -1961.445068359375, -1912.3045654296875, -1863.1640625, -1814.023681640625, -1764.8831787109375, -1715.74267578125, -1666.6021728515625, -1617.461669921875, -1568.3212890625, -1519.1807861328125, -1470.040283203125, -1420.89990234375, -1371.7593994140625, -1322.618896484375, -1273.4783935546875, -1224.337890625, -1175.197509765625, -1126.0570068359375, -1076.91650390625, -1027.776123046875, -978.6356201171875, -929.4950561523438, -880.3546142578125, -831.214111328125, -782.0736083984375, -732.9331665039062, -683.792724609375, -634.6522216796875, -585.51171875, -536.3712768554688, -487.2308044433594, -438.09033203125, -388.9498596191406, -339.80938720703125, -290.6689147949219, -241.5284423828125, -192.38796997070312, -143.24749755859375, -94.10702514648438, -44.966552734375, 4.173919677734375, 53.31439208984375, 102.45486450195312, 151.5953369140625, 200.73580932617188, 249.87628173828125, 299.0167541503906, 348.1572265625, 397.2976989746094, 446.43817138671875, 495.5786437988281, 544.7191162109375, 593.859619140625, 643.0000610351562]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 8.0, 6.0, 13.0, 12.0, 15.0, 19.0, 23.0, 24.0, 26.0, 21.0, 29.0, 33.0, 27.0, 29.0, 53.0, 42.0, 49.0, 39.0, 44.0, 50.0, 37.0, 34.0, 37.0, 43.0, 35.0, 33.0, 23.0, 25.0, 23.0, 17.0, 30.0, 18.0, 11.0, 8.0, 10.0, 11.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-404.33477783203125, -391.48724365234375, -378.63970947265625, -365.79217529296875, -352.94464111328125, -340.09710693359375, -327.24957275390625, -314.4020080566406, -301.5544738769531, -288.7069396972656, -275.8594055175781, -263.0118713378906, -250.16432189941406, -237.31678771972656, -224.46925354003906, -211.6217041015625, -198.77418518066406, -185.92665100097656, -173.07911682128906, -160.2315673828125, -147.384033203125, -134.5364990234375, -121.68896484375, -108.84142303466797, -95.99388885498047, -83.14635467529297, -70.29881286621094, -57.45127868652344, -44.60374069213867, -31.756202697753906, -18.908668518066406, -6.061126708984375, 6.786407470703125, 19.63394546508789, 32.481483459472656, 45.329017639160156, 58.17655563354492, 71.02409362792969, 83.87162780761719, 96.71916961669922, 109.56670379638672, 122.41423797607422, 135.26177978515625, 148.10931396484375, 160.95684814453125, 173.80438232421875, 186.65191650390625, 199.4994659423828, 212.3470001220703, 225.1945343017578, 238.0420684814453, 250.88961791992188, 263.7371520996094, 276.5846862792969, 289.4322204589844, 302.2797546386719, 315.1272888183594, 327.9748229980469, 340.8223571777344, 353.6698913574219, 366.5174255371094, 379.364990234375, 392.2125244140625, 405.06005859375, 417.9075927734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 14.0, 15.0, 19.0, 21.0, 47.0, 81.0, 155.0, 309.0, 652.0, 1675.0, 4283.0, 13808.0, 76324.0, 3837052.0, 225060.0, 24582.0, 6431.0, 2094.0, 828.0, 392.0, 194.0, 101.0, 60.0, 32.0, 22.0, 6.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5625, -87.0380859375, -83.513671875, -79.9892578125, -76.46484375, -72.9404296875, -69.416015625, -65.8916015625, -62.3671875, -58.8427734375, -55.318359375, -51.7939453125, -48.26953125, -44.7451171875, -41.220703125, -37.6962890625, -34.171875, -30.6474609375, -27.123046875, -23.5986328125, -20.07421875, -16.5498046875, -13.025390625, -9.5009765625, -5.9765625, -2.4521484375, 1.072265625, 4.5966796875, 8.12109375, 11.6455078125, 15.169921875, 18.6943359375, 22.21875, 25.7431640625, 29.267578125, 32.7919921875, 36.31640625, 39.8408203125, 43.365234375, 46.8896484375, 50.4140625, 53.9384765625, 57.462890625, 60.9873046875, 64.51171875, 68.0361328125, 71.560546875, 75.0849609375, 78.609375, 82.1337890625, 85.658203125, 89.1826171875, 92.70703125, 96.2314453125, 99.755859375, 103.2802734375, 106.8046875, 110.3291015625, 113.853515625, 117.3779296875, 120.90234375, 124.4267578125, 127.951171875, 131.4755859375, 135.0]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 2.0, 5.0, 9.0, 14.0, 20.0, 17.0, 20.0, 21.0, 27.0, 32.0, 30.0, 27.0, 47.0, 59.0, 53.0, 45.0, 58.0, 67.0, 49.0, 54.0, 50.0, 48.0, 42.0, 32.0, 33.0, 30.0, 30.0, 13.0, 9.0, 13.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.402099609375, -18.72607421875, -18.050048828125, -17.3740234375, -16.697998046875, -16.02197265625, -15.345947265625, -14.669921875, -13.993896484375, -13.31787109375, -12.641845703125, -11.9658203125, -11.289794921875, -10.61376953125, -9.937744140625, -9.26171875, -8.585693359375, -7.90966796875, -7.233642578125, -6.5576171875, -5.881591796875, -5.20556640625, -4.529541015625, -3.853515625, -3.177490234375, -2.50146484375, -1.825439453125, -1.1494140625, -0.473388671875, 0.20263671875, 0.878662109375, 1.5546875, 2.230712890625, 2.90673828125, 3.582763671875, 4.2587890625, 4.934814453125, 5.61083984375, 6.286865234375, 6.962890625, 7.638916015625, 8.31494140625, 8.990966796875, 9.6669921875, 10.343017578125, 11.01904296875, 11.695068359375, 12.37109375, 13.047119140625, 13.72314453125, 14.399169921875, 15.0751953125, 15.751220703125, 16.42724609375, 17.103271484375, 17.779296875, 18.455322265625, 19.13134765625, 19.807373046875, 20.4833984375, 21.159423828125, 21.83544921875, 22.511474609375, 23.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 5.0, 11.0, 11.0, 17.0, 14.0, 30.0, 43.0, 76.0, 118.0, 249.0, 551.0, 1095.0, 2579.0, 6931.0, 23805.0, 147234.0, 3745458.0, 222596.0, 29558.0, 8156.0, 3059.0, 1297.0, 638.0, 320.0, 172.0, 94.0, 55.0, 34.0, 26.0, 14.0, 15.0, 6.0, 3.0, 7.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-76.3125, -73.732421875, -71.15234375, -68.572265625, -65.9921875, -63.412109375, -60.83203125, -58.251953125, -55.671875, -53.091796875, -50.51171875, -47.931640625, -45.3515625, -42.771484375, -40.19140625, -37.611328125, -35.03125, -32.451171875, -29.87109375, -27.291015625, -24.7109375, -22.130859375, -19.55078125, -16.970703125, -14.390625, -11.810546875, -9.23046875, -6.650390625, -4.0703125, -1.490234375, 1.08984375, 3.669921875, 6.25, 8.830078125, 11.41015625, 13.990234375, 16.5703125, 19.150390625, 21.73046875, 24.310546875, 26.890625, 29.470703125, 32.05078125, 34.630859375, 37.2109375, 39.791015625, 42.37109375, 44.951171875, 47.53125, 50.111328125, 52.69140625, 55.271484375, 57.8515625, 60.431640625, 63.01171875, 65.591796875, 68.171875, 70.751953125, 73.33203125, 75.912109375, 78.4921875, 81.072265625, 83.65234375, 86.232421875, 88.8125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 8.0, 3.0, 15.0, 8.0, 13.0, 33.0, 45.0, 51.0, 87.0, 159.0, 346.0, 2023.0, 674.0, 265.0, 100.0, 76.0, 37.0, 26.0, 21.0, 21.0, 5.0, 11.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.404541015625, -23.41845703125, -22.432373046875, -21.4462890625, -20.460205078125, -19.47412109375, -18.488037109375, -17.501953125, -16.515869140625, -15.52978515625, -14.543701171875, -13.5576171875, -12.571533203125, -11.58544921875, -10.599365234375, -9.61328125, -8.627197265625, -7.64111328125, -6.655029296875, -5.6689453125, -4.682861328125, -3.69677734375, -2.710693359375, -1.724609375, -0.738525390625, 0.24755859375, 1.233642578125, 2.2197265625, 3.205810546875, 4.19189453125, 5.177978515625, 6.1640625, 7.150146484375, 8.13623046875, 9.122314453125, 10.1083984375, 11.094482421875, 12.08056640625, 13.066650390625, 14.052734375, 15.038818359375, 16.02490234375, 17.010986328125, 17.9970703125, 18.983154296875, 19.96923828125, 20.955322265625, 21.94140625, 22.927490234375, 23.91357421875, 24.899658203125, 25.8857421875, 26.871826171875, 27.85791015625, 28.843994140625, 29.830078125, 30.816162109375, 31.80224609375, 32.788330078125, 33.7744140625, 34.760498046875, 35.74658203125, 36.732666015625, 37.71875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 10.0, 69.0, 524.0, 353.0, 35.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-752.4171142578125, -729.530029296875, -706.6429443359375, -683.755859375, -660.8688354492188, -637.9817504882812, -615.0946655273438, -592.2075805664062, -569.320556640625, -546.4334716796875, -523.54638671875, -500.6593322753906, -477.77227783203125, -454.88519287109375, -431.99810791015625, -409.11102294921875, -386.22393798828125, -363.33685302734375, -340.4497985839844, -317.5627136230469, -294.6756591796875, -271.78857421875, -248.9014892578125, -226.01441955566406, -203.12734985351562, -180.2402801513672, -157.35321044921875, -134.46612548828125, -111.57905578613281, -88.69198608398438, -65.80490112304688, -42.91783142089844, -20.03076171875, 2.856311798095703, 25.743385314941406, 48.630462646484375, 71.51753234863281, 94.40460205078125, 117.29168701171875, 140.1787567138672, 163.06582641601562, 185.95289611816406, 208.8399658203125, 231.72705078125, 254.61412048339844, 277.5011901855469, 300.3882751464844, 323.27532958984375, 346.16241455078125, 369.04949951171875, 391.9365539550781, 414.8236389160156, 437.710693359375, 460.5977783203125, 483.48486328125, 506.3719482421875, 529.259033203125, 552.1461181640625, 575.033203125, 597.9202880859375, 620.8073120117188, 643.6943969726562, 666.5814819335938, 689.4685668945312, 712.3555908203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 15.0, 19.0, 16.0, 24.0, 27.0, 45.0, 40.0, 62.0, 62.0, 60.0, 56.0, 77.0, 52.0, 83.0, 65.0, 48.0, 51.0, 47.0, 40.0, 21.0, 22.0, 13.0, 14.0, 12.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.28091430664062, -78.82987976074219, -74.37885284423828, -69.92781829833984, -65.4767837524414, -61.025753021240234, -56.57472229003906, -52.123687744140625, -47.67265701293945, -43.22162628173828, -38.770591735839844, -34.31956100463867, -29.868528366088867, -25.417495727539062, -20.96646499633789, -16.515432357788086, -12.064399719238281, -7.613367557525635, -3.1623353958129883, 1.2886962890625, 5.739728927612305, 10.19076156616211, 14.641792297363281, 19.092824935913086, 23.54385757446289, 27.994890213012695, 32.4459228515625, 36.89695358276367, 41.347984313964844, 45.79901885986328, 50.25004959106445, 54.701080322265625, 59.15211486816406, 63.603145599365234, 68.0541763305664, 72.50521087646484, 76.95624542236328, 81.40727233886719, 85.85830688476562, 90.30934143066406, 94.7603759765625, 99.21141052246094, 103.66243743896484, 108.11347198486328, 112.56450653076172, 117.01553344726562, 121.46656799316406, 125.9176025390625, 130.36862182617188, 134.8196563720703, 139.27069091796875, 143.72171020507812, 148.17274475097656, 152.623779296875, 157.07481384277344, 161.52584838867188, 165.9768829345703, 170.42791748046875, 174.8789520263672, 179.32998657226562, 183.781005859375, 188.23204040527344, 192.68307495117188, 197.1341094970703, 201.58514404296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 9.0, 22.0, 24.0, 32.0, 63.0, 82.0, 143.0, 224.0, 417.0, 881.0, 1979.0, 5758.0, 20581.0, 93602.0, 513544.0, 330763.0, 59132.0, 13791.0, 4261.0, 1633.0, 719.0, 366.0, 175.0, 122.0, 76.0, 48.0, 30.0, 21.0, 25.0, 11.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4375, -64.4873046875, -61.537109375, -58.5869140625, -55.63671875, -52.6865234375, -49.736328125, -46.7861328125, -43.8359375, -40.8857421875, -37.935546875, -34.9853515625, -32.03515625, -29.0849609375, -26.134765625, -23.1845703125, -20.234375, -17.2841796875, -14.333984375, -11.3837890625, -8.43359375, -5.4833984375, -2.533203125, 0.4169921875, 3.3671875, 6.3173828125, 9.267578125, 12.2177734375, 15.16796875, 18.1181640625, 21.068359375, 24.0185546875, 26.96875, 29.9189453125, 32.869140625, 35.8193359375, 38.76953125, 41.7197265625, 44.669921875, 47.6201171875, 50.5703125, 53.5205078125, 56.470703125, 59.4208984375, 62.37109375, 65.3212890625, 68.271484375, 71.2216796875, 74.171875, 77.1220703125, 80.072265625, 83.0224609375, 85.97265625, 88.9228515625, 91.873046875, 94.8232421875, 97.7734375, 100.7236328125, 103.673828125, 106.6240234375, 109.57421875, 112.5244140625, 115.474609375, 118.4248046875, 121.375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 14.0, 10.0, 14.0, 15.0, 27.0, 29.0, 35.0, 41.0, 39.0, 44.0, 64.0, 64.0, 59.0, 78.0, 60.0, 75.0, 66.0, 44.0, 48.0, 39.0, 31.0, 25.0, 21.0, 13.0, 7.0, 9.0, 10.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.25, -21.431884765625, -20.61376953125, -19.795654296875, -18.9775390625, -18.159423828125, -17.34130859375, -16.523193359375, -15.705078125, -14.886962890625, -14.06884765625, -13.250732421875, -12.4326171875, -11.614501953125, -10.79638671875, -9.978271484375, -9.16015625, -8.342041015625, -7.52392578125, -6.705810546875, -5.8876953125, -5.069580078125, -4.25146484375, -3.433349609375, -2.615234375, -1.797119140625, -0.97900390625, -0.160888671875, 0.6572265625, 1.475341796875, 2.29345703125, 3.111572265625, 3.9296875, 4.747802734375, 5.56591796875, 6.384033203125, 7.2021484375, 8.020263671875, 8.83837890625, 9.656494140625, 10.474609375, 11.292724609375, 12.11083984375, 12.928955078125, 13.7470703125, 14.565185546875, 15.38330078125, 16.201416015625, 17.01953125, 17.837646484375, 18.65576171875, 19.473876953125, 20.2919921875, 21.110107421875, 21.92822265625, 22.746337890625, 23.564453125, 24.382568359375, 25.20068359375, 26.018798828125, 26.8369140625, 27.655029296875, 28.47314453125, 29.291259765625, 30.109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 11.0, 15.0, 30.0, 54.0, 62.0, 91.0, 137.0, 239.0, 466.0, 887.0, 2572.0, 13655.0, 165908.0, 787954.0, 65904.0, 7260.0, 1595.0, 709.0, 337.0, 212.0, 136.0, 94.0, 73.0, 47.0, 28.0, 25.0, 13.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-149.625, -145.13671875, -140.6484375, -136.16015625, -131.671875, -127.18359375, -122.6953125, -118.20703125, -113.71875, -109.23046875, -104.7421875, -100.25390625, -95.765625, -91.27734375, -86.7890625, -82.30078125, -77.8125, -73.32421875, -68.8359375, -64.34765625, -59.859375, -55.37109375, -50.8828125, -46.39453125, -41.90625, -37.41796875, -32.9296875, -28.44140625, -23.953125, -19.46484375, -14.9765625, -10.48828125, -6.0, -1.51171875, 2.9765625, 7.46484375, 11.953125, 16.44140625, 20.9296875, 25.41796875, 29.90625, 34.39453125, 38.8828125, 43.37109375, 47.859375, 52.34765625, 56.8359375, 61.32421875, 65.8125, 70.30078125, 74.7890625, 79.27734375, 83.765625, 88.25390625, 92.7421875, 97.23046875, 101.71875, 106.20703125, 110.6953125, 115.18359375, 119.671875, 124.16015625, 128.6484375, 133.13671875, 137.625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 16.0, 9.0, 12.0, 9.0, 18.0, 17.0, 29.0, 27.0, 41.0, 63.0, 47.0, 66.0, 60.0, 74.0, 43.0, 72.0, 69.0, 51.0, 56.0, 52.0, 30.0, 25.0, 27.0, 17.0, 19.0, 25.0, 10.0, 5.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-124.5, -121.07421875, -117.6484375, -114.22265625, -110.796875, -107.37109375, -103.9453125, -100.51953125, -97.09375, -93.66796875, -90.2421875, -86.81640625, -83.390625, -79.96484375, -76.5390625, -73.11328125, -69.6875, -66.26171875, -62.8359375, -59.41015625, -55.984375, -52.55859375, -49.1328125, -45.70703125, -42.28125, -38.85546875, -35.4296875, -32.00390625, -28.578125, -25.15234375, -21.7265625, -18.30078125, -14.875, -11.44921875, -8.0234375, -4.59765625, -1.171875, 2.25390625, 5.6796875, 9.10546875, 12.53125, 15.95703125, 19.3828125, 22.80859375, 26.234375, 29.66015625, 33.0859375, 36.51171875, 39.9375, 43.36328125, 46.7890625, 50.21484375, 53.640625, 57.06640625, 60.4921875, 63.91796875, 67.34375, 70.76953125, 74.1953125, 77.62109375, 81.046875, 84.47265625, 87.8984375, 91.32421875, 94.75]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 18.0, 27.0, 55.0, 74.0, 100.0, 167.0, 293.0, 668.0, 1840.0, 7531.0, 62749.0, 850400.0, 110465.0, 10219.0, 2285.0, 814.0, 310.0, 199.0, 116.0, 54.0, 42.0, 24.0, 21.0, 17.0, 10.0, 9.0, 5.0, 3.0, 8.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.65625, -51.90234375, -50.1484375, -48.39453125, -46.640625, -44.88671875, -43.1328125, -41.37890625, -39.625, -37.87109375, -36.1171875, -34.36328125, -32.609375, -30.85546875, -29.1015625, -27.34765625, -25.59375, -23.83984375, -22.0859375, -20.33203125, -18.578125, -16.82421875, -15.0703125, -13.31640625, -11.5625, -9.80859375, -8.0546875, -6.30078125, -4.546875, -2.79296875, -1.0390625, 0.71484375, 2.46875, 4.22265625, 5.9765625, 7.73046875, 9.484375, 11.23828125, 12.9921875, 14.74609375, 16.5, 18.25390625, 20.0078125, 21.76171875, 23.515625, 25.26953125, 27.0234375, 28.77734375, 30.53125, 32.28515625, 34.0390625, 35.79296875, 37.546875, 39.30078125, 41.0546875, 42.80859375, 44.5625, 46.31640625, 48.0703125, 49.82421875, 51.578125, 53.33203125, 55.0859375, 56.83984375, 58.59375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 17.0, 17.0, 28.0, 38.0, 58.0, 91.0, 150.0, 178.0, 139.0, 71.0, 54.0, 43.0, 20.0, 19.0, 16.0, 7.0, 5.0, 3.0, 7.0, 1.0, 6.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00469970703125, -0.004567146301269531, -0.0044345855712890625, -0.004302024841308594, -0.004169464111328125, -0.004036903381347656, -0.0039043426513671875, -0.0037717819213867188, -0.00363922119140625, -0.0035066604614257812, -0.0033740997314453125, -0.0032415390014648438, -0.003108978271484375, -0.0029764175415039062, -0.0028438568115234375, -0.0027112960815429688, -0.0025787353515625, -0.0024461746215820312, -0.0023136138916015625, -0.0021810531616210938, -0.002048492431640625, -0.0019159317016601562, -0.0017833709716796875, -0.0016508102416992188, -0.00151824951171875, -0.0013856887817382812, -0.0012531280517578125, -0.0011205673217773438, -0.000988006591796875, -0.0008554458618164062, -0.0007228851318359375, -0.0005903244018554688, -0.000457763671875, -0.00032520294189453125, -0.0001926422119140625, -6.008148193359375e-05, 7.2479248046875e-05, 0.00020503997802734375, 0.0003376007080078125, 0.00047016143798828125, 0.00060272216796875, 0.0007352828979492188, 0.0008678436279296875, 0.0010004043579101562, 0.001132965087890625, 0.0012655258178710938, 0.0013980865478515625, 0.0015306472778320312, 0.0016632080078125, 0.0017957687377929688, 0.0019283294677734375, 0.0020608901977539062, 0.002193450927734375, 0.0023260116577148438, 0.0024585723876953125, 0.0025911331176757812, 0.00272369384765625, 0.0028562545776367188, 0.0029888153076171875, 0.0031213760375976562, 0.003253936767578125, 0.0033864974975585938, 0.0035190582275390625, 0.0036516189575195312, 0.0037841796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 13.0, 18.0, 23.0, 57.0, 88.0, 158.0, 402.0, 1122.0, 8676.0, 501210.0, 525776.0, 9088.0, 1177.0, 377.0, 169.0, 87.0, 55.0, 20.0, 16.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.125, -67.86328125, -65.6015625, -63.33984375, -61.078125, -58.81640625, -56.5546875, -54.29296875, -52.03125, -49.76953125, -47.5078125, -45.24609375, -42.984375, -40.72265625, -38.4609375, -36.19921875, -33.9375, -31.67578125, -29.4140625, -27.15234375, -24.890625, -22.62890625, -20.3671875, -18.10546875, -15.84375, -13.58203125, -11.3203125, -9.05859375, -6.796875, -4.53515625, -2.2734375, -0.01171875, 2.25, 4.51171875, 6.7734375, 9.03515625, 11.296875, 13.55859375, 15.8203125, 18.08203125, 20.34375, 22.60546875, 24.8671875, 27.12890625, 29.390625, 31.65234375, 33.9140625, 36.17578125, 38.4375, 40.69921875, 42.9609375, 45.22265625, 47.484375, 49.74609375, 52.0078125, 54.26953125, 56.53125, 58.79296875, 61.0546875, 63.31640625, 65.578125, 67.83984375, 70.1015625, 72.36328125, 74.625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 12.0, 8.0, 14.0, 21.0, 43.0, 73.0, 138.0, 234.0, 203.0, 105.0, 55.0, 39.0, 19.0, 12.0, 13.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.875, -74.10546875, -72.3359375, -70.56640625, -68.796875, -67.02734375, -65.2578125, -63.48828125, -61.71875, -59.94921875, -58.1796875, -56.41015625, -54.640625, -52.87109375, -51.1015625, -49.33203125, -47.5625, -45.79296875, -44.0234375, -42.25390625, -40.484375, -38.71484375, -36.9453125, -35.17578125, -33.40625, -31.63671875, -29.8671875, -28.09765625, -26.328125, -24.55859375, -22.7890625, -21.01953125, -19.25, -17.48046875, -15.7109375, -13.94140625, -12.171875, -10.40234375, -8.6328125, -6.86328125, -5.09375, -3.32421875, -1.5546875, 0.21484375, 1.984375, 3.75390625, 5.5234375, 7.29296875, 9.0625, 10.83203125, 12.6015625, 14.37109375, 16.140625, 17.91015625, 19.6796875, 21.44921875, 23.21875, 24.98828125, 26.7578125, 28.52734375, 30.296875, 32.06640625, 33.8359375, 35.60546875, 37.375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 7.0, 8.0, 32.0, 106.0, 329.0, 360.0, 115.0, 33.0, 9.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-607.0286254882812, -566.983154296875, -526.9376831054688, -486.8922424316406, -446.8467712402344, -406.8013000488281, -366.755859375, -326.71038818359375, -286.6649169921875, -246.61944580078125, -206.57398986816406, -166.52853393554688, -126.48306274414062, -86.43759155273438, -46.39213562011719, -6.3466796875, 33.69879150390625, 73.74425506591797, 113.78971862792969, 153.83517456054688, 193.88064575195312, 233.92611694335938, 273.9715576171875, 314.01702880859375, 354.0625, 394.10797119140625, 434.1534423828125, 474.1988830566406, 514.244384765625, 554.289794921875, 594.3352661132812, 634.3807373046875, 674.42626953125, 714.4717407226562, 754.5172119140625, 794.5626831054688, 834.608154296875, 874.653564453125, 914.6990356445312, 954.7445068359375, 994.7899780273438, 1034.83544921875, 1074.880859375, 1114.9263916015625, 1154.9718017578125, 1195.017333984375, 1235.062744140625, 1275.108154296875, 1315.1536865234375, 1355.1990966796875, 1395.24462890625, 1435.2900390625, 1475.3355712890625, 1515.3809814453125, 1555.426513671875, 1595.471923828125, 1635.517333984375, 1675.562744140625, 1715.6082763671875, 1755.6536865234375, 1795.69921875, 1835.74462890625, 1875.7901611328125, 1915.8355712890625, 1955.881103515625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 13.0, 7.0, 10.0, 16.0, 22.0, 24.0, 18.0, 21.0, 31.0, 28.0, 26.0, 36.0, 38.0, 36.0, 40.0, 34.0, 30.0, 38.0, 42.0, 44.0, 44.0, 44.0, 36.0, 31.0, 30.0, 32.0, 25.0, 20.0, 35.0, 26.0, 16.0, 12.0, 12.0, 13.0, 8.0, 11.0, 11.0, 7.0, 5.0, 3.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.5924072265625, -367.0968933105469, -355.60137939453125, -344.1058654785156, -332.6103515625, -321.1148376464844, -309.61932373046875, -298.1238098144531, -286.6282958984375, -275.1327819824219, -263.63726806640625, -252.14175415039062, -240.646240234375, -229.15072631835938, -217.65521240234375, -206.15969848632812, -194.66416931152344, -183.1686553955078, -171.6731414794922, -160.17762756347656, -148.68211364746094, -137.1865997314453, -125.69107818603516, -114.19556427001953, -102.7000503540039, -91.20453643798828, -79.70902252197266, -68.2135009765625, -56.71799087524414, -45.222476959228516, -33.726959228515625, -22.2314453125, -10.735931396484375, 0.7595834732055664, 12.255098342895508, 23.750614166259766, 35.24612808227539, 46.741641998291016, 58.237159729003906, 69.73267364501953, 81.22818756103516, 92.72370147705078, 104.2192153930664, 115.71473693847656, 127.21025085449219, 138.7057647705078, 150.20127868652344, 161.69679260253906, 173.1923065185547, 184.6878204345703, 196.18333435058594, 207.67884826660156, 219.1743621826172, 230.6698760986328, 242.1654052734375, 253.66091918945312, 265.15643310546875, 276.6519470214844, 288.1474609375, 299.6429748535156, 311.13848876953125, 322.6340026855469, 334.1295166015625, 345.6250305175781, 357.12054443359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 32.0, 64.0, 163.0, 305.0, 844.0, 2589.0, 13793.0, 343062.0, 3807299.0, 20917.0, 3553.0, 927.0, 364.0, 150.0, 76.0, 41.0, 21.0, 20.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-164.0, -156.578125, -149.15625, -141.734375, -134.3125, -126.890625, -119.46875, -112.046875, -104.625, -97.203125, -89.78125, -82.359375, -74.9375, -67.515625, -60.09375, -52.671875, -45.25, -37.828125, -30.40625, -22.984375, -15.5625, -8.140625, -0.71875, 6.703125, 14.125, 21.546875, 28.96875, 36.390625, 43.8125, 51.234375, 58.65625, 66.078125, 73.5, 80.921875, 88.34375, 95.765625, 103.1875, 110.609375, 118.03125, 125.453125, 132.875, 140.296875, 147.71875, 155.140625, 162.5625, 169.984375, 177.40625, 184.828125, 192.25, 199.671875, 207.09375, 214.515625, 221.9375, 229.359375, 236.78125, 244.203125, 251.625, 259.046875, 266.46875, 273.890625, 281.3125, 288.734375, 296.15625, 303.578125, 311.0]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 13.0, 11.0, 14.0, 10.0, 14.0, 29.0, 25.0, 46.0, 39.0, 40.0, 46.0, 83.0, 64.0, 42.0, 69.0, 71.0, 57.0, 60.0, 40.0, 40.0, 41.0, 25.0, 18.0, 29.0, 20.0, 11.0, 13.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.85205078125, -20.0166015625, -19.18115234375, -18.345703125, -17.51025390625, -16.6748046875, -15.83935546875, -15.00390625, -14.16845703125, -13.3330078125, -12.49755859375, -11.662109375, -10.82666015625, -9.9912109375, -9.15576171875, -8.3203125, -7.48486328125, -6.6494140625, -5.81396484375, -4.978515625, -4.14306640625, -3.3076171875, -2.47216796875, -1.63671875, -0.80126953125, 0.0341796875, 0.86962890625, 1.705078125, 2.54052734375, 3.3759765625, 4.21142578125, 5.046875, 5.88232421875, 6.7177734375, 7.55322265625, 8.388671875, 9.22412109375, 10.0595703125, 10.89501953125, 11.73046875, 12.56591796875, 13.4013671875, 14.23681640625, 15.072265625, 15.90771484375, 16.7431640625, 17.57861328125, 18.4140625, 19.24951171875, 20.0849609375, 20.92041015625, 21.755859375, 22.59130859375, 23.4267578125, 24.26220703125, 25.09765625, 25.93310546875, 26.7685546875, 27.60400390625, 28.439453125, 29.27490234375, 30.1103515625, 30.94580078125, 31.78125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 9.0, 13.0, 16.0, 25.0, 46.0, 78.0, 159.0, 292.0, 598.0, 1400.0, 3499.0, 11189.0, 54028.0, 3346869.0, 719334.0, 41399.0, 9538.0, 3251.0, 1262.0, 607.0, 276.0, 166.0, 87.0, 43.0, 31.0, 23.0, 11.0, 8.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.375, -80.990234375, -77.60546875, -74.220703125, -70.8359375, -67.451171875, -64.06640625, -60.681640625, -57.296875, -53.912109375, -50.52734375, -47.142578125, -43.7578125, -40.373046875, -36.98828125, -33.603515625, -30.21875, -26.833984375, -23.44921875, -20.064453125, -16.6796875, -13.294921875, -9.91015625, -6.525390625, -3.140625, 0.244140625, 3.62890625, 7.013671875, 10.3984375, 13.783203125, 17.16796875, 20.552734375, 23.9375, 27.322265625, 30.70703125, 34.091796875, 37.4765625, 40.861328125, 44.24609375, 47.630859375, 51.015625, 54.400390625, 57.78515625, 61.169921875, 64.5546875, 67.939453125, 71.32421875, 74.708984375, 78.09375, 81.478515625, 84.86328125, 88.248046875, 91.6328125, 95.017578125, 98.40234375, 101.787109375, 105.171875, 108.556640625, 111.94140625, 115.326171875, 118.7109375, 122.095703125, 125.48046875, 128.865234375, 132.25]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 16.0, 18.0, 31.0, 40.0, 78.0, 121.0, 317.0, 2651.0, 440.0, 134.0, 57.0, 51.0, 26.0, 18.0, 11.0, 16.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.1875, -33.75634765625, -32.3251953125, -30.89404296875, -29.462890625, -28.03173828125, -26.6005859375, -25.16943359375, -23.73828125, -22.30712890625, -20.8759765625, -19.44482421875, -18.013671875, -16.58251953125, -15.1513671875, -13.72021484375, -12.2890625, -10.85791015625, -9.4267578125, -7.99560546875, -6.564453125, -5.13330078125, -3.7021484375, -2.27099609375, -0.83984375, 0.59130859375, 2.0224609375, 3.45361328125, 4.884765625, 6.31591796875, 7.7470703125, 9.17822265625, 10.609375, 12.04052734375, 13.4716796875, 14.90283203125, 16.333984375, 17.76513671875, 19.1962890625, 20.62744140625, 22.05859375, 23.48974609375, 24.9208984375, 26.35205078125, 27.783203125, 29.21435546875, 30.6455078125, 32.07666015625, 33.5078125, 34.93896484375, 36.3701171875, 37.80126953125, 39.232421875, 40.66357421875, 42.0947265625, 43.52587890625, 44.95703125, 46.38818359375, 47.8193359375, 49.25048828125, 50.681640625, 52.11279296875, 53.5439453125, 54.97509765625, 56.40625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 17.0, 64.0, 378.0, 444.0, 81.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.39041137695312, -213.36802673339844, -194.34564208984375, -175.32327270507812, -156.30088806152344, -137.27850341796875, -118.2561264038086, -99.23374938964844, -80.21136474609375, -61.18898391723633, -42.166603088378906, -23.144222259521484, -4.1218414306640625, 14.900543212890625, 33.92292022705078, 52.94529724121094, 71.96768188476562, 90.99006652832031, 110.01244354248047, 129.03482055664062, 148.0572052001953, 167.07958984375, 186.10195922851562, 205.1243438720703, 224.146728515625, 243.1691131591797, 262.1914978027344, 281.2138671875, 300.23626708984375, 319.2586364746094, 338.281005859375, 357.30340576171875, 376.32574462890625, 395.3481140136719, 414.3705139160156, 433.39288330078125, 452.415283203125, 471.4376525878906, 490.46002197265625, 509.482421875, 528.5047607421875, 547.5271606445312, 566.5494995117188, 585.5718994140625, 604.5942993164062, 623.61669921875, 642.6390380859375, 661.6614379882812, 680.683837890625, 699.7062377929688, 718.7285766601562, 737.7509765625, 756.7733764648438, 775.7957763671875, 794.818115234375, 813.8405151367188, 832.8629150390625, 851.8853149414062, 870.9076538085938, 889.9300537109375, 908.9524536132812, 927.974853515625, 946.9971923828125, 966.0195922851562, 985.0419311523438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 8.0, 8.0, 22.0, 34.0, 44.0, 52.0, 76.0, 80.0, 86.0, 103.0, 93.0, 98.0, 80.0, 61.0, 52.0, 41.0, 25.0, 14.0, 9.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.13246154785156, -152.6924591064453, -145.25247192382812, -137.81246948242188, -130.37246704101562, -122.93247985839844, -115.49247741699219, -108.05248260498047, -100.61248779296875, -93.17249298095703, -85.73249816894531, -78.29249572753906, -70.85250091552734, -63.412506103515625, -55.97250747680664, -48.532508850097656, -41.09251403808594, -33.65251922607422, -26.212520599365234, -18.772523880004883, -11.332527160644531, -3.8925323486328125, 3.547466278076172, 10.987464904785156, 18.427459716796875, 25.867456436157227, 33.30745315551758, 40.74745178222656, 48.18744659423828, 55.62744140625, 63.067440032958984, 70.50743865966797, 77.94741821289062, 85.38741302490234, 92.82740783691406, 100.26741027832031, 107.70740509033203, 115.14739990234375, 122.58740234375, 130.02740478515625, 137.46739196777344, 144.9073944091797, 152.34738159179688, 159.78738403320312, 167.22738647460938, 174.66737365722656, 182.1073760986328, 189.54736328125, 196.98736572265625, 204.4273681640625, 211.8673553466797, 219.30735778808594, 226.74734497070312, 234.18734741210938, 241.62734985351562, 249.06735229492188, 256.50732421875, 263.94732666015625, 271.3873291015625, 278.8273010253906, 286.2673034667969, 293.7073059082031, 301.1473083496094, 308.5873107910156, 316.0273132324219]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 15.0, 17.0, 26.0, 37.0, 58.0, 94.0, 160.0, 225.0, 454.0, 891.0, 1984.0, 4638.0, 13720.0, 47017.0, 194553.0, 522877.0, 192581.0, 46834.0, 13629.0, 4737.0, 1929.0, 913.0, 490.0, 267.0, 162.0, 95.0, 60.0, 31.0, 24.0, 13.0, 6.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.0, -92.9521484375, -89.904296875, -86.8564453125, -83.80859375, -80.7607421875, -77.712890625, -74.6650390625, -71.6171875, -68.5693359375, -65.521484375, -62.4736328125, -59.42578125, -56.3779296875, -53.330078125, -50.2822265625, -47.234375, -44.1865234375, -41.138671875, -38.0908203125, -35.04296875, -31.9951171875, -28.947265625, -25.8994140625, -22.8515625, -19.8037109375, -16.755859375, -13.7080078125, -10.66015625, -7.6123046875, -4.564453125, -1.5166015625, 1.53125, 4.5791015625, 7.626953125, 10.6748046875, 13.72265625, 16.7705078125, 19.818359375, 22.8662109375, 25.9140625, 28.9619140625, 32.009765625, 35.0576171875, 38.10546875, 41.1533203125, 44.201171875, 47.2490234375, 50.296875, 53.3447265625, 56.392578125, 59.4404296875, 62.48828125, 65.5361328125, 68.583984375, 71.6318359375, 74.6796875, 77.7275390625, 80.775390625, 83.8232421875, 86.87109375, 89.9189453125, 92.966796875, 96.0146484375, 99.0625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 11.0, 12.0, 21.0, 18.0, 16.0, 28.0, 40.0, 49.0, 54.0, 69.0, 72.0, 53.0, 83.0, 74.0, 68.0, 89.0, 56.0, 42.0, 35.0, 29.0, 16.0, 23.0, 14.0, 14.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -19.96044921875, -18.9833984375, -18.00634765625, -17.029296875, -16.05224609375, -15.0751953125, -14.09814453125, -13.12109375, -12.14404296875, -11.1669921875, -10.18994140625, -9.212890625, -8.23583984375, -7.2587890625, -6.28173828125, -5.3046875, -4.32763671875, -3.3505859375, -2.37353515625, -1.396484375, -0.41943359375, 0.5576171875, 1.53466796875, 2.51171875, 3.48876953125, 4.4658203125, 5.44287109375, 6.419921875, 7.39697265625, 8.3740234375, 9.35107421875, 10.328125, 11.30517578125, 12.2822265625, 13.25927734375, 14.236328125, 15.21337890625, 16.1904296875, 17.16748046875, 18.14453125, 19.12158203125, 20.0986328125, 21.07568359375, 22.052734375, 23.02978515625, 24.0068359375, 24.98388671875, 25.9609375, 26.93798828125, 27.9150390625, 28.89208984375, 29.869140625, 30.84619140625, 31.8232421875, 32.80029296875, 33.77734375, 34.75439453125, 35.7314453125, 36.70849609375, 37.685546875, 38.66259765625, 39.6396484375, 40.61669921875, 41.59375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 7.0, 15.0, 21.0, 24.0, 34.0, 37.0, 68.0, 70.0, 113.0, 156.0, 193.0, 310.0, 412.0, 646.0, 1173.0, 3263.0, 18975.0, 256479.0, 703385.0, 52388.0, 6421.0, 1799.0, 839.0, 488.0, 322.0, 258.0, 181.0, 108.0, 106.0, 60.0, 57.0, 35.0, 28.0, 12.0, 13.0, 12.0, 14.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-154.125, -149.1875, -144.25, -139.3125, -134.375, -129.4375, -124.5, -119.5625, -114.625, -109.6875, -104.75, -99.8125, -94.875, -89.9375, -85.0, -80.0625, -75.125, -70.1875, -65.25, -60.3125, -55.375, -50.4375, -45.5, -40.5625, -35.625, -30.6875, -25.75, -20.8125, -15.875, -10.9375, -6.0, -1.0625, 3.875, 8.8125, 13.75, 18.6875, 23.625, 28.5625, 33.5, 38.4375, 43.375, 48.3125, 53.25, 58.1875, 63.125, 68.0625, 73.0, 77.9375, 82.875, 87.8125, 92.75, 97.6875, 102.625, 107.5625, 112.5, 117.4375, 122.375, 127.3125, 132.25, 137.1875, 142.125, 147.0625, 152.0, 156.9375, 161.875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 8.0, 11.0, 11.0, 16.0, 20.0, 16.0, 38.0, 34.0, 40.0, 46.0, 55.0, 45.0, 48.0, 59.0, 38.0, 43.0, 51.0, 65.0, 46.0, 37.0, 28.0, 34.0, 28.0, 23.0, 16.0, 24.0, 20.0, 13.0, 6.0, 12.0, 9.0, 5.0, 6.0, 0.0, 2.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-91.5, -88.4140625, -85.328125, -82.2421875, -79.15625, -76.0703125, -72.984375, -69.8984375, -66.8125, -63.7265625, -60.640625, -57.5546875, -54.46875, -51.3828125, -48.296875, -45.2109375, -42.125, -39.0390625, -35.953125, -32.8671875, -29.78125, -26.6953125, -23.609375, -20.5234375, -17.4375, -14.3515625, -11.265625, -8.1796875, -5.09375, -2.0078125, 1.078125, 4.1640625, 7.25, 10.3359375, 13.421875, 16.5078125, 19.59375, 22.6796875, 25.765625, 28.8515625, 31.9375, 35.0234375, 38.109375, 41.1953125, 44.28125, 47.3671875, 50.453125, 53.5390625, 56.625, 59.7109375, 62.796875, 65.8828125, 68.96875, 72.0546875, 75.140625, 78.2265625, 81.3125, 84.3984375, 87.484375, 90.5703125, 93.65625, 96.7421875, 99.828125, 102.9140625, 106.0]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 12.0, 14.0, 25.0, 50.0, 51.0, 86.0, 161.0, 273.0, 547.0, 1283.0, 3230.0, 10583.0, 50277.0, 672582.0, 270259.0, 27632.0, 7138.0, 2434.0, 894.0, 428.0, 230.0, 133.0, 74.0, 35.0, 39.0, 17.0, 10.0, 10.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.9375, -66.18798828125, -64.4384765625, -62.68896484375, -60.939453125, -59.18994140625, -57.4404296875, -55.69091796875, -53.94140625, -52.19189453125, -50.4423828125, -48.69287109375, -46.943359375, -45.19384765625, -43.4443359375, -41.69482421875, -39.9453125, -38.19580078125, -36.4462890625, -34.69677734375, -32.947265625, -31.19775390625, -29.4482421875, -27.69873046875, -25.94921875, -24.19970703125, -22.4501953125, -20.70068359375, -18.951171875, -17.20166015625, -15.4521484375, -13.70263671875, -11.953125, -10.20361328125, -8.4541015625, -6.70458984375, -4.955078125, -3.20556640625, -1.4560546875, 0.29345703125, 2.04296875, 3.79248046875, 5.5419921875, 7.29150390625, 9.041015625, 10.79052734375, 12.5400390625, 14.28955078125, 16.0390625, 17.78857421875, 19.5380859375, 21.28759765625, 23.037109375, 24.78662109375, 26.5361328125, 28.28564453125, 30.03515625, 31.78466796875, 33.5341796875, 35.28369140625, 37.033203125, 38.78271484375, 40.5322265625, 42.28173828125, 44.03125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 22.0, 21.0, 39.0, 50.0, 61.0, 103.0, 154.0, 203.0, 114.0, 71.0, 63.0, 25.0, 15.0, 12.0, 11.0, 8.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007171630859375, -0.0069618821144104, -0.006752133369445801, -0.006542384624481201, -0.0063326358795166016, -0.006122887134552002, -0.005913138389587402, -0.005703389644622803, -0.005493640899658203, -0.0052838921546936035, -0.005074143409729004, -0.004864394664764404, -0.004654645919799805, -0.004444897174835205, -0.0042351484298706055, -0.004025399684906006, -0.0038156509399414062, -0.0036059021949768066, -0.003396153450012207, -0.0031864047050476074, -0.002976655960083008, -0.002766907215118408, -0.0025571584701538086, -0.002347409725189209, -0.0021376609802246094, -0.0019279122352600098, -0.0017181634902954102, -0.0015084147453308105, -0.001298666000366211, -0.0010889172554016113, -0.0008791685104370117, -0.0006694197654724121, -0.0004596710205078125, -0.0002499222755432129, -4.017353057861328e-05, 0.00016957521438598633, 0.00037932395935058594, 0.0005890727043151855, 0.0007988214492797852, 0.0010085701942443848, 0.0012183189392089844, 0.001428067684173584, 0.0016378164291381836, 0.0018475651741027832, 0.002057313919067383, 0.0022670626640319824, 0.002476811408996582, 0.0026865601539611816, 0.0028963088989257812, 0.003106057643890381, 0.0033158063888549805, 0.00352555513381958, 0.0037353038787841797, 0.003945052623748779, 0.004154801368713379, 0.0043645501136779785, 0.004574298858642578, 0.004784047603607178, 0.004993796348571777, 0.005203545093536377, 0.0054132938385009766, 0.005623042583465576, 0.005832791328430176, 0.006042540073394775, 0.006252288818359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 11.0, 13.0, 19.0, 31.0, 41.0, 47.0, 82.0, 114.0, 188.0, 293.0, 557.0, 1072.0, 2403.0, 7590.0, 37094.0, 594176.0, 367218.0, 27197.0, 6183.0, 2024.0, 931.0, 446.0, 265.0, 164.0, 116.0, 64.0, 52.0, 39.0, 28.0, 15.0, 13.0, 16.0, 12.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.625, -55.76123046875, -53.8974609375, -52.03369140625, -50.169921875, -48.30615234375, -46.4423828125, -44.57861328125, -42.71484375, -40.85107421875, -38.9873046875, -37.12353515625, -35.259765625, -33.39599609375, -31.5322265625, -29.66845703125, -27.8046875, -25.94091796875, -24.0771484375, -22.21337890625, -20.349609375, -18.48583984375, -16.6220703125, -14.75830078125, -12.89453125, -11.03076171875, -9.1669921875, -7.30322265625, -5.439453125, -3.57568359375, -1.7119140625, 0.15185546875, 2.015625, 3.87939453125, 5.7431640625, 7.60693359375, 9.470703125, 11.33447265625, 13.1982421875, 15.06201171875, 16.92578125, 18.78955078125, 20.6533203125, 22.51708984375, 24.380859375, 26.24462890625, 28.1083984375, 29.97216796875, 31.8359375, 33.69970703125, 35.5634765625, 37.42724609375, 39.291015625, 41.15478515625, 43.0185546875, 44.88232421875, 46.74609375, 48.60986328125, 50.4736328125, 52.33740234375, 54.201171875, 56.06494140625, 57.9287109375, 59.79248046875, 61.65625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 8.0, 3.0, 8.0, 8.0, 11.0, 13.0, 14.0, 35.0, 45.0, 64.0, 100.0, 110.0, 141.0, 118.0, 87.0, 60.0, 47.0, 29.0, 26.0, 19.0, 15.0, 8.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.625, -60.11328125, -58.6015625, -57.08984375, -55.578125, -54.06640625, -52.5546875, -51.04296875, -49.53125, -48.01953125, -46.5078125, -44.99609375, -43.484375, -41.97265625, -40.4609375, -38.94921875, -37.4375, -35.92578125, -34.4140625, -32.90234375, -31.390625, -29.87890625, -28.3671875, -26.85546875, -25.34375, -23.83203125, -22.3203125, -20.80859375, -19.296875, -17.78515625, -16.2734375, -14.76171875, -13.25, -11.73828125, -10.2265625, -8.71484375, -7.203125, -5.69140625, -4.1796875, -2.66796875, -1.15625, 0.35546875, 1.8671875, 3.37890625, 4.890625, 6.40234375, 7.9140625, 9.42578125, 10.9375, 12.44921875, 13.9609375, 15.47265625, 16.984375, 18.49609375, 20.0078125, 21.51953125, 23.03125, 24.54296875, 26.0546875, 27.56640625, 29.078125, 30.58984375, 32.1015625, 33.61328125, 35.125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 17.0, 41.0, 85.0, 172.0, 272.0, 199.0, 111.0, 49.0, 24.0, 9.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1484.2841796875, -1448.778564453125, -1413.2730712890625, -1377.7674560546875, -1342.261962890625, -1306.75634765625, -1271.2508544921875, -1235.7452392578125, -1200.23974609375, -1164.734130859375, -1129.2286376953125, -1093.7230224609375, -1058.217529296875, -1022.7119750976562, -987.2064208984375, -951.7008056640625, -916.1952514648438, -880.689697265625, -845.1841430664062, -809.6785888671875, -774.1730346679688, -738.66748046875, -703.161865234375, -667.6563720703125, -632.1507568359375, -596.6452026367188, -561.1396484375, -525.6340942382812, -490.1285400390625, -454.62298583984375, -419.1174011230469, -383.6118469238281, -348.1063232421875, -312.60076904296875, -277.09521484375, -241.5896453857422, -206.08409118652344, -170.5785369873047, -135.07296752929688, -99.56741333007812, -64.06185913085938, -28.55630111694336, 6.949256896972656, 42.45481872558594, 77.96037292480469, 113.46592712402344, 148.97149658203125, 184.47705078125, 219.98260498046875, 255.4881591796875, 290.99371337890625, 326.499267578125, 362.00482177734375, 397.5103759765625, 433.0159606933594, 468.5215148925781, 504.0270690917969, 539.5326538085938, 575.0382080078125, 610.5437622070312, 646.04931640625, 681.5548706054688, 717.0604248046875, 752.5659790039062, 788.071533203125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 15.0, 9.0, 16.0, 25.0, 22.0, 26.0, 32.0, 33.0, 33.0, 43.0, 43.0, 47.0, 62.0, 56.0, 39.0, 43.0, 56.0, 41.0, 50.0, 47.0, 34.0, 34.0, 26.0, 28.0, 23.0, 13.0, 16.0, 21.0, 17.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-648.2952880859375, -630.0960083007812, -611.896728515625, -593.6974487304688, -575.4981689453125, -557.2989501953125, -539.099609375, -520.900390625, -502.70111083984375, -484.5018310546875, -466.30255126953125, -448.103271484375, -429.9040222167969, -411.7047424316406, -393.5054626464844, -375.3061828613281, -357.1069030761719, -338.9076232910156, -320.7083435058594, -302.50909423828125, -284.309814453125, -266.11053466796875, -247.9112548828125, -229.71197509765625, -211.51271057128906, -193.3134307861328, -175.11416625976562, -156.91488647460938, -138.71560668945312, -120.51634216308594, -102.31706237792969, -84.11779022216797, -65.91851806640625, -47.71924591064453, -29.519969940185547, -11.320693969726562, 6.878578186035156, 25.077850341796875, 43.277130126953125, 61.476402282714844, 79.67567443847656, 97.87494659423828, 116.07421875, 134.27349853515625, 152.4727783203125, 170.6720428466797, 188.87132263183594, 207.07058715820312, 225.26986694335938, 243.46914672851562, 261.6684265136719, 279.86767578125, 298.06695556640625, 316.2662353515625, 334.46551513671875, 352.664794921875, 370.86407470703125, 389.0633544921875, 407.26263427734375, 425.4619140625, 443.6611633300781, 461.8604431152344, 480.0597229003906, 498.2590026855469, 516.458251953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 8.0, 19.0, 27.0, 34.0, 43.0, 50.0, 64.0, 108.0, 176.0, 291.0, 549.0, 1120.0, 2453.0, 6227.0, 20222.0, 104748.0, 3834577.0, 183036.0, 26981.0, 7856.0, 2944.0, 1224.0, 571.0, 308.0, 181.0, 124.0, 73.0, 73.0, 52.0, 26.0, 26.0, 9.0, 11.0, 10.0, 6.0, 7.0, 6.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.5, -114.498046875, -110.49609375, -106.494140625, -102.4921875, -98.490234375, -94.48828125, -90.486328125, -86.484375, -82.482421875, -78.48046875, -74.478515625, -70.4765625, -66.474609375, -62.47265625, -58.470703125, -54.46875, -50.466796875, -46.46484375, -42.462890625, -38.4609375, -34.458984375, -30.45703125, -26.455078125, -22.453125, -18.451171875, -14.44921875, -10.447265625, -6.4453125, -2.443359375, 1.55859375, 5.560546875, 9.5625, 13.564453125, 17.56640625, 21.568359375, 25.5703125, 29.572265625, 33.57421875, 37.576171875, 41.578125, 45.580078125, 49.58203125, 53.583984375, 57.5859375, 61.587890625, 65.58984375, 69.591796875, 73.59375, 77.595703125, 81.59765625, 85.599609375, 89.6015625, 93.603515625, 97.60546875, 101.607421875, 105.609375, 109.611328125, 113.61328125, 117.615234375, 121.6171875, 125.619140625, 129.62109375, 133.623046875, 137.625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 5.0, 1.0, 9.0, 11.0, 21.0, 13.0, 18.0, 31.0, 46.0, 42.0, 45.0, 66.0, 61.0, 93.0, 54.0, 56.0, 86.0, 82.0, 55.0, 38.0, 40.0, 34.0, 31.0, 25.0, 14.0, 12.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.61083984375, -22.4716796875, -21.33251953125, -20.193359375, -19.05419921875, -17.9150390625, -16.77587890625, -15.63671875, -14.49755859375, -13.3583984375, -12.21923828125, -11.080078125, -9.94091796875, -8.8017578125, -7.66259765625, -6.5234375, -5.38427734375, -4.2451171875, -3.10595703125, -1.966796875, -0.82763671875, 0.3115234375, 1.45068359375, 2.58984375, 3.72900390625, 4.8681640625, 6.00732421875, 7.146484375, 8.28564453125, 9.4248046875, 10.56396484375, 11.703125, 12.84228515625, 13.9814453125, 15.12060546875, 16.259765625, 17.39892578125, 18.5380859375, 19.67724609375, 20.81640625, 21.95556640625, 23.0947265625, 24.23388671875, 25.373046875, 26.51220703125, 27.6513671875, 28.79052734375, 29.9296875, 31.06884765625, 32.2080078125, 33.34716796875, 34.486328125, 35.62548828125, 36.7646484375, 37.90380859375, 39.04296875, 40.18212890625, 41.3212890625, 42.46044921875, 43.599609375, 44.73876953125, 45.8779296875, 47.01708984375, 48.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 8.0, 5.0, 15.0, 25.0, 42.0, 37.0, 85.0, 137.0, 255.0, 424.0, 781.0, 1665.0, 4542.0, 17067.0, 153410.0, 3901076.0, 94582.0, 13116.0, 3822.0, 1573.0, 727.0, 369.0, 182.0, 132.0, 84.0, 30.0, 36.0, 20.0, 12.0, 5.0, 3.0, 3.0, 8.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.875, -149.9453125, -145.015625, -140.0859375, -135.15625, -130.2265625, -125.296875, -120.3671875, -115.4375, -110.5078125, -105.578125, -100.6484375, -95.71875, -90.7890625, -85.859375, -80.9296875, -76.0, -71.0703125, -66.140625, -61.2109375, -56.28125, -51.3515625, -46.421875, -41.4921875, -36.5625, -31.6328125, -26.703125, -21.7734375, -16.84375, -11.9140625, -6.984375, -2.0546875, 2.875, 7.8046875, 12.734375, 17.6640625, 22.59375, 27.5234375, 32.453125, 37.3828125, 42.3125, 47.2421875, 52.171875, 57.1015625, 62.03125, 66.9609375, 71.890625, 76.8203125, 81.75, 86.6796875, 91.609375, 96.5390625, 101.46875, 106.3984375, 111.328125, 116.2578125, 121.1875, 126.1171875, 131.046875, 135.9765625, 140.90625, 145.8359375, 150.765625, 155.6953125, 160.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 13.0, 18.0, 32.0, 77.0, 188.0, 2031.0, 1327.0, 189.0, 80.0, 30.0, 19.0, 11.0, 13.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-110.6875, -107.521484375, -104.35546875, -101.189453125, -98.0234375, -94.857421875, -91.69140625, -88.525390625, -85.359375, -82.193359375, -79.02734375, -75.861328125, -72.6953125, -69.529296875, -66.36328125, -63.197265625, -60.03125, -56.865234375, -53.69921875, -50.533203125, -47.3671875, -44.201171875, -41.03515625, -37.869140625, -34.703125, -31.537109375, -28.37109375, -25.205078125, -22.0390625, -18.873046875, -15.70703125, -12.541015625, -9.375, -6.208984375, -3.04296875, 0.123046875, 3.2890625, 6.455078125, 9.62109375, 12.787109375, 15.953125, 19.119140625, 22.28515625, 25.451171875, 28.6171875, 31.783203125, 34.94921875, 38.115234375, 41.28125, 44.447265625, 47.61328125, 50.779296875, 53.9453125, 57.111328125, 60.27734375, 63.443359375, 66.609375, 69.775390625, 72.94140625, 76.107421875, 79.2734375, 82.439453125, 85.60546875, 88.771484375, 91.9375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 14.0, 66.0, 126.0, 311.0, 304.0, 107.0, 29.0, 15.0, 5.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-339.3290100097656, -318.2330017089844, -297.1369934082031, -276.0409851074219, -254.94497680664062, -233.84896850585938, -212.7529754638672, -191.65696716308594, -170.5609588623047, -149.46495056152344, -128.3689422607422, -107.27294158935547, -86.17693328857422, -65.08092498779297, -43.98492431640625, -22.888916015625, -1.79290771484375, 19.303098678588867, 40.399105072021484, 61.49510955810547, 82.59111785888672, 103.68712615966797, 124.78312683105469, 145.87913513183594, 166.9751434326172, 188.07115173339844, 209.1671600341797, 230.26315307617188, 251.35916137695312, 272.4551696777344, 293.5511779785156, 314.6471862792969, 335.74322509765625, 356.8392333984375, 377.93524169921875, 399.03125, 420.12725830078125, 441.2232666015625, 462.31927490234375, 483.415283203125, 504.51129150390625, 525.6072998046875, 546.7033081054688, 567.79931640625, 588.8953247070312, 609.9913330078125, 631.0873413085938, 652.183349609375, 673.279296875, 694.3753051757812, 715.4713134765625, 736.5673217773438, 757.663330078125, 778.7593383789062, 799.8553466796875, 820.9513549804688, 842.04736328125, 863.1433715820312, 884.2393798828125, 905.3353881835938, 926.431396484375, 947.5274047851562, 968.6234130859375, 989.7194213867188, 1010.8154296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 11.0, 22.0, 39.0, 46.0, 64.0, 87.0, 95.0, 84.0, 120.0, 83.0, 86.0, 79.0, 59.0, 37.0, 25.0, 19.0, 12.0, 6.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-365.9420166015625, -352.9200439453125, -339.8980712890625, -326.8761291503906, -313.8541564941406, -300.8321838378906, -287.8102111816406, -274.78826904296875, -261.76629638671875, -248.74432373046875, -235.7223663330078, -222.7003936767578, -209.67843627929688, -196.65646362304688, -183.63449096679688, -170.61253356933594, -157.59056091308594, -144.56858825683594, -131.546630859375, -118.524658203125, -105.50270080566406, -92.48072814941406, -79.4587631225586, -66.43679809570312, -53.414833068847656, -40.39286804199219, -27.370901107788086, -14.348934173583984, -1.3269691467285156, 11.694999694824219, 24.716964721679688, 37.738929748535156, 50.760894775390625, 63.782859802246094, 76.80482482910156, 89.82679748535156, 102.8487548828125, 115.8707275390625, 128.8927001953125, 141.91465759277344, 154.93661499023438, 167.95858764648438, 180.9805450439453, 194.0025177001953, 207.02447509765625, 220.04644775390625, 233.06842041015625, 246.0903778076172, 259.11236572265625, 272.13433837890625, 285.15631103515625, 298.1782531738281, 311.2002258300781, 324.2221984863281, 337.2441711425781, 350.26611328125, 363.2880859375, 376.31005859375, 389.33203125, 402.3539733886719, 415.3759460449219, 428.3979187011719, 441.4198913574219, 454.44183349609375, 467.46380615234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 23.0, 23.0, 27.0, 50.0, 83.0, 155.0, 315.0, 672.0, 1602.0, 5382.0, 20877.0, 96457.0, 453223.0, 372011.0, 74582.0, 16171.0, 4308.0, 1356.0, 555.0, 299.0, 158.0, 77.0, 46.0, 39.0, 20.0, 11.0, 8.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-127.5, -123.23828125, -118.9765625, -114.71484375, -110.453125, -106.19140625, -101.9296875, -97.66796875, -93.40625, -89.14453125, -84.8828125, -80.62109375, -76.359375, -72.09765625, -67.8359375, -63.57421875, -59.3125, -55.05078125, -50.7890625, -46.52734375, -42.265625, -38.00390625, -33.7421875, -29.48046875, -25.21875, -20.95703125, -16.6953125, -12.43359375, -8.171875, -3.91015625, 0.3515625, 4.61328125, 8.875, 13.13671875, 17.3984375, 21.66015625, 25.921875, 30.18359375, 34.4453125, 38.70703125, 42.96875, 47.23046875, 51.4921875, 55.75390625, 60.015625, 64.27734375, 68.5390625, 72.80078125, 77.0625, 81.32421875, 85.5859375, 89.84765625, 94.109375, 98.37109375, 102.6328125, 106.89453125, 111.15625, 115.41796875, 119.6796875, 123.94140625, 128.203125, 132.46484375, 136.7265625, 140.98828125, 145.25]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 10.0, 9.0, 16.0, 35.0, 31.0, 46.0, 66.0, 73.0, 75.0, 75.0, 85.0, 79.0, 88.0, 71.0, 65.0, 41.0, 43.0, 40.0, 17.0, 13.0, 10.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.1982421875, -26.833984375, -25.4697265625, -24.10546875, -22.7412109375, -21.376953125, -20.0126953125, -18.6484375, -17.2841796875, -15.919921875, -14.5556640625, -13.19140625, -11.8271484375, -10.462890625, -9.0986328125, -7.734375, -6.3701171875, -5.005859375, -3.6416015625, -2.27734375, -0.9130859375, 0.451171875, 1.8154296875, 3.1796875, 4.5439453125, 5.908203125, 7.2724609375, 8.63671875, 10.0009765625, 11.365234375, 12.7294921875, 14.09375, 15.4580078125, 16.822265625, 18.1865234375, 19.55078125, 20.9150390625, 22.279296875, 23.6435546875, 25.0078125, 26.3720703125, 27.736328125, 29.1005859375, 30.46484375, 31.8291015625, 33.193359375, 34.5576171875, 35.921875, 37.2861328125, 38.650390625, 40.0146484375, 41.37890625, 42.7431640625, 44.107421875, 45.4716796875, 46.8359375, 48.2001953125, 49.564453125, 50.9287109375, 52.29296875, 53.6572265625, 55.021484375, 56.3857421875, 57.75]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 10.0, 10.0, 8.0, 13.0, 19.0, 25.0, 44.0, 44.0, 68.0, 105.0, 189.0, 240.0, 406.0, 715.0, 1478.0, 5263.0, 51064.0, 801384.0, 172726.0, 10151.0, 2271.0, 903.0, 498.0, 305.0, 190.0, 137.0, 94.0, 52.0, 38.0, 25.0, 19.0, 22.0, 10.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.5, -270.232421875, -261.96484375, -253.697265625, -245.4296875, -237.162109375, -228.89453125, -220.626953125, -212.359375, -204.091796875, -195.82421875, -187.556640625, -179.2890625, -171.021484375, -162.75390625, -154.486328125, -146.21875, -137.951171875, -129.68359375, -121.416015625, -113.1484375, -104.880859375, -96.61328125, -88.345703125, -80.078125, -71.810546875, -63.54296875, -55.275390625, -47.0078125, -38.740234375, -30.47265625, -22.205078125, -13.9375, -5.669921875, 2.59765625, 10.865234375, 19.1328125, 27.400390625, 35.66796875, 43.935546875, 52.203125, 60.470703125, 68.73828125, 77.005859375, 85.2734375, 93.541015625, 101.80859375, 110.076171875, 118.34375, 126.611328125, 134.87890625, 143.146484375, 151.4140625, 159.681640625, 167.94921875, 176.216796875, 184.484375, 192.751953125, 201.01953125, 209.287109375, 217.5546875, 225.822265625, 234.08984375, 242.357421875, 250.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 9.0, 9.0, 10.0, 15.0, 12.0, 12.0, 23.0, 19.0, 25.0, 30.0, 35.0, 35.0, 36.0, 48.0, 53.0, 52.0, 46.0, 35.0, 66.0, 52.0, 49.0, 37.0, 40.0, 29.0, 32.0, 35.0, 28.0, 17.0, 14.0, 22.0, 15.0, 14.0, 8.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.125, -122.79296875, -118.4609375, -114.12890625, -109.796875, -105.46484375, -101.1328125, -96.80078125, -92.46875, -88.13671875, -83.8046875, -79.47265625, -75.140625, -70.80859375, -66.4765625, -62.14453125, -57.8125, -53.48046875, -49.1484375, -44.81640625, -40.484375, -36.15234375, -31.8203125, -27.48828125, -23.15625, -18.82421875, -14.4921875, -10.16015625, -5.828125, -1.49609375, 2.8359375, 7.16796875, 11.5, 15.83203125, 20.1640625, 24.49609375, 28.828125, 33.16015625, 37.4921875, 41.82421875, 46.15625, 50.48828125, 54.8203125, 59.15234375, 63.484375, 67.81640625, 72.1484375, 76.48046875, 80.8125, 85.14453125, 89.4765625, 93.80859375, 98.140625, 102.47265625, 106.8046875, 111.13671875, 115.46875, 119.80078125, 124.1328125, 128.46484375, 132.796875, 137.12890625, 141.4609375, 145.79296875, 150.125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 7.0, 12.0, 15.0, 28.0, 40.0, 44.0, 68.0, 83.0, 162.0, 263.0, 407.0, 787.0, 1520.0, 3534.0, 9237.0, 30349.0, 140452.0, 545589.0, 245056.0, 48501.0, 13358.0, 4714.0, 2046.0, 973.0, 513.0, 280.0, 164.0, 100.0, 57.0, 52.0, 41.0, 21.0, 17.0, 9.0, 10.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.34375, -45.8486328125, -44.353515625, -42.8583984375, -41.36328125, -39.8681640625, -38.373046875, -36.8779296875, -35.3828125, -33.8876953125, -32.392578125, -30.8974609375, -29.40234375, -27.9072265625, -26.412109375, -24.9169921875, -23.421875, -21.9267578125, -20.431640625, -18.9365234375, -17.44140625, -15.9462890625, -14.451171875, -12.9560546875, -11.4609375, -9.9658203125, -8.470703125, -6.9755859375, -5.48046875, -3.9853515625, -2.490234375, -0.9951171875, 0.5, 1.9951171875, 3.490234375, 4.9853515625, 6.48046875, 7.9755859375, 9.470703125, 10.9658203125, 12.4609375, 13.9560546875, 15.451171875, 16.9462890625, 18.44140625, 19.9365234375, 21.431640625, 22.9267578125, 24.421875, 25.9169921875, 27.412109375, 28.9072265625, 30.40234375, 31.8974609375, 33.392578125, 34.8876953125, 36.3828125, 37.8779296875, 39.373046875, 40.8681640625, 42.36328125, 43.8583984375, 45.353515625, 46.8486328125, 48.34375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 13.0, 19.0, 22.0, 31.0, 36.0, 56.0, 90.0, 85.0, 97.0, 121.0, 111.0, 80.0, 62.0, 49.0, 28.0, 21.0, 16.0, 14.0, 12.0, 3.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00638580322265625, -0.006151080131530762, -0.0059163570404052734, -0.005681633949279785, -0.005446910858154297, -0.005212187767028809, -0.00497746467590332, -0.004742741584777832, -0.004508018493652344, -0.0042732954025268555, -0.004038572311401367, -0.003803849220275879, -0.0035691261291503906, -0.0033344030380249023, -0.003099679946899414, -0.0028649568557739258, -0.0026302337646484375, -0.0023955106735229492, -0.002160787582397461, -0.0019260644912719727, -0.0016913414001464844, -0.001456618309020996, -0.0012218952178955078, -0.0009871721267700195, -0.0007524490356445312, -0.000517725944519043, -0.0002830028533935547, -4.8279762268066406e-05, 0.00018644332885742188, 0.00042116641998291016, 0.0006558895111083984, 0.0008906126022338867, 0.001125335693359375, 0.0013600587844848633, 0.0015947818756103516, 0.0018295049667358398, 0.002064228057861328, 0.0022989511489868164, 0.0025336742401123047, 0.002768397331237793, 0.0030031204223632812, 0.0032378435134887695, 0.003472566604614258, 0.003707289695739746, 0.003942012786865234, 0.004176735877990723, 0.004411458969116211, 0.004646182060241699, 0.0048809051513671875, 0.005115628242492676, 0.005350351333618164, 0.005585074424743652, 0.005819797515869141, 0.006054520606994629, 0.006289243698120117, 0.0065239667892456055, 0.006758689880371094, 0.006993412971496582, 0.00722813606262207, 0.007462859153747559, 0.007697582244873047, 0.007932305335998535, 0.008167028427124023, 0.008401751518249512, 0.008636474609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 18.0, 13.0, 43.0, 46.0, 68.0, 104.0, 179.0, 318.0, 587.0, 1215.0, 3364.0, 14316.0, 117098.0, 754400.0, 134801.0, 15524.0, 3662.0, 1329.0, 606.0, 301.0, 208.0, 94.0, 67.0, 43.0, 30.0, 22.0, 25.0, 14.0, 8.0, 5.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-75.3125, -72.9970703125, -70.681640625, -68.3662109375, -66.05078125, -63.7353515625, -61.419921875, -59.1044921875, -56.7890625, -54.4736328125, -52.158203125, -49.8427734375, -47.52734375, -45.2119140625, -42.896484375, -40.5810546875, -38.265625, -35.9501953125, -33.634765625, -31.3193359375, -29.00390625, -26.6884765625, -24.373046875, -22.0576171875, -19.7421875, -17.4267578125, -15.111328125, -12.7958984375, -10.48046875, -8.1650390625, -5.849609375, -3.5341796875, -1.21875, 1.0966796875, 3.412109375, 5.7275390625, 8.04296875, 10.3583984375, 12.673828125, 14.9892578125, 17.3046875, 19.6201171875, 21.935546875, 24.2509765625, 26.56640625, 28.8818359375, 31.197265625, 33.5126953125, 35.828125, 38.1435546875, 40.458984375, 42.7744140625, 45.08984375, 47.4052734375, 49.720703125, 52.0361328125, 54.3515625, 56.6669921875, 58.982421875, 61.2978515625, 63.61328125, 65.9287109375, 68.244140625, 70.5595703125, 72.875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 6.0, 8.0, 7.0, 9.0, 15.0, 18.0, 19.0, 34.0, 39.0, 44.0, 60.0, 98.0, 104.0, 86.0, 106.0, 77.0, 66.0, 47.0, 48.0, 25.0, 14.0, 22.0, 17.0, 8.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.65625, -42.974609375, -41.29296875, -39.611328125, -37.9296875, -36.248046875, -34.56640625, -32.884765625, -31.203125, -29.521484375, -27.83984375, -26.158203125, -24.4765625, -22.794921875, -21.11328125, -19.431640625, -17.75, -16.068359375, -14.38671875, -12.705078125, -11.0234375, -9.341796875, -7.66015625, -5.978515625, -4.296875, -2.615234375, -0.93359375, 0.748046875, 2.4296875, 4.111328125, 5.79296875, 7.474609375, 9.15625, 10.837890625, 12.51953125, 14.201171875, 15.8828125, 17.564453125, 19.24609375, 20.927734375, 22.609375, 24.291015625, 25.97265625, 27.654296875, 29.3359375, 31.017578125, 32.69921875, 34.380859375, 36.0625, 37.744140625, 39.42578125, 41.107421875, 42.7890625, 44.470703125, 46.15234375, 47.833984375, 49.515625, 51.197265625, 52.87890625, 54.560546875, 56.2421875, 57.923828125, 59.60546875, 61.287109375, 62.96875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 17.0, 40.0, 164.0, 288.0, 281.0, 123.0, 51.0, 23.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1671.16015625, -1615.161376953125, -1559.16259765625, -1503.163818359375, -1447.1650390625, -1391.166259765625, -1335.16748046875, -1279.168701171875, -1223.169921875, -1167.171142578125, -1111.17236328125, -1055.173583984375, -999.1748046875, -943.176025390625, -887.1771850585938, -831.1784057617188, -775.1795654296875, -719.1807861328125, -663.1820068359375, -607.1832275390625, -551.1844482421875, -495.1856384277344, -439.18682861328125, -383.18804931640625, -327.18927001953125, -271.19049072265625, -215.1916961669922, -159.19290161132812, -103.19412231445312, -47.195343017578125, 8.803466796875, 64.80224609375, 120.8009033203125, 176.7996826171875, 232.79847717285156, 288.7972717285156, 344.7960510253906, 400.7948303222656, 456.79364013671875, 512.7924194335938, 568.7911987304688, 624.7899780273438, 680.7887573242188, 736.78759765625, 792.786376953125, 848.78515625, 904.783935546875, 960.78271484375, 1016.781494140625, 1072.7802734375, 1128.779052734375, 1184.77783203125, 1240.776611328125, 1296.775390625, 1352.774169921875, 1408.77294921875, 1464.771728515625, 1520.7705078125, 1576.769287109375, 1632.76806640625, 1688.766845703125, 1744.765625, 1800.764404296875, 1856.76318359375, 1912.7620849609375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 5.0, 3.0, 10.0, 12.0, 12.0, 17.0, 17.0, 24.0, 22.0, 24.0, 35.0, 30.0, 40.0, 43.0, 40.0, 43.0, 41.0, 45.0, 45.0, 50.0, 46.0, 46.0, 39.0, 45.0, 41.0, 40.0, 28.0, 15.0, 26.0, 21.0, 16.0, 12.0, 8.0, 8.0, 7.0, 8.0, 5.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-729.532470703125, -708.1761474609375, -686.81982421875, -665.4635009765625, -644.107177734375, -622.7507934570312, -601.3944702148438, -580.0381469726562, -558.6818237304688, -537.3255004882812, -515.9691772460938, -494.6128234863281, -473.2565002441406, -451.9001770019531, -430.5438232421875, -409.1875, -387.8311767578125, -366.474853515625, -345.1185302734375, -323.7621765136719, -302.4058532714844, -281.0495300292969, -259.69317626953125, -238.33685302734375, -216.98052978515625, -195.62420654296875, -174.2678680419922, -152.91152954101562, -131.55520629882812, -110.1988754272461, -88.84254455566406, -67.4862060546875, -46.1298828125, -24.77355194091797, -3.4172210693359375, 17.939109802246094, 39.295440673828125, 60.651771545410156, 82.00810241699219, 103.36444091796875, 124.72076416015625, 146.07708740234375, 167.4334259033203, 188.78976440429688, 210.14608764648438, 231.50241088867188, 252.85874938964844, 274.215087890625, 295.5714111328125, 316.927734375, 338.2840576171875, 359.6404113769531, 380.9967346191406, 402.3530578613281, 423.70941162109375, 445.06573486328125, 466.42205810546875, 487.77838134765625, 509.13470458984375, 530.4910278320312, 551.847412109375, 573.2037353515625, 594.56005859375, 615.9163818359375, 637.272705078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 10.0, 5.0, 24.0, 28.0, 58.0, 100.0, 170.0, 352.0, 875.0, 2577.0, 20211.0, 4148973.0, 16993.0, 2379.0, 762.0, 352.0, 192.0, 84.0, 33.0, 32.0, 19.0, 8.0, 9.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-295.75, -286.3515625, -276.953125, -267.5546875, -258.15625, -248.7578125, -239.359375, -229.9609375, -220.5625, -211.1640625, -201.765625, -192.3671875, -182.96875, -173.5703125, -164.171875, -154.7734375, -145.375, -135.9765625, -126.578125, -117.1796875, -107.78125, -98.3828125, -88.984375, -79.5859375, -70.1875, -60.7890625, -51.390625, -41.9921875, -32.59375, -23.1953125, -13.796875, -4.3984375, 5.0, 14.3984375, 23.796875, 33.1953125, 42.59375, 51.9921875, 61.390625, 70.7890625, 80.1875, 89.5859375, 98.984375, 108.3828125, 117.78125, 127.1796875, 136.578125, 145.9765625, 155.375, 164.7734375, 174.171875, 183.5703125, 192.96875, 202.3671875, 211.765625, 221.1640625, 230.5625, 239.9609375, 249.359375, 258.7578125, 268.15625, 277.5546875, 286.953125, 296.3515625, 305.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 9.0, 2.0, 9.0, 5.0, 8.0, 16.0, 31.0, 28.0, 46.0, 60.0, 55.0, 88.0, 70.0, 94.0, 83.0, 92.0, 76.0, 58.0, 48.0, 37.0, 36.0, 19.0, 12.0, 9.0, 8.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -48.5625, -46.8125, -45.0625, -43.3125, -41.5625, -39.8125, -38.0625, -36.3125, -34.5625, -32.8125, -31.0625, -29.3125, -27.5625, -25.8125, -24.0625, -22.3125, -20.5625, -18.8125, -17.0625, -15.3125, -13.5625, -11.8125, -10.0625, -8.3125, -6.5625, -4.8125, -3.0625, -1.3125, 0.4375, 2.1875, 3.9375, 5.6875, 7.4375, 9.1875, 10.9375, 12.6875, 14.4375, 16.1875, 17.9375, 19.6875, 21.4375, 23.1875, 24.9375, 26.6875, 28.4375, 30.1875, 31.9375, 33.6875, 35.4375, 37.1875, 38.9375, 40.6875, 42.4375, 44.1875, 45.9375, 47.6875, 49.4375, 51.1875, 52.9375, 54.6875, 56.4375, 58.1875, 59.9375, 61.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 4.0, 11.0, 14.0, 17.0, 28.0, 34.0, 42.0, 47.0, 80.0, 121.0, 168.0, 236.0, 355.0, 613.0, 1033.0, 2039.0, 4670.0, 14135.0, 115891.0, 4009301.0, 31281.0, 7620.0, 2926.0, 1420.0, 790.0, 456.0, 262.0, 194.0, 136.0, 93.0, 74.0, 51.0, 34.0, 27.0, 25.0, 16.0, 11.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.375, -142.94140625, -138.5078125, -134.07421875, -129.640625, -125.20703125, -120.7734375, -116.33984375, -111.90625, -107.47265625, -103.0390625, -98.60546875, -94.171875, -89.73828125, -85.3046875, -80.87109375, -76.4375, -72.00390625, -67.5703125, -63.13671875, -58.703125, -54.26953125, -49.8359375, -45.40234375, -40.96875, -36.53515625, -32.1015625, -27.66796875, -23.234375, -18.80078125, -14.3671875, -9.93359375, -5.5, -1.06640625, 3.3671875, 7.80078125, 12.234375, 16.66796875, 21.1015625, 25.53515625, 29.96875, 34.40234375, 38.8359375, 43.26953125, 47.703125, 52.13671875, 56.5703125, 61.00390625, 65.4375, 69.87109375, 74.3046875, 78.73828125, 83.171875, 87.60546875, 92.0390625, 96.47265625, 100.90625, 105.33984375, 109.7734375, 114.20703125, 118.640625, 123.07421875, 127.5078125, 131.94140625, 136.375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 3.0, 7.0, 12.0, 37.0, 92.0, 3590.0, 213.0, 55.0, 22.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.78125, -51.42041015625, -50.0595703125, -48.69873046875, -47.337890625, -45.97705078125, -44.6162109375, -43.25537109375, -41.89453125, -40.53369140625, -39.1728515625, -37.81201171875, -36.451171875, -35.09033203125, -33.7294921875, -32.36865234375, -31.0078125, -29.64697265625, -28.2861328125, -26.92529296875, -25.564453125, -24.20361328125, -22.8427734375, -21.48193359375, -20.12109375, -18.76025390625, -17.3994140625, -16.03857421875, -14.677734375, -13.31689453125, -11.9560546875, -10.59521484375, -9.234375, -7.87353515625, -6.5126953125, -5.15185546875, -3.791015625, -2.43017578125, -1.0693359375, 0.29150390625, 1.65234375, 3.01318359375, 4.3740234375, 5.73486328125, 7.095703125, 8.45654296875, 9.8173828125, 11.17822265625, 12.5390625, 13.89990234375, 15.2607421875, 16.62158203125, 17.982421875, 19.34326171875, 20.7041015625, 22.06494140625, 23.42578125, 24.78662109375, 26.1474609375, 27.50830078125, 28.869140625, 30.22998046875, 31.5908203125, 32.95166015625, 34.3125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 11.0, 38.0, 124.0, 275.0, 365.0, 143.0, 36.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-347.22235107421875, -338.36297607421875, -329.50360107421875, -320.6442565917969, -311.7848815917969, -302.9255065917969, -294.0661315917969, -285.2067565917969, -276.347412109375, -267.488037109375, -258.628662109375, -249.76930236816406, -240.90994262695312, -232.05056762695312, -223.19119262695312, -214.33181762695312, -205.47244262695312, -196.61306762695312, -187.7537078857422, -178.8943328857422, -170.03497314453125, -161.17559814453125, -152.31622314453125, -143.45684814453125, -134.5974884033203, -125.73812103271484, -116.87875366210938, -108.01937866210938, -99.1600112915039, -90.30064392089844, -81.44126892089844, -72.58190155029297, -63.7225341796875, -54.86316680908203, -46.0037956237793, -37.14442443847656, -28.285057067871094, -19.425689697265625, -10.56631851196289, -1.7069473266601562, 7.1524200439453125, 16.011789321899414, 24.871158599853516, 33.73052978515625, 42.58989715576172, 51.44926452636719, 60.30863571166992, 69.16800689697266, 78.02737426757812, 86.8867416381836, 95.74610900878906, 104.60548400878906, 113.46485137939453, 122.32421875, 131.18359375, 140.04296875, 148.90232849121094, 157.76170349121094, 166.62106323242188, 175.48043823242188, 184.33981323242188, 193.1991729736328, 202.0585479736328, 210.91790771484375, 219.77728271484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 4.0, 4.0, 5.0, 6.0, 12.0, 9.0, 14.0, 14.0, 24.0, 24.0, 19.0, 24.0, 33.0, 17.0, 28.0, 34.0, 31.0, 36.0, 26.0, 41.0, 37.0, 41.0, 45.0, 37.0, 31.0, 41.0, 27.0, 36.0, 36.0, 31.0, 34.0, 29.0, 28.0, 30.0, 21.0, 13.0, 15.0, 14.0, 8.0, 12.0, 7.0, 8.0, 8.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.54640197753906, -45.96523666381836, -44.384071350097656, -42.80290603637695, -41.22174072265625, -39.64057159423828, -38.059410095214844, -36.478240966796875, -34.89707565307617, -33.31591033935547, -31.734745025634766, -30.153579711914062, -28.572412490844727, -26.991247177124023, -25.41008186340332, -23.828914642333984, -22.247751235961914, -20.66658592224121, -19.085420608520508, -17.504253387451172, -15.923088073730469, -14.341922760009766, -12.760757446289062, -11.179591178894043, -9.59842586517334, -8.017260551452637, -6.436094284057617, -4.854928970336914, -3.2737631797790527, -1.6925973892211914, -0.11143207550048828, 1.4697341918945312, 3.0508995056152344, 4.632065296173096, 6.213231086730957, 7.79439640045166, 9.37556266784668, 10.956727981567383, 12.537893295288086, 14.119059562683105, 15.700224876403809, 17.281391143798828, 18.86255645751953, 20.443721771240234, 22.024887084960938, 23.60605239868164, 25.187217712402344, 26.76838493347168, 28.349550247192383, 29.930715560913086, 31.51188087463379, 33.093048095703125, 34.67421340942383, 36.25537872314453, 37.836544036865234, 39.41770935058594, 40.99887466430664, 42.580039978027344, 44.16120529174805, 45.74237060546875, 47.32353591918945, 48.904701232910156, 50.485870361328125, 52.06703567504883, 53.64820098876953]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 15.0, 24.0, 40.0, 49.0, 104.0, 153.0, 237.0, 479.0, 840.0, 1795.0, 4218.0, 11702.0, 39015.0, 142741.0, 393163.0, 315531.0, 96873.0, 26764.0, 8505.0, 3189.0, 1499.0, 672.0, 367.0, 208.0, 135.0, 78.0, 52.0, 38.0, 18.0, 12.0, 10.0, 4.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.0, -106.6513671875, -103.302734375, -99.9541015625, -96.60546875, -93.2568359375, -89.908203125, -86.5595703125, -83.2109375, -79.8623046875, -76.513671875, -73.1650390625, -69.81640625, -66.4677734375, -63.119140625, -59.7705078125, -56.421875, -53.0732421875, -49.724609375, -46.3759765625, -43.02734375, -39.6787109375, -36.330078125, -32.9814453125, -29.6328125, -26.2841796875, -22.935546875, -19.5869140625, -16.23828125, -12.8896484375, -9.541015625, -6.1923828125, -2.84375, 0.5048828125, 3.853515625, 7.2021484375, 10.55078125, 13.8994140625, 17.248046875, 20.5966796875, 23.9453125, 27.2939453125, 30.642578125, 33.9912109375, 37.33984375, 40.6884765625, 44.037109375, 47.3857421875, 50.734375, 54.0830078125, 57.431640625, 60.7802734375, 64.12890625, 67.4775390625, 70.826171875, 74.1748046875, 77.5234375, 80.8720703125, 84.220703125, 87.5693359375, 90.91796875, 94.2666015625, 97.615234375, 100.9638671875, 104.3125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 6.0, 10.0, 15.0, 24.0, 25.0, 38.0, 44.0, 68.0, 73.0, 83.0, 72.0, 84.0, 83.0, 89.0, 74.0, 58.0, 42.0, 28.0, 27.0, 20.0, 13.0, 11.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.53125, -48.74462890625, -46.9580078125, -45.17138671875, -43.384765625, -41.59814453125, -39.8115234375, -38.02490234375, -36.23828125, -34.45166015625, -32.6650390625, -30.87841796875, -29.091796875, -27.30517578125, -25.5185546875, -23.73193359375, -21.9453125, -20.15869140625, -18.3720703125, -16.58544921875, -14.798828125, -13.01220703125, -11.2255859375, -9.43896484375, -7.65234375, -5.86572265625, -4.0791015625, -2.29248046875, -0.505859375, 1.28076171875, 3.0673828125, 4.85400390625, 6.640625, 8.42724609375, 10.2138671875, 12.00048828125, 13.787109375, 15.57373046875, 17.3603515625, 19.14697265625, 20.93359375, 22.72021484375, 24.5068359375, 26.29345703125, 28.080078125, 29.86669921875, 31.6533203125, 33.43994140625, 35.2265625, 37.01318359375, 38.7998046875, 40.58642578125, 42.373046875, 44.15966796875, 45.9462890625, 47.73291015625, 49.51953125, 51.30615234375, 53.0927734375, 54.87939453125, 56.666015625, 58.45263671875, 60.2392578125, 62.02587890625, 63.8125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 3.0, 11.0, 10.0, 20.0, 18.0, 34.0, 54.0, 58.0, 114.0, 127.0, 166.0, 236.0, 409.0, 637.0, 1090.0, 2984.0, 23384.0, 709338.0, 294113.0, 11176.0, 1976.0, 942.0, 510.0, 333.0, 215.0, 173.0, 128.0, 83.0, 60.0, 36.0, 22.0, 27.0, 12.0, 13.0, 10.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.75, -275.84765625, -265.9453125, -256.04296875, -246.140625, -236.23828125, -226.3359375, -216.43359375, -206.53125, -196.62890625, -186.7265625, -176.82421875, -166.921875, -157.01953125, -147.1171875, -137.21484375, -127.3125, -117.41015625, -107.5078125, -97.60546875, -87.703125, -77.80078125, -67.8984375, -57.99609375, -48.09375, -38.19140625, -28.2890625, -18.38671875, -8.484375, 1.41796875, 11.3203125, 21.22265625, 31.125, 41.02734375, 50.9296875, 60.83203125, 70.734375, 80.63671875, 90.5390625, 100.44140625, 110.34375, 120.24609375, 130.1484375, 140.05078125, 149.953125, 159.85546875, 169.7578125, 179.66015625, 189.5625, 199.46484375, 209.3671875, 219.26953125, 229.171875, 239.07421875, 248.9765625, 258.87890625, 268.78125, 278.68359375, 288.5859375, 298.48828125, 308.390625, 318.29296875, 328.1953125, 338.09765625, 348.0]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 8.0, 14.0, 13.0, 15.0, 27.0, 30.0, 15.0, 18.0, 43.0, 34.0, 44.0, 52.0, 46.0, 57.0, 46.0, 45.0, 44.0, 47.0, 47.0, 48.0, 43.0, 35.0, 30.0, 32.0, 26.0, 19.0, 18.0, 16.0, 20.0, 14.0, 12.0, 5.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-184.0, -178.4140625, -172.828125, -167.2421875, -161.65625, -156.0703125, -150.484375, -144.8984375, -139.3125, -133.7265625, -128.140625, -122.5546875, -116.96875, -111.3828125, -105.796875, -100.2109375, -94.625, -89.0390625, -83.453125, -77.8671875, -72.28125, -66.6953125, -61.109375, -55.5234375, -49.9375, -44.3515625, -38.765625, -33.1796875, -27.59375, -22.0078125, -16.421875, -10.8359375, -5.25, 0.3359375, 5.921875, 11.5078125, 17.09375, 22.6796875, 28.265625, 33.8515625, 39.4375, 45.0234375, 50.609375, 56.1953125, 61.78125, 67.3671875, 72.953125, 78.5390625, 84.125, 89.7109375, 95.296875, 100.8828125, 106.46875, 112.0546875, 117.640625, 123.2265625, 128.8125, 134.3984375, 139.984375, 145.5703125, 151.15625, 156.7421875, 162.328125, 167.9140625, 173.5]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 4.0, 15.0, 19.0, 27.0, 18.0, 53.0, 61.0, 105.0, 130.0, 221.0, 409.0, 791.0, 1994.0, 5782.0, 25629.0, 207531.0, 688434.0, 95464.0, 14857.0, 3986.0, 1440.0, 644.0, 331.0, 189.0, 120.0, 78.0, 60.0, 31.0, 26.0, 23.0, 10.0, 10.0, 8.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0], "bins": [-83.0625, -80.7763671875, -78.490234375, -76.2041015625, -73.91796875, -71.6318359375, -69.345703125, -67.0595703125, -64.7734375, -62.4873046875, -60.201171875, -57.9150390625, -55.62890625, -53.3427734375, -51.056640625, -48.7705078125, -46.484375, -44.1982421875, -41.912109375, -39.6259765625, -37.33984375, -35.0537109375, -32.767578125, -30.4814453125, -28.1953125, -25.9091796875, -23.623046875, -21.3369140625, -19.05078125, -16.7646484375, -14.478515625, -12.1923828125, -9.90625, -7.6201171875, -5.333984375, -3.0478515625, -0.76171875, 1.5244140625, 3.810546875, 6.0966796875, 8.3828125, 10.6689453125, 12.955078125, 15.2412109375, 17.52734375, 19.8134765625, 22.099609375, 24.3857421875, 26.671875, 28.9580078125, 31.244140625, 33.5302734375, 35.81640625, 38.1025390625, 40.388671875, 42.6748046875, 44.9609375, 47.2470703125, 49.533203125, 51.8193359375, 54.10546875, 56.3916015625, 58.677734375, 60.9638671875, 63.25]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 3.0, 3.0, 10.0, 8.0, 13.0, 13.0, 26.0, 30.0, 54.0, 48.0, 84.0, 96.0, 118.0, 116.0, 88.0, 76.0, 55.0, 42.0, 27.0, 24.0, 16.0, 13.0, 11.0, 6.0, 0.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007373809814453125, -0.007077634334564209, -0.006781458854675293, -0.006485283374786377, -0.006189107894897461, -0.005892932415008545, -0.005596756935119629, -0.005300581455230713, -0.005004405975341797, -0.004708230495452881, -0.004412055015563965, -0.004115879535675049, -0.003819704055786133, -0.003523528575897217, -0.0032273530960083008, -0.0029311776161193848, -0.0026350021362304688, -0.0023388266563415527, -0.0020426511764526367, -0.0017464756965637207, -0.0014503002166748047, -0.0011541247367858887, -0.0008579492568969727, -0.0005617737770080566, -0.0002655982971191406, 3.057718276977539e-05, 0.0003267526626586914, 0.0006229281425476074, 0.0009191036224365234, 0.0012152791023254395, 0.0015114545822143555, 0.0018076300621032715, 0.0021038055419921875, 0.0023999810218811035, 0.0026961565017700195, 0.0029923319816589355, 0.0032885074615478516, 0.0035846829414367676, 0.0038808584213256836, 0.0041770339012146, 0.004473209381103516, 0.004769384860992432, 0.005065560340881348, 0.005361735820770264, 0.00565791130065918, 0.005954086780548096, 0.006250262260437012, 0.006546437740325928, 0.006842613220214844, 0.00713878870010376, 0.007434964179992676, 0.007731139659881592, 0.008027315139770508, 0.008323490619659424, 0.00861966609954834, 0.008915841579437256, 0.009212017059326172, 0.009508192539215088, 0.009804368019104004, 0.01010054349899292, 0.010396718978881836, 0.010692894458770752, 0.010989069938659668, 0.011285245418548584, 0.0115814208984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 14.0, 25.0, 26.0, 40.0, 75.0, 130.0, 291.0, 782.0, 2977.0, 27711.0, 893993.0, 114656.0, 5775.0, 1218.0, 417.0, 164.0, 95.0, 55.0, 42.0, 25.0, 16.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.9375, -100.5068359375, -96.076171875, -91.6455078125, -87.21484375, -82.7841796875, -78.353515625, -73.9228515625, -69.4921875, -65.0615234375, -60.630859375, -56.2001953125, -51.76953125, -47.3388671875, -42.908203125, -38.4775390625, -34.046875, -29.6162109375, -25.185546875, -20.7548828125, -16.32421875, -11.8935546875, -7.462890625, -3.0322265625, 1.3984375, 5.8291015625, 10.259765625, 14.6904296875, 19.12109375, 23.5517578125, 27.982421875, 32.4130859375, 36.84375, 41.2744140625, 45.705078125, 50.1357421875, 54.56640625, 58.9970703125, 63.427734375, 67.8583984375, 72.2890625, 76.7197265625, 81.150390625, 85.5810546875, 90.01171875, 94.4423828125, 98.873046875, 103.3037109375, 107.734375, 112.1650390625, 116.595703125, 121.0263671875, 125.45703125, 129.8876953125, 134.318359375, 138.7490234375, 143.1796875, 147.6103515625, 152.041015625, 156.4716796875, 160.90234375, 165.3330078125, 169.763671875, 174.1943359375, 178.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 4.0, 8.0, 9.0, 26.0, 26.0, 35.0, 54.0, 53.0, 64.0, 80.0, 114.0, 121.0, 116.0, 68.0, 59.0, 36.0, 46.0, 22.0, 12.0, 15.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.09375, -51.82958984375, -49.5654296875, -47.30126953125, -45.037109375, -42.77294921875, -40.5087890625, -38.24462890625, -35.98046875, -33.71630859375, -31.4521484375, -29.18798828125, -26.923828125, -24.65966796875, -22.3955078125, -20.13134765625, -17.8671875, -15.60302734375, -13.3388671875, -11.07470703125, -8.810546875, -6.54638671875, -4.2822265625, -2.01806640625, 0.24609375, 2.51025390625, 4.7744140625, 7.03857421875, 9.302734375, 11.56689453125, 13.8310546875, 16.09521484375, 18.359375, 20.62353515625, 22.8876953125, 25.15185546875, 27.416015625, 29.68017578125, 31.9443359375, 34.20849609375, 36.47265625, 38.73681640625, 41.0009765625, 43.26513671875, 45.529296875, 47.79345703125, 50.0576171875, 52.32177734375, 54.5859375, 56.85009765625, 59.1142578125, 61.37841796875, 63.642578125, 65.90673828125, 68.1708984375, 70.43505859375, 72.69921875, 74.96337890625, 77.2275390625, 79.49169921875, 81.755859375, 84.02001953125, 86.2841796875, 88.54833984375, 90.8125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 10.0, 39.0, 85.0, 169.0, 273.0, 250.0, 112.0, 45.0, 10.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1913.9091796875, -1853.7603759765625, -1793.6114501953125, -1733.462646484375, -1673.3138427734375, -1613.1650390625, -1553.01611328125, -1492.8673095703125, -1432.718505859375, -1372.5697021484375, -1312.4207763671875, -1252.27197265625, -1192.1231689453125, -1131.974365234375, -1071.825439453125, -1011.6766357421875, -951.5277099609375, -891.3788452148438, -831.2300415039062, -771.0811767578125, -710.932373046875, -650.7835083007812, -590.6346435546875, -530.48583984375, -470.33697509765625, -410.1881408691406, -350.039306640625, -289.89044189453125, -229.74160766601562, -169.5927734375, -109.44390869140625, -49.295074462890625, 10.8536376953125, 71.00247955322266, 131.1513214111328, 191.3001708984375, 251.44900512695312, 311.59783935546875, 371.7467041015625, 431.8955383300781, 492.04437255859375, 552.1932373046875, 612.342041015625, 672.4909057617188, 732.6397705078125, 792.78857421875, 852.9374389648438, 913.0863037109375, 973.235107421875, 1033.3839111328125, 1093.5328369140625, 1153.681640625, 1213.8304443359375, 1273.979248046875, 1334.128173828125, 1394.2769775390625, 1454.42578125, 1514.5745849609375, 1574.7235107421875, 1634.872314453125, 1695.0211181640625, 1755.169921875, 1815.31884765625, 1875.4676513671875, 1935.6165771484375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 9.0, 7.0, 14.0, 11.0, 17.0, 24.0, 23.0, 32.0, 29.0, 38.0, 33.0, 43.0, 45.0, 46.0, 62.0, 51.0, 64.0, 43.0, 37.0, 53.0, 43.0, 41.0, 34.0, 28.0, 32.0, 21.0, 22.0, 26.0, 18.0, 16.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-933.82958984375, -908.5966186523438, -883.3636474609375, -858.1306762695312, -832.897705078125, -807.6646728515625, -782.4317016601562, -757.19873046875, -731.9657592773438, -706.7327880859375, -681.4998168945312, -656.266845703125, -631.0338134765625, -605.8008422851562, -580.56787109375, -555.3348999023438, -530.1019287109375, -504.86895751953125, -479.635986328125, -454.4029846191406, -429.1700134277344, -403.9370422363281, -378.70404052734375, -353.4710693359375, -328.23809814453125, -303.005126953125, -277.77215576171875, -252.53915405273438, -227.30618286132812, -202.07321166992188, -176.84022521972656, -151.60723876953125, -126.37432861328125, -101.14134979248047, -75.90837097167969, -50.675392150878906, -25.442413330078125, -0.20943450927734375, 25.023544311523438, 50.25653076171875, 75.489501953125, 100.72248077392578, 125.95545959472656, 151.18844604492188, 176.42141723632812, 201.65438842773438, 226.8873748779297, 252.120361328125, 277.35333251953125, 302.5863037109375, 327.81927490234375, 353.0522766113281, 378.2852478027344, 403.5182189941406, 428.751220703125, 453.98419189453125, 479.2171630859375, 504.45013427734375, 529.68310546875, 554.9160766601562, 580.1490478515625, 605.382080078125, 630.6150512695312, 655.8480224609375, 681.0809936523438]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 8.0, 18.0, 15.0, 28.0, 46.0, 62.0, 92.0, 128.0, 231.0, 402.0, 679.0, 1348.0, 3027.0, 7936.0, 27341.0, 757264.0, 3353516.0, 28213.0, 7994.0, 3009.0, 1277.0, 678.0, 348.0, 212.0, 111.0, 94.0, 55.0, 41.0, 27.0, 26.0, 13.0, 10.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.8125, -96.7880859375, -93.763671875, -90.7392578125, -87.71484375, -84.6904296875, -81.666015625, -78.6416015625, -75.6171875, -72.5927734375, -69.568359375, -66.5439453125, -63.51953125, -60.4951171875, -57.470703125, -54.4462890625, -51.421875, -48.3974609375, -45.373046875, -42.3486328125, -39.32421875, -36.2998046875, -33.275390625, -30.2509765625, -27.2265625, -24.2021484375, -21.177734375, -18.1533203125, -15.12890625, -12.1044921875, -9.080078125, -6.0556640625, -3.03125, -0.0068359375, 3.017578125, 6.0419921875, 9.06640625, 12.0908203125, 15.115234375, 18.1396484375, 21.1640625, 24.1884765625, 27.212890625, 30.2373046875, 33.26171875, 36.2861328125, 39.310546875, 42.3349609375, 45.359375, 48.3837890625, 51.408203125, 54.4326171875, 57.45703125, 60.4814453125, 63.505859375, 66.5302734375, 69.5546875, 72.5791015625, 75.603515625, 78.6279296875, 81.65234375, 84.6767578125, 87.701171875, 90.7255859375, 93.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 2.0, 7.0, 7.0, 7.0, 18.0, 21.0, 36.0, 41.0, 50.0, 52.0, 71.0, 57.0, 82.0, 65.0, 70.0, 76.0, 62.0, 48.0, 54.0, 32.0, 41.0, 28.0, 21.0, 13.0, 10.0, 7.0, 5.0, 5.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.28125, -42.736328125, -41.19140625, -39.646484375, -38.1015625, -36.556640625, -35.01171875, -33.466796875, -31.921875, -30.376953125, -28.83203125, -27.287109375, -25.7421875, -24.197265625, -22.65234375, -21.107421875, -19.5625, -18.017578125, -16.47265625, -14.927734375, -13.3828125, -11.837890625, -10.29296875, -8.748046875, -7.203125, -5.658203125, -4.11328125, -2.568359375, -1.0234375, 0.521484375, 2.06640625, 3.611328125, 5.15625, 6.701171875, 8.24609375, 9.791015625, 11.3359375, 12.880859375, 14.42578125, 15.970703125, 17.515625, 19.060546875, 20.60546875, 22.150390625, 23.6953125, 25.240234375, 26.78515625, 28.330078125, 29.875, 31.419921875, 32.96484375, 34.509765625, 36.0546875, 37.599609375, 39.14453125, 40.689453125, 42.234375, 43.779296875, 45.32421875, 46.869140625, 48.4140625, 49.958984375, 51.50390625, 53.048828125, 54.59375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 10.0, 12.0, 16.0, 22.0, 36.0, 69.0, 90.0, 98.0, 156.0, 251.0, 365.0, 620.0, 813.0, 1432.0, 2299.0, 3979.0, 7997.0, 21597.0, 83390.0, 3870854.0, 147744.0, 29899.0, 10496.0, 4880.0, 2654.0, 1526.0, 1044.0, 620.0, 429.0, 265.0, 199.0, 124.0, 92.0, 52.0, 51.0, 21.0, 22.0, 17.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.9375, -67.4072265625, -64.876953125, -62.3466796875, -59.81640625, -57.2861328125, -54.755859375, -52.2255859375, -49.6953125, -47.1650390625, -44.634765625, -42.1044921875, -39.57421875, -37.0439453125, -34.513671875, -31.9833984375, -29.453125, -26.9228515625, -24.392578125, -21.8623046875, -19.33203125, -16.8017578125, -14.271484375, -11.7412109375, -9.2109375, -6.6806640625, -4.150390625, -1.6201171875, 0.91015625, 3.4404296875, 5.970703125, 8.5009765625, 11.03125, 13.5615234375, 16.091796875, 18.6220703125, 21.15234375, 23.6826171875, 26.212890625, 28.7431640625, 31.2734375, 33.8037109375, 36.333984375, 38.8642578125, 41.39453125, 43.9248046875, 46.455078125, 48.9853515625, 51.515625, 54.0458984375, 56.576171875, 59.1064453125, 61.63671875, 64.1669921875, 66.697265625, 69.2275390625, 71.7578125, 74.2880859375, 76.818359375, 79.3486328125, 81.87890625, 84.4091796875, 86.939453125, 89.4697265625, 92.0]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 10.0, 9.0, 29.0, 41.0, 67.0, 187.0, 3363.0, 189.0, 69.0, 40.0, 20.0, 8.0, 6.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.84375, -42.7880859375, -41.732421875, -40.6767578125, -39.62109375, -38.5654296875, -37.509765625, -36.4541015625, -35.3984375, -34.3427734375, -33.287109375, -32.2314453125, -31.17578125, -30.1201171875, -29.064453125, -28.0087890625, -26.953125, -25.8974609375, -24.841796875, -23.7861328125, -22.73046875, -21.6748046875, -20.619140625, -19.5634765625, -18.5078125, -17.4521484375, -16.396484375, -15.3408203125, -14.28515625, -13.2294921875, -12.173828125, -11.1181640625, -10.0625, -9.0068359375, -7.951171875, -6.8955078125, -5.83984375, -4.7841796875, -3.728515625, -2.6728515625, -1.6171875, -0.5615234375, 0.494140625, 1.5498046875, 2.60546875, 3.6611328125, 4.716796875, 5.7724609375, 6.828125, 7.8837890625, 8.939453125, 9.9951171875, 11.05078125, 12.1064453125, 13.162109375, 14.2177734375, 15.2734375, 16.3291015625, 17.384765625, 18.4404296875, 19.49609375, 20.5517578125, 21.607421875, 22.6630859375, 23.71875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 10.0, 6.0, 10.0, 15.0, 29.0, 64.0, 66.0, 82.0, 136.0, 130.0, 118.0, 109.0, 62.0, 53.0, 42.0, 28.0, 8.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.57127380371094, -133.9714813232422, -130.37167358398438, -126.77188110351562, -123.17208099365234, -119.57228088378906, -115.97248077392578, -112.3726806640625, -108.77288818359375, -105.17308807373047, -101.57328796386719, -97.97349548339844, -94.37369537353516, -90.77389526367188, -87.1740951538086, -83.57429504394531, -79.97449493408203, -76.37469482421875, -72.77489471435547, -69.17509460449219, -65.57530212402344, -61.975502014160156, -58.375701904296875, -54.775901794433594, -51.17610549926758, -47.5763053894043, -43.97650909423828, -40.376708984375, -36.77690887451172, -33.1771125793457, -29.577312469482422, -25.977514266967773, -22.377716064453125, -18.777917861938477, -15.178118705749512, -11.578319549560547, -7.978521347045898, -4.37872314453125, -0.7789230346679688, 2.8208751678466797, 6.420673370361328, 10.020471572875977, 13.620270729064941, 17.220069885253906, 20.819868087768555, 24.419666290283203, 28.019466400146484, 31.619264602661133, 35.21906280517578, 38.81886291503906, 42.41865921020508, 46.01845932006836, 49.618255615234375, 53.218055725097656, 56.81785583496094, 60.41765594482422, 64.0174560546875, 67.61725616455078, 71.21705627441406, 74.81684875488281, 78.4166488647461, 82.01644897460938, 85.61624908447266, 89.21604919433594, 92.81584167480469]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 11.0, 11.0, 12.0, 8.0, 14.0, 8.0, 12.0, 26.0, 22.0, 31.0, 23.0, 34.0, 40.0, 36.0, 29.0, 43.0, 37.0, 41.0, 36.0, 36.0, 41.0, 50.0, 40.0, 49.0, 36.0, 32.0, 36.0, 21.0, 18.0, 26.0, 21.0, 17.0, 14.0, 15.0, 8.0, 9.0, 7.0, 6.0, 6.0, 7.0, 8.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90528869628906, -49.03809356689453, -47.1708984375, -45.30370330810547, -43.43650436401367, -41.56930923461914, -39.70211410522461, -37.83491897583008, -35.96772003173828, -34.10052490234375, -32.23332977294922, -30.366132736206055, -28.49893569946289, -26.63174057006836, -24.764545440673828, -22.897350311279297, -21.030155181884766, -19.162960052490234, -17.29576301574707, -15.428567886352539, -13.561371803283691, -11.694175720214844, -9.826980590820312, -7.959784507751465, -6.092588424682617, -4.2253923416137695, -2.35819673538208, -0.4910011291503906, 1.376194953918457, 3.2433910369873047, 5.110586166381836, 6.977782249450684, 8.844978332519531, 10.712174415588379, 12.579370498657227, 14.446565628051758, 16.313762664794922, 18.180957794189453, 20.048152923583984, 21.915348052978516, 23.78254508972168, 25.64974021911621, 27.516937255859375, 29.384132385253906, 31.251327514648438, 33.11852264404297, 34.9857177734375, 36.8529167175293, 38.72011184692383, 40.58730697631836, 42.45450210571289, 44.32170104980469, 46.18889617919922, 48.05609130859375, 49.92328643798828, 51.79048156738281, 53.657676696777344, 55.524871826171875, 57.392066955566406, 59.25926208496094, 61.126461029052734, 62.993656158447266, 64.86085510253906, 66.7280502319336, 68.59524536132812]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 12.0, 11.0, 22.0, 46.0, 52.0, 81.0, 147.0, 227.0, 423.0, 672.0, 1183.0, 2381.0, 4474.0, 9756.0, 23857.0, 64417.0, 183830.0, 357562.0, 248944.0, 92298.0, 33034.0, 13073.0, 5722.0, 2815.0, 1496.0, 810.0, 466.0, 266.0, 164.0, 108.0, 76.0, 43.0, 32.0, 14.0, 8.0, 13.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.5, -72.955078125, -70.41015625, -67.865234375, -65.3203125, -62.775390625, -60.23046875, -57.685546875, -55.140625, -52.595703125, -50.05078125, -47.505859375, -44.9609375, -42.416015625, -39.87109375, -37.326171875, -34.78125, -32.236328125, -29.69140625, -27.146484375, -24.6015625, -22.056640625, -19.51171875, -16.966796875, -14.421875, -11.876953125, -9.33203125, -6.787109375, -4.2421875, -1.697265625, 0.84765625, 3.392578125, 5.9375, 8.482421875, 11.02734375, 13.572265625, 16.1171875, 18.662109375, 21.20703125, 23.751953125, 26.296875, 28.841796875, 31.38671875, 33.931640625, 36.4765625, 39.021484375, 41.56640625, 44.111328125, 46.65625, 49.201171875, 51.74609375, 54.291015625, 56.8359375, 59.380859375, 61.92578125, 64.470703125, 67.015625, 69.560546875, 72.10546875, 74.650390625, 77.1953125, 79.740234375, 82.28515625, 84.830078125, 87.375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 7.0, 6.0, 7.0, 19.0, 15.0, 32.0, 43.0, 45.0, 56.0, 58.0, 77.0, 62.0, 76.0, 74.0, 61.0, 52.0, 65.0, 44.0, 44.0, 36.0, 33.0, 16.0, 16.0, 16.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84375, -44.26025390625, -42.6767578125, -41.09326171875, -39.509765625, -37.92626953125, -36.3427734375, -34.75927734375, -33.17578125, -31.59228515625, -30.0087890625, -28.42529296875, -26.841796875, -25.25830078125, -23.6748046875, -22.09130859375, -20.5078125, -18.92431640625, -17.3408203125, -15.75732421875, -14.173828125, -12.59033203125, -11.0068359375, -9.42333984375, -7.83984375, -6.25634765625, -4.6728515625, -3.08935546875, -1.505859375, 0.07763671875, 1.6611328125, 3.24462890625, 4.828125, 6.41162109375, 7.9951171875, 9.57861328125, 11.162109375, 12.74560546875, 14.3291015625, 15.91259765625, 17.49609375, 19.07958984375, 20.6630859375, 22.24658203125, 23.830078125, 25.41357421875, 26.9970703125, 28.58056640625, 30.1640625, 31.74755859375, 33.3310546875, 34.91455078125, 36.498046875, 38.08154296875, 39.6650390625, 41.24853515625, 42.83203125, 44.41552734375, 45.9990234375, 47.58251953125, 49.166015625, 50.74951171875, 52.3330078125, 53.91650390625, 55.5]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 10.0, 18.0, 19.0, 29.0, 49.0, 62.0, 83.0, 130.0, 210.0, 339.0, 570.0, 1049.0, 2513.0, 13791.0, 625376.0, 389510.0, 10155.0, 2278.0, 918.0, 508.0, 321.0, 190.0, 122.0, 88.0, 53.0, 43.0, 29.0, 19.0, 15.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-269.25, -259.25390625, -249.2578125, -239.26171875, -229.265625, -219.26953125, -209.2734375, -199.27734375, -189.28125, -179.28515625, -169.2890625, -159.29296875, -149.296875, -139.30078125, -129.3046875, -119.30859375, -109.3125, -99.31640625, -89.3203125, -79.32421875, -69.328125, -59.33203125, -49.3359375, -39.33984375, -29.34375, -19.34765625, -9.3515625, 0.64453125, 10.640625, 20.63671875, 30.6328125, 40.62890625, 50.625, 60.62109375, 70.6171875, 80.61328125, 90.609375, 100.60546875, 110.6015625, 120.59765625, 130.59375, 140.58984375, 150.5859375, 160.58203125, 170.578125, 180.57421875, 190.5703125, 200.56640625, 210.5625, 220.55859375, 230.5546875, 240.55078125, 250.546875, 260.54296875, 270.5390625, 280.53515625, 290.53125, 300.52734375, 310.5234375, 320.51953125, 330.515625, 340.51171875, 350.5078125, 360.50390625, 370.5]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 19.0, 18.0, 19.0, 35.0, 31.0, 37.0, 40.0, 65.0, 58.0, 72.0, 49.0, 63.0, 64.0, 60.0, 62.0, 42.0, 53.0, 48.0, 33.0, 30.0, 27.0, 13.0, 18.0, 8.0, 7.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-193.625, -186.623046875, -179.62109375, -172.619140625, -165.6171875, -158.615234375, -151.61328125, -144.611328125, -137.609375, -130.607421875, -123.60546875, -116.603515625, -109.6015625, -102.599609375, -95.59765625, -88.595703125, -81.59375, -74.591796875, -67.58984375, -60.587890625, -53.5859375, -46.583984375, -39.58203125, -32.580078125, -25.578125, -18.576171875, -11.57421875, -4.572265625, 2.4296875, 9.431640625, 16.43359375, 23.435546875, 30.4375, 37.439453125, 44.44140625, 51.443359375, 58.4453125, 65.447265625, 72.44921875, 79.451171875, 86.453125, 93.455078125, 100.45703125, 107.458984375, 114.4609375, 121.462890625, 128.46484375, 135.466796875, 142.46875, 149.470703125, 156.47265625, 163.474609375, 170.4765625, 177.478515625, 184.48046875, 191.482421875, 198.484375, 205.486328125, 212.48828125, 219.490234375, 226.4921875, 233.494140625, 240.49609375, 247.498046875, 254.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 8.0, 7.0, 9.0, 6.0, 13.0, 16.0, 28.0, 34.0, 50.0, 58.0, 102.0, 145.0, 222.0, 391.0, 988.0, 3025.0, 17805.0, 362650.0, 628938.0, 27612.0, 4009.0, 1164.0, 497.0, 260.0, 159.0, 99.0, 57.0, 58.0, 35.0, 30.0, 17.0, 16.0, 11.0, 6.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.5625, -98.2958984375, -95.029296875, -91.7626953125, -88.49609375, -85.2294921875, -81.962890625, -78.6962890625, -75.4296875, -72.1630859375, -68.896484375, -65.6298828125, -62.36328125, -59.0966796875, -55.830078125, -52.5634765625, -49.296875, -46.0302734375, -42.763671875, -39.4970703125, -36.23046875, -32.9638671875, -29.697265625, -26.4306640625, -23.1640625, -19.8974609375, -16.630859375, -13.3642578125, -10.09765625, -6.8310546875, -3.564453125, -0.2978515625, 2.96875, 6.2353515625, 9.501953125, 12.7685546875, 16.03515625, 19.3017578125, 22.568359375, 25.8349609375, 29.1015625, 32.3681640625, 35.634765625, 38.9013671875, 42.16796875, 45.4345703125, 48.701171875, 51.9677734375, 55.234375, 58.5009765625, 61.767578125, 65.0341796875, 68.30078125, 71.5673828125, 74.833984375, 78.1005859375, 81.3671875, 84.6337890625, 87.900390625, 91.1669921875, 94.43359375, 97.7001953125, 100.966796875, 104.2333984375, 107.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 3.0, 15.0, 9.0, 23.0, 38.0, 41.0, 70.0, 72.0, 92.0, 116.0, 113.0, 103.0, 76.0, 60.0, 34.0, 18.0, 35.0, 14.0, 12.0, 18.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007762908935546875, -0.007476508617401123, -0.007190108299255371, -0.006903707981109619, -0.006617307662963867, -0.006330907344818115, -0.006044507026672363, -0.005758106708526611, -0.005471706390380859, -0.005185306072235107, -0.0048989057540893555, -0.0046125054359436035, -0.0043261051177978516, -0.0040397047996521, -0.0037533044815063477, -0.0034669041633605957, -0.0031805038452148438, -0.002894103527069092, -0.00260770320892334, -0.002321302890777588, -0.002034902572631836, -0.001748502254486084, -0.001462101936340332, -0.00117570161819458, -0.0008893013000488281, -0.0006029009819030762, -0.0003165006637573242, -3.0100345611572266e-05, 0.0002562999725341797, 0.0005427002906799316, 0.0008291006088256836, 0.0011155009269714355, 0.0014019012451171875, 0.0016883015632629395, 0.0019747018814086914, 0.0022611021995544434, 0.0025475025177001953, 0.0028339028358459473, 0.0031203031539916992, 0.003406703472137451, 0.003693103790283203, 0.003979504108428955, 0.004265904426574707, 0.004552304744720459, 0.004838705062866211, 0.005125105381011963, 0.005411505699157715, 0.005697906017303467, 0.005984306335449219, 0.006270706653594971, 0.006557106971740723, 0.006843507289886475, 0.0071299076080322266, 0.0074163079261779785, 0.0077027082443237305, 0.007989108562469482, 0.008275508880615234, 0.008561909198760986, 0.008848309516906738, 0.00913470983505249, 0.009421110153198242, 0.009707510471343994, 0.009993910789489746, 0.010280311107635498, 0.01056671142578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 11.0, 11.0, 15.0, 25.0, 33.0, 38.0, 63.0, 114.0, 205.0, 407.0, 1041.0, 3774.0, 27205.0, 839918.0, 163271.0, 9129.0, 1902.0, 650.0, 289.0, 164.0, 95.0, 56.0, 33.0, 24.0, 19.0, 13.0, 12.0, 7.0, 9.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.5, -119.349609375, -115.19921875, -111.048828125, -106.8984375, -102.748046875, -98.59765625, -94.447265625, -90.296875, -86.146484375, -81.99609375, -77.845703125, -73.6953125, -69.544921875, -65.39453125, -61.244140625, -57.09375, -52.943359375, -48.79296875, -44.642578125, -40.4921875, -36.341796875, -32.19140625, -28.041015625, -23.890625, -19.740234375, -15.58984375, -11.439453125, -7.2890625, -3.138671875, 1.01171875, 5.162109375, 9.3125, 13.462890625, 17.61328125, 21.763671875, 25.9140625, 30.064453125, 34.21484375, 38.365234375, 42.515625, 46.666015625, 50.81640625, 54.966796875, 59.1171875, 63.267578125, 67.41796875, 71.568359375, 75.71875, 79.869140625, 84.01953125, 88.169921875, 92.3203125, 96.470703125, 100.62109375, 104.771484375, 108.921875, 113.072265625, 117.22265625, 121.373046875, 125.5234375, 129.673828125, 133.82421875, 137.974609375, 142.125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 23.0, 13.0, 36.0, 32.0, 48.0, 71.0, 77.0, 91.0, 100.0, 97.0, 98.0, 73.0, 55.0, 52.0, 23.0, 19.0, 17.0, 4.0, 11.0, 7.0, 10.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.875, -70.7255859375, -68.576171875, -66.4267578125, -64.27734375, -62.1279296875, -59.978515625, -57.8291015625, -55.6796875, -53.5302734375, -51.380859375, -49.2314453125, -47.08203125, -44.9326171875, -42.783203125, -40.6337890625, -38.484375, -36.3349609375, -34.185546875, -32.0361328125, -29.88671875, -27.7373046875, -25.587890625, -23.4384765625, -21.2890625, -19.1396484375, -16.990234375, -14.8408203125, -12.69140625, -10.5419921875, -8.392578125, -6.2431640625, -4.09375, -1.9443359375, 0.205078125, 2.3544921875, 4.50390625, 6.6533203125, 8.802734375, 10.9521484375, 13.1015625, 15.2509765625, 17.400390625, 19.5498046875, 21.69921875, 23.8486328125, 25.998046875, 28.1474609375, 30.296875, 32.4462890625, 34.595703125, 36.7451171875, 38.89453125, 41.0439453125, 43.193359375, 45.3427734375, 47.4921875, 49.6416015625, 51.791015625, 53.9404296875, 56.08984375, 58.2392578125, 60.388671875, 62.5380859375, 64.6875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 22.0, 113.0, 489.0, 321.0, 50.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6015.5625, -5881.4345703125, -5747.306640625, -5613.17919921875, -5479.05126953125, -5344.92333984375, -5210.7958984375, -5076.66796875, -4942.5400390625, -4808.412109375, -4674.2841796875, -4540.15673828125, -4406.02880859375, -4271.90087890625, -4137.7734375, -4003.6455078125, -3869.517578125, -3735.3896484375, -3601.261962890625, -3467.13427734375, -3333.00634765625, -3198.87841796875, -3064.750732421875, -2930.623046875, -2796.4951171875, -2662.3671875, -2528.239501953125, -2394.11181640625, -2259.98388671875, -2125.85595703125, -1991.728271484375, -1857.6004638671875, -1723.47216796875, -1589.3443603515625, -1455.216552734375, -1321.0887451171875, -1186.9609375, -1052.8331298828125, -918.705322265625, -784.5775146484375, -650.44970703125, -516.3218994140625, -382.194091796875, -248.0662841796875, -113.9384765625, 20.1893310546875, 154.317138671875, 288.4449462890625, 422.57275390625, 556.7005615234375, 690.828369140625, 824.9561767578125, 959.083984375, 1093.2117919921875, 1227.339599609375, 1361.4674072265625, 1495.59521484375, 1629.7230224609375, 1763.850830078125, 1897.9786376953125, 2032.1064453125, 2166.234375, 2300.362060546875, 2434.48974609375, 2568.61767578125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 8.0, 8.0, 12.0, 13.0, 27.0, 15.0, 21.0, 27.0, 27.0, 35.0, 39.0, 54.0, 44.0, 57.0, 45.0, 55.0, 67.0, 54.0, 47.0, 39.0, 44.0, 34.0, 36.0, 24.0, 22.0, 24.0, 23.0, 18.0, 14.0, 13.0, 11.0, 9.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-850.74365234375, -823.8064575195312, -796.8692626953125, -769.9320678710938, -742.994873046875, -716.0576171875, -689.1204223632812, -662.1832275390625, -635.2460327148438, -608.308837890625, -581.3716430664062, -554.4344482421875, -527.4971923828125, -500.5600280761719, -473.622802734375, -446.68560791015625, -419.7484130859375, -392.81121826171875, -365.8740234375, -338.9367980957031, -311.9996032714844, -285.0624084472656, -258.12518310546875, -231.18798828125, -204.25079345703125, -177.3135986328125, -150.3763885498047, -123.4391860961914, -96.50198364257812, -69.56478881835938, -42.62757873535156, -15.69036865234375, 11.24688720703125, 38.18408966064453, 65.12129211425781, 92.0584945678711, 118.99569702148438, 145.93289184570312, 172.87010192871094, 199.80731201171875, 226.7445068359375, 253.68170166015625, 280.618896484375, 307.5561218261719, 334.4933166503906, 361.4305114746094, 388.36773681640625, 415.304931640625, 442.24212646484375, 469.1793212890625, 496.11651611328125, 523.0537109375, 549.990966796875, 576.9281005859375, 603.8653564453125, 630.8025512695312, 657.73974609375, 684.6769409179688, 711.6141357421875, 738.5513305664062, 765.488525390625, 792.42578125, 819.3629760742188, 846.3001708984375, 873.2373657226562]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 15.0, 11.0, 22.0, 35.0, 32.0, 48.0, 74.0, 93.0, 136.0, 198.0, 305.0, 549.0, 892.0, 1648.0, 3344.0, 8942.0, 47621.0, 4095070.0, 23219.0, 6109.0, 2551.0, 1330.0, 727.0, 442.0, 282.0, 177.0, 122.0, 77.0, 41.0, 44.0, 30.0, 14.0, 19.0, 13.0, 15.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-151.5, -147.3291015625, -143.158203125, -138.9873046875, -134.81640625, -130.6455078125, -126.474609375, -122.3037109375, -118.1328125, -113.9619140625, -109.791015625, -105.6201171875, -101.44921875, -97.2783203125, -93.107421875, -88.9365234375, -84.765625, -80.5947265625, -76.423828125, -72.2529296875, -68.08203125, -63.9111328125, -59.740234375, -55.5693359375, -51.3984375, -47.2275390625, -43.056640625, -38.8857421875, -34.71484375, -30.5439453125, -26.373046875, -22.2021484375, -18.03125, -13.8603515625, -9.689453125, -5.5185546875, -1.34765625, 2.8232421875, 6.994140625, 11.1650390625, 15.3359375, 19.5068359375, 23.677734375, 27.8486328125, 32.01953125, 36.1904296875, 40.361328125, 44.5322265625, 48.703125, 52.8740234375, 57.044921875, 61.2158203125, 65.38671875, 69.5576171875, 73.728515625, 77.8994140625, 82.0703125, 86.2412109375, 90.412109375, 94.5830078125, 98.75390625, 102.9248046875, 107.095703125, 111.2666015625, 115.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 5.0, 13.0, 8.0, 17.0, 23.0, 20.0, 31.0, 41.0, 45.0, 57.0, 48.0, 65.0, 66.0, 78.0, 53.0, 57.0, 57.0, 52.0, 47.0, 35.0, 26.0, 28.0, 27.0, 21.0, 9.0, 12.0, 9.0, 10.0, 3.0, 4.0, 8.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.927734375, -37.57421875, -36.220703125, -34.8671875, -33.513671875, -32.16015625, -30.806640625, -29.453125, -28.099609375, -26.74609375, -25.392578125, -24.0390625, -22.685546875, -21.33203125, -19.978515625, -18.625, -17.271484375, -15.91796875, -14.564453125, -13.2109375, -11.857421875, -10.50390625, -9.150390625, -7.796875, -6.443359375, -5.08984375, -3.736328125, -2.3828125, -1.029296875, 0.32421875, 1.677734375, 3.03125, 4.384765625, 5.73828125, 7.091796875, 8.4453125, 9.798828125, 11.15234375, 12.505859375, 13.859375, 15.212890625, 16.56640625, 17.919921875, 19.2734375, 20.626953125, 21.98046875, 23.333984375, 24.6875, 26.041015625, 27.39453125, 28.748046875, 30.1015625, 31.455078125, 32.80859375, 34.162109375, 35.515625, 36.869140625, 38.22265625, 39.576171875, 40.9296875, 42.283203125, 43.63671875, 44.990234375, 46.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 11.0, 13.0, 18.0, 35.0, 36.0, 61.0, 66.0, 123.0, 213.0, 285.0, 387.0, 723.0, 1157.0, 1935.0, 3979.0, 8436.0, 23371.0, 116076.0, 3968214.0, 43367.0, 13429.0, 5698.0, 2821.0, 1382.0, 843.0, 528.0, 333.0, 237.0, 154.0, 121.0, 73.0, 47.0, 32.0, 20.0, 15.0, 16.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.25, -86.6435546875, -84.037109375, -81.4306640625, -78.82421875, -76.2177734375, -73.611328125, -71.0048828125, -68.3984375, -65.7919921875, -63.185546875, -60.5791015625, -57.97265625, -55.3662109375, -52.759765625, -50.1533203125, -47.546875, -44.9404296875, -42.333984375, -39.7275390625, -37.12109375, -34.5146484375, -31.908203125, -29.3017578125, -26.6953125, -24.0888671875, -21.482421875, -18.8759765625, -16.26953125, -13.6630859375, -11.056640625, -8.4501953125, -5.84375, -3.2373046875, -0.630859375, 1.9755859375, 4.58203125, 7.1884765625, 9.794921875, 12.4013671875, 15.0078125, 17.6142578125, 20.220703125, 22.8271484375, 25.43359375, 28.0400390625, 30.646484375, 33.2529296875, 35.859375, 38.4658203125, 41.072265625, 43.6787109375, 46.28515625, 48.8916015625, 51.498046875, 54.1044921875, 56.7109375, 59.3173828125, 61.923828125, 64.5302734375, 67.13671875, 69.7431640625, 72.349609375, 74.9560546875, 77.5625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 13.0, 18.0, 19.0, 49.0, 107.0, 3595.0, 114.0, 38.0, 26.0, 18.0, 11.0, 15.0, 3.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.21875, -21.411376953125, -20.60400390625, -19.796630859375, -18.9892578125, -18.181884765625, -17.37451171875, -16.567138671875, -15.759765625, -14.952392578125, -14.14501953125, -13.337646484375, -12.5302734375, -11.722900390625, -10.91552734375, -10.108154296875, -9.30078125, -8.493408203125, -7.68603515625, -6.878662109375, -6.0712890625, -5.263916015625, -4.45654296875, -3.649169921875, -2.841796875, -2.034423828125, -1.22705078125, -0.419677734375, 0.3876953125, 1.195068359375, 2.00244140625, 2.809814453125, 3.6171875, 4.424560546875, 5.23193359375, 6.039306640625, 6.8466796875, 7.654052734375, 8.46142578125, 9.268798828125, 10.076171875, 10.883544921875, 11.69091796875, 12.498291015625, 13.3056640625, 14.113037109375, 14.92041015625, 15.727783203125, 16.53515625, 17.342529296875, 18.14990234375, 18.957275390625, 19.7646484375, 20.572021484375, 21.37939453125, 22.186767578125, 22.994140625, 23.801513671875, 24.60888671875, 25.416259765625, 26.2236328125, 27.031005859375, 27.83837890625, 28.645751953125, 29.453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 8.0, 20.0, 66.0, 142.0, 243.0, 239.0, 178.0, 59.0, 23.0, 14.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.30206298828125, -229.56483459472656, -223.82760620117188, -218.09036254882812, -212.35313415527344, -206.61590576171875, -200.87867736816406, -195.14144897460938, -189.40420532226562, -183.66697692871094, -177.92974853515625, -172.1925048828125, -166.4552764892578, -160.71804809570312, -154.98081970214844, -149.24359130859375, -143.50636291503906, -137.76913452148438, -132.0319061279297, -126.29467010498047, -120.55743408203125, -114.82020568847656, -109.08297729492188, -103.34574890136719, -97.60851287841797, -91.87128448486328, -86.13404846191406, -80.39682006835938, -74.65959167480469, -68.92235565185547, -63.18512725830078, -57.44789505004883, -51.710662841796875, -45.97343063354492, -40.23619842529297, -34.49897003173828, -28.761737823486328, -23.024505615234375, -17.287277221679688, -11.550045013427734, -5.812812805175781, -0.07558155059814453, 5.661649703979492, 11.398880004882812, 17.136112213134766, 22.87334442138672, 28.610572814941406, 34.34780502319336, 40.08503723144531, 45.822269439697266, 51.55950164794922, 57.296730041503906, 63.03396224975586, 68.77119445800781, 74.5084228515625, 80.24565124511719, 85.9828872680664, 91.7201156616211, 97.45735168457031, 103.194580078125, 108.93180847167969, 114.6690444946289, 120.4062728881836, 126.14350891113281, 131.8807373046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 5.0, 3.0, 13.0, 8.0, 10.0, 14.0, 18.0, 16.0, 30.0, 28.0, 32.0, 39.0, 43.0, 35.0, 42.0, 56.0, 58.0, 50.0, 57.0, 39.0, 52.0, 40.0, 41.0, 37.0, 34.0, 40.0, 28.0, 28.0, 27.0, 14.0, 16.0, 8.0, 8.0, 3.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-63.07673645019531, -61.28229904174805, -59.48786163330078, -57.693424224853516, -55.89898681640625, -54.10455322265625, -52.31011199951172, -50.51567840576172, -48.72124099731445, -46.92680358886719, -45.13236618041992, -43.337928771972656, -41.54349136352539, -39.749053955078125, -37.954620361328125, -36.16018295288086, -34.365745544433594, -32.57130813598633, -30.776870727539062, -28.982433319091797, -27.187997817993164, -25.3935604095459, -23.599123001098633, -21.8046875, -20.01024627685547, -18.215808868408203, -16.421371459960938, -14.626935005187988, -12.832498550415039, -11.038061141967773, -9.243623733520508, -7.449187278747559, -5.654750823974609, -3.860313892364502, -2.0658767223358154, -0.2714395523071289, 1.5229973793029785, 3.317434310913086, 5.111871719360352, 6.906308174133301, 8.700745582580566, 10.495182991027832, 12.289619445800781, 14.084056854248047, 15.878494262695312, 17.672931671142578, 19.467369079589844, 21.261804580688477, 23.056241989135742, 24.850679397583008, 26.645116806030273, 28.439552307128906, 30.233989715576172, 32.02842712402344, 33.8228645324707, 35.61730194091797, 37.411739349365234, 39.2061767578125, 41.000614166259766, 42.79505157470703, 44.5894889831543, 46.38392639160156, 48.17835998535156, 49.97279739379883, 51.767234802246094]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 11.0, 10.0, 16.0, 18.0, 35.0, 49.0, 95.0, 140.0, 220.0, 438.0, 833.0, 1627.0, 3483.0, 8801.0, 25460.0, 95778.0, 392989.0, 384310.0, 93687.0, 25064.0, 8519.0, 3483.0, 1673.0, 775.0, 405.0, 224.0, 140.0, 79.0, 56.0, 36.0, 24.0, 8.0, 11.0, 12.0, 4.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-131.125, -127.150390625, -123.17578125, -119.201171875, -115.2265625, -111.251953125, -107.27734375, -103.302734375, -99.328125, -95.353515625, -91.37890625, -87.404296875, -83.4296875, -79.455078125, -75.48046875, -71.505859375, -67.53125, -63.556640625, -59.58203125, -55.607421875, -51.6328125, -47.658203125, -43.68359375, -39.708984375, -35.734375, -31.759765625, -27.78515625, -23.810546875, -19.8359375, -15.861328125, -11.88671875, -7.912109375, -3.9375, 0.037109375, 4.01171875, 7.986328125, 11.9609375, 15.935546875, 19.91015625, 23.884765625, 27.859375, 31.833984375, 35.80859375, 39.783203125, 43.7578125, 47.732421875, 51.70703125, 55.681640625, 59.65625, 63.630859375, 67.60546875, 71.580078125, 75.5546875, 79.529296875, 83.50390625, 87.478515625, 91.453125, 95.427734375, 99.40234375, 103.376953125, 107.3515625, 111.326171875, 115.30078125, 119.275390625, 123.25]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 25.0, 22.0, 28.0, 44.0, 39.0, 44.0, 48.0, 60.0, 54.0, 63.0, 62.0, 61.0, 56.0, 40.0, 42.0, 43.0, 46.0, 30.0, 25.0, 19.0, 16.0, 19.0, 12.0, 8.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.02978515625, -34.7158203125, -33.40185546875, -32.087890625, -30.77392578125, -29.4599609375, -28.14599609375, -26.83203125, -25.51806640625, -24.2041015625, -22.89013671875, -21.576171875, -20.26220703125, -18.9482421875, -17.63427734375, -16.3203125, -15.00634765625, -13.6923828125, -12.37841796875, -11.064453125, -9.75048828125, -8.4365234375, -7.12255859375, -5.80859375, -4.49462890625, -3.1806640625, -1.86669921875, -0.552734375, 0.76123046875, 2.0751953125, 3.38916015625, 4.703125, 6.01708984375, 7.3310546875, 8.64501953125, 9.958984375, 11.27294921875, 12.5869140625, 13.90087890625, 15.21484375, 16.52880859375, 17.8427734375, 19.15673828125, 20.470703125, 21.78466796875, 23.0986328125, 24.41259765625, 25.7265625, 27.04052734375, 28.3544921875, 29.66845703125, 30.982421875, 32.29638671875, 33.6103515625, 34.92431640625, 36.23828125, 37.55224609375, 38.8662109375, 40.18017578125, 41.494140625, 42.80810546875, 44.1220703125, 45.43603515625, 46.75]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 14.0, 16.0, 45.0, 69.0, 110.0, 195.0, 345.0, 759.0, 2007.0, 26142.0, 1001818.0, 13868.0, 1725.0, 670.0, 355.0, 177.0, 92.0, 52.0, 30.0, 26.0, 17.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.0, -623.875, -606.75, -589.625, -572.5, -555.375, -538.25, -521.125, -504.0, -486.875, -469.75, -452.625, -435.5, -418.375, -401.25, -384.125, -367.0, -349.875, -332.75, -315.625, -298.5, -281.375, -264.25, -247.125, -230.0, -212.875, -195.75, -178.625, -161.5, -144.375, -127.25, -110.125, -93.0, -75.875, -58.75, -41.625, -24.5, -7.375, 9.75, 26.875, 44.0, 61.125, 78.25, 95.375, 112.5, 129.625, 146.75, 163.875, 181.0, 198.125, 215.25, 232.375, 249.5, 266.625, 283.75, 300.875, 318.0, 335.125, 352.25, 369.375, 386.5, 403.625, 420.75, 437.875, 455.0]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 1.0, 7.0, 7.0, 10.0, 18.0, 9.0, 20.0, 30.0, 19.0, 28.0, 33.0, 27.0, 39.0, 52.0, 39.0, 46.0, 47.0, 38.0, 44.0, 33.0, 42.0, 34.0, 44.0, 27.0, 42.0, 36.0, 40.0, 32.0, 20.0, 15.0, 18.0, 19.0, 14.0, 13.0, 7.0, 6.0, 7.0, 10.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-183.25, -178.064453125, -172.87890625, -167.693359375, -162.5078125, -157.322265625, -152.13671875, -146.951171875, -141.765625, -136.580078125, -131.39453125, -126.208984375, -121.0234375, -115.837890625, -110.65234375, -105.466796875, -100.28125, -95.095703125, -89.91015625, -84.724609375, -79.5390625, -74.353515625, -69.16796875, -63.982421875, -58.796875, -53.611328125, -48.42578125, -43.240234375, -38.0546875, -32.869140625, -27.68359375, -22.498046875, -17.3125, -12.126953125, -6.94140625, -1.755859375, 3.4296875, 8.615234375, 13.80078125, 18.986328125, 24.171875, 29.357421875, 34.54296875, 39.728515625, 44.9140625, 50.099609375, 55.28515625, 60.470703125, 65.65625, 70.841796875, 76.02734375, 81.212890625, 86.3984375, 91.583984375, 96.76953125, 101.955078125, 107.140625, 112.326171875, 117.51171875, 122.697265625, 127.8828125, 133.068359375, 138.25390625, 143.439453125, 148.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 9.0, 8.0, 7.0, 10.0, 16.0, 24.0, 24.0, 30.0, 43.0, 53.0, 65.0, 102.0, 191.0, 369.0, 978.0, 6575.0, 913070.0, 122358.0, 3144.0, 693.0, 258.0, 131.0, 84.0, 68.0, 51.0, 39.0, 27.0, 25.0, 20.0, 19.0, 15.0, 6.0, 7.0, 4.0, 2.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-318.75, -309.046875, -299.34375, -289.640625, -279.9375, -270.234375, -260.53125, -250.828125, -241.125, -231.421875, -221.71875, -212.015625, -202.3125, -192.609375, -182.90625, -173.203125, -163.5, -153.796875, -144.09375, -134.390625, -124.6875, -114.984375, -105.28125, -95.578125, -85.875, -76.171875, -66.46875, -56.765625, -47.0625, -37.359375, -27.65625, -17.953125, -8.25, 1.453125, 11.15625, 20.859375, 30.5625, 40.265625, 49.96875, 59.671875, 69.375, 79.078125, 88.78125, 98.484375, 108.1875, 117.890625, 127.59375, 137.296875, 147.0, 156.703125, 166.40625, 176.109375, 185.8125, 195.515625, 205.21875, 214.921875, 224.625, 234.328125, 244.03125, 253.734375, 263.4375, 273.140625, 282.84375, 292.546875, 302.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 12.0, 18.0, 35.0, 50.0, 63.0, 131.0, 210.0, 164.0, 112.0, 84.0, 36.0, 20.0, 18.0, 10.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0137176513671875, -0.0131683349609375, -0.0126190185546875, -0.0120697021484375, -0.0115203857421875, -0.0109710693359375, -0.0104217529296875, -0.0098724365234375, -0.0093231201171875, -0.0087738037109375, -0.0082244873046875, -0.0076751708984375, -0.0071258544921875, -0.0065765380859375, -0.0060272216796875, -0.0054779052734375, -0.0049285888671875, -0.0043792724609375, -0.0038299560546875, -0.0032806396484375, -0.0027313232421875, -0.0021820068359375, -0.0016326904296875, -0.0010833740234375, -0.0005340576171875, 1.52587890625e-05, 0.0005645751953125, 0.0011138916015625, 0.0016632080078125, 0.0022125244140625, 0.0027618408203125, 0.0033111572265625, 0.0038604736328125, 0.0044097900390625, 0.0049591064453125, 0.0055084228515625, 0.0060577392578125, 0.0066070556640625, 0.0071563720703125, 0.0077056884765625, 0.0082550048828125, 0.0088043212890625, 0.0093536376953125, 0.0099029541015625, 0.0104522705078125, 0.0110015869140625, 0.0115509033203125, 0.0121002197265625, 0.0126495361328125, 0.0131988525390625, 0.0137481689453125, 0.0142974853515625, 0.0148468017578125, 0.0153961181640625, 0.0159454345703125, 0.0164947509765625, 0.0170440673828125, 0.0175933837890625, 0.0181427001953125, 0.0186920166015625, 0.0192413330078125, 0.0197906494140625, 0.0203399658203125, 0.0208892822265625, 0.0214385986328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 11.0, 9.0, 7.0, 18.0, 29.0, 41.0, 57.0, 91.0, 144.0, 254.0, 602.0, 1647.0, 6777.0, 69629.0, 943402.0, 20411.0, 3481.0, 1032.0, 381.0, 209.0, 99.0, 59.0, 43.0, 32.0, 19.0, 21.0, 16.0, 8.0, 6.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.0, -208.74609375, -200.4921875, -192.23828125, -183.984375, -175.73046875, -167.4765625, -159.22265625, -150.96875, -142.71484375, -134.4609375, -126.20703125, -117.953125, -109.69921875, -101.4453125, -93.19140625, -84.9375, -76.68359375, -68.4296875, -60.17578125, -51.921875, -43.66796875, -35.4140625, -27.16015625, -18.90625, -10.65234375, -2.3984375, 5.85546875, 14.109375, 22.36328125, 30.6171875, 38.87109375, 47.125, 55.37890625, 63.6328125, 71.88671875, 80.140625, 88.39453125, 96.6484375, 104.90234375, 113.15625, 121.41015625, 129.6640625, 137.91796875, 146.171875, 154.42578125, 162.6796875, 170.93359375, 179.1875, 187.44140625, 195.6953125, 203.94921875, 212.203125, 220.45703125, 228.7109375, 236.96484375, 245.21875, 253.47265625, 261.7265625, 269.98046875, 278.234375, 286.48828125, 294.7421875, 302.99609375, 311.25]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 4.0, 13.0, 21.0, 16.0, 18.0, 24.0, 47.0, 76.0, 134.0, 133.0, 162.0, 106.0, 67.0, 43.0, 33.0, 21.0, 15.0, 20.0, 8.0, 4.0, 4.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.25, -127.658203125, -123.06640625, -118.474609375, -113.8828125, -109.291015625, -104.69921875, -100.107421875, -95.515625, -90.923828125, -86.33203125, -81.740234375, -77.1484375, -72.556640625, -67.96484375, -63.373046875, -58.78125, -54.189453125, -49.59765625, -45.005859375, -40.4140625, -35.822265625, -31.23046875, -26.638671875, -22.046875, -17.455078125, -12.86328125, -8.271484375, -3.6796875, 0.912109375, 5.50390625, 10.095703125, 14.6875, 19.279296875, 23.87109375, 28.462890625, 33.0546875, 37.646484375, 42.23828125, 46.830078125, 51.421875, 56.013671875, 60.60546875, 65.197265625, 69.7890625, 74.380859375, 78.97265625, 83.564453125, 88.15625, 92.748046875, 97.33984375, 101.931640625, 106.5234375, 111.115234375, 115.70703125, 120.298828125, 124.890625, 129.482421875, 134.07421875, 138.666015625, 143.2578125, 147.849609375, 152.44140625, 157.033203125, 161.625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 13.0, 126.0, 532.0, 290.0, 30.0, 10.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3490.555908203125, -3336.560546875, -3182.56494140625, -3028.5693359375, -2874.573974609375, -2720.57861328125, -2566.5830078125, -2412.58740234375, -2258.592041015625, -2104.5966796875, -1950.60107421875, -1796.6055908203125, -1642.610107421875, -1488.6146240234375, -1334.619140625, -1180.6236572265625, -1026.628173828125, -872.6326904296875, -718.63720703125, -564.6417236328125, -410.646240234375, -256.6507568359375, -102.6552734375, 51.3402099609375, 205.335693359375, 359.3311767578125, 513.32666015625, 667.3221435546875, 821.317626953125, 975.3131103515625, 1129.30859375, 1283.3040771484375, 1437.2998046875, 1591.2952880859375, 1745.290771484375, 1899.2862548828125, 2053.28173828125, 2207.27734375, 2361.272705078125, 2515.26806640625, 2669.263671875, 2823.25927734375, 2977.254638671875, 3131.25, 3285.24560546875, 3439.2412109375, 3593.236572265625, 3747.23193359375, 3901.2275390625, 4055.22314453125, 4209.21875, 4363.2138671875, 4517.20947265625, 4671.205078125, 4825.2001953125, 4979.19580078125, 5133.19140625, 5287.18701171875, 5441.1826171875, 5595.177734375, 5749.17333984375, 5903.1689453125, 6057.1640625, 6211.15966796875, 6365.1552734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 8.0, 9.0, 17.0, 17.0, 15.0, 25.0, 30.0, 24.0, 42.0, 34.0, 31.0, 57.0, 72.0, 49.0, 44.0, 50.0, 58.0, 53.0, 47.0, 40.0, 40.0, 38.0, 28.0, 36.0, 24.0, 13.0, 22.0, 14.0, 4.0, 10.0, 4.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1033.558349609375, -1004.7240600585938, -975.8897705078125, -947.0555419921875, -918.2212524414062, -889.386962890625, -860.5526733398438, -831.7183837890625, -802.8841552734375, -774.0498657226562, -745.215576171875, -716.38134765625, -687.5470581054688, -658.7127685546875, -629.8784790039062, -601.044189453125, -572.2099609375, -543.3756713867188, -514.5413818359375, -485.7071228027344, -456.87286376953125, -428.03857421875, -399.20428466796875, -370.3700256347656, -341.53570556640625, -312.701416015625, -283.8671569824219, -255.03286743164062, -226.1986083984375, -197.36431884765625, -168.53004455566406, -139.69577026367188, -110.86151123046875, -82.02723693847656, -53.19295883178711, -24.358680725097656, 4.475593566894531, 33.30987548828125, 62.14414978027344, 90.97842407226562, 119.81269836425781, 148.64697265625, 177.4812469482422, 206.31552124023438, 235.14981079101562, 263.98406982421875, 292.818359375, 321.65264892578125, 350.4869079589844, 379.3211975097656, 408.15545654296875, 436.98974609375, 465.8240051269531, 494.6582946777344, 523.4925537109375, 552.3268432617188, 581.1611328125, 609.9954223632812, 638.8297119140625, 667.6639404296875, 696.4982299804688, 725.33251953125, 754.1668090820312, 783.0010986328125, 811.8353271484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 20.0, 24.0, 37.0, 46.0, 98.0, 156.0, 290.0, 541.0, 1015.0, 2402.0, 5668.0, 17883.0, 123069.0, 3992427.0, 35130.0, 8975.0, 3460.0, 1484.0, 708.0, 342.0, 179.0, 110.0, 50.0, 44.0, 21.0, 16.0, 15.0, 11.0, 7.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-109.75, -106.54296875, -103.3359375, -100.12890625, -96.921875, -93.71484375, -90.5078125, -87.30078125, -84.09375, -80.88671875, -77.6796875, -74.47265625, -71.265625, -68.05859375, -64.8515625, -61.64453125, -58.4375, -55.23046875, -52.0234375, -48.81640625, -45.609375, -42.40234375, -39.1953125, -35.98828125, -32.78125, -29.57421875, -26.3671875, -23.16015625, -19.953125, -16.74609375, -13.5390625, -10.33203125, -7.125, -3.91796875, -0.7109375, 2.49609375, 5.703125, 8.91015625, 12.1171875, 15.32421875, 18.53125, 21.73828125, 24.9453125, 28.15234375, 31.359375, 34.56640625, 37.7734375, 40.98046875, 44.1875, 47.39453125, 50.6015625, 53.80859375, 57.015625, 60.22265625, 63.4296875, 66.63671875, 69.84375, 73.05078125, 76.2578125, 79.46484375, 82.671875, 85.87890625, 89.0859375, 92.29296875, 95.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 9.0, 26.0, 44.0, 64.0, 81.0, 69.0, 103.0, 98.0, 103.0, 93.0, 88.0, 46.0, 54.0, 29.0, 20.0, 19.0, 13.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-92.5, -90.17333984375, -87.8466796875, -85.52001953125, -83.193359375, -80.86669921875, -78.5400390625, -76.21337890625, -73.88671875, -71.56005859375, -69.2333984375, -66.90673828125, -64.580078125, -62.25341796875, -59.9267578125, -57.60009765625, -55.2734375, -52.94677734375, -50.6201171875, -48.29345703125, -45.966796875, -43.64013671875, -41.3134765625, -38.98681640625, -36.66015625, -34.33349609375, -32.0068359375, -29.68017578125, -27.353515625, -25.02685546875, -22.7001953125, -20.37353515625, -18.046875, -15.72021484375, -13.3935546875, -11.06689453125, -8.740234375, -6.41357421875, -4.0869140625, -1.76025390625, 0.56640625, 2.89306640625, 5.2197265625, 7.54638671875, 9.873046875, 12.19970703125, 14.5263671875, 16.85302734375, 19.1796875, 21.50634765625, 23.8330078125, 26.15966796875, 28.486328125, 30.81298828125, 33.1396484375, 35.46630859375, 37.79296875, 40.11962890625, 42.4462890625, 44.77294921875, 47.099609375, 49.42626953125, 51.7529296875, 54.07958984375, 56.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 7.0, 10.0, 16.0, 11.0, 4.0, 13.0, 22.0, 23.0, 39.0, 36.0, 62.0, 95.0, 229.0, 469.0, 1182.0, 3763.0, 27866.0, 4103345.0, 49513.0, 5099.0, 1335.0, 529.0, 202.0, 125.0, 84.0, 54.0, 30.0, 20.0, 16.0, 20.0, 12.0, 15.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-266.0, -258.923828125, -251.84765625, -244.771484375, -237.6953125, -230.619140625, -223.54296875, -216.466796875, -209.390625, -202.314453125, -195.23828125, -188.162109375, -181.0859375, -174.009765625, -166.93359375, -159.857421875, -152.78125, -145.705078125, -138.62890625, -131.552734375, -124.4765625, -117.400390625, -110.32421875, -103.248046875, -96.171875, -89.095703125, -82.01953125, -74.943359375, -67.8671875, -60.791015625, -53.71484375, -46.638671875, -39.5625, -32.486328125, -25.41015625, -18.333984375, -11.2578125, -4.181640625, 2.89453125, 9.970703125, 17.046875, 24.123046875, 31.19921875, 38.275390625, 45.3515625, 52.427734375, 59.50390625, 66.580078125, 73.65625, 80.732421875, 87.80859375, 94.884765625, 101.9609375, 109.037109375, 116.11328125, 123.189453125, 130.265625, 137.341796875, 144.41796875, 151.494140625, 158.5703125, 165.646484375, 172.72265625, 179.798828125, 186.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 10.0, 13.0, 42.0, 90.0, 3266.0, 509.0, 80.0, 27.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-143.875, -140.740234375, -137.60546875, -134.470703125, -131.3359375, -128.201171875, -125.06640625, -121.931640625, -118.796875, -115.662109375, -112.52734375, -109.392578125, -106.2578125, -103.123046875, -99.98828125, -96.853515625, -93.71875, -90.583984375, -87.44921875, -84.314453125, -81.1796875, -78.044921875, -74.91015625, -71.775390625, -68.640625, -65.505859375, -62.37109375, -59.236328125, -56.1015625, -52.966796875, -49.83203125, -46.697265625, -43.5625, -40.427734375, -37.29296875, -34.158203125, -31.0234375, -27.888671875, -24.75390625, -21.619140625, -18.484375, -15.349609375, -12.21484375, -9.080078125, -5.9453125, -2.810546875, 0.32421875, 3.458984375, 6.59375, 9.728515625, 12.86328125, 15.998046875, 19.1328125, 22.267578125, 25.40234375, 28.537109375, 31.671875, 34.806640625, 37.94140625, 41.076171875, 44.2109375, 47.345703125, 50.48046875, 53.615234375, 56.75]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 14.0, 29.0, 143.0, 317.0, 298.0, 145.0, 32.0, 17.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1023.88720703125, -1005.2698364257812, -986.6524658203125, -968.0350952148438, -949.417724609375, -930.8003540039062, -912.1829833984375, -893.5656127929688, -874.9482421875, -856.3308715820312, -837.7135009765625, -819.0961303710938, -800.478759765625, -781.8613891601562, -763.2440185546875, -744.6266479492188, -726.00927734375, -707.3919067382812, -688.7745361328125, -670.1571655273438, -651.539794921875, -632.9224243164062, -614.3050537109375, -595.6876831054688, -577.0703125, -558.4529418945312, -539.8355712890625, -521.2182006835938, -502.600830078125, -483.98345947265625, -465.3660888671875, -446.74871826171875, -428.13140869140625, -409.5140380859375, -390.89666748046875, -372.279296875, -353.66192626953125, -335.0445556640625, -316.42718505859375, -297.809814453125, -279.19244384765625, -260.5750732421875, -241.95770263671875, -223.34033203125, -204.72296142578125, -186.1055908203125, -167.48822021484375, -148.870849609375, -130.25347900390625, -111.6361083984375, -93.01873779296875, -74.4013671875, -55.78399658203125, -37.1666259765625, -18.54925537109375, 0.068115234375, 18.68548583984375, 37.3028564453125, 55.92022705078125, 74.53759765625, 93.15496826171875, 111.7723388671875, 130.38970947265625, 149.007080078125, 167.62445068359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 12.0, 21.0, 25.0, 31.0, 33.0, 59.0, 65.0, 78.0, 81.0, 95.0, 89.0, 86.0, 79.0, 67.0, 43.0, 36.0, 34.0, 26.0, 15.0, 14.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.74136352539062, -236.0111846923828, -227.28102111816406, -218.55084228515625, -209.8206787109375, -201.0904998779297, -192.36032104492188, -183.63015747070312, -174.8999786376953, -166.1697998046875, -157.43963623046875, -148.70945739746094, -139.97927856445312, -131.24911499023438, -122.51893615722656, -113.78876495361328, -105.05859375, -96.32842254638672, -87.59825134277344, -78.86807250976562, -70.13790130615234, -61.40773010253906, -52.677555084228516, -43.94738006591797, -35.21720886230469, -26.487035751342773, -17.75686264038086, -9.026689529418945, -0.29651641845703125, 8.43365478515625, 17.163829803466797, 25.894004821777344, 34.62420654296875, 43.35437774658203, 52.08455276489258, 60.814727783203125, 69.5448989868164, 78.27507019042969, 87.0052490234375, 95.73542022705078, 104.46559143066406, 113.19576263427734, 121.92593383789062, 130.65611267089844, 139.38629150390625, 148.116455078125, 156.8466339111328, 165.57681274414062, 174.30697631835938, 183.0371551513672, 191.76731872558594, 200.49749755859375, 209.2276611328125, 217.9578399658203, 226.68801879882812, 235.41818237304688, 244.1483612060547, 252.8785400390625, 261.60870361328125, 270.3388671875, 279.0690612792969, 287.7992248535156, 296.5293884277344, 305.25958251953125, 313.98974609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 3.0, 6.0, 1.0, 11.0, 15.0, 32.0, 33.0, 43.0, 73.0, 130.0, 168.0, 298.0, 540.0, 932.0, 1723.0, 3957.0, 10667.0, 40975.0, 250033.0, 572525.0, 128693.0, 24142.0, 7305.0, 2961.0, 1360.0, 795.0, 424.0, 225.0, 154.0, 110.0, 66.0, 40.0, 29.0, 23.0, 17.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-165.0, -160.048828125, -155.09765625, -150.146484375, -145.1953125, -140.244140625, -135.29296875, -130.341796875, -125.390625, -120.439453125, -115.48828125, -110.537109375, -105.5859375, -100.634765625, -95.68359375, -90.732421875, -85.78125, -80.830078125, -75.87890625, -70.927734375, -65.9765625, -61.025390625, -56.07421875, -51.123046875, -46.171875, -41.220703125, -36.26953125, -31.318359375, -26.3671875, -21.416015625, -16.46484375, -11.513671875, -6.5625, -1.611328125, 3.33984375, 8.291015625, 13.2421875, 18.193359375, 23.14453125, 28.095703125, 33.046875, 37.998046875, 42.94921875, 47.900390625, 52.8515625, 57.802734375, 62.75390625, 67.705078125, 72.65625, 77.607421875, 82.55859375, 87.509765625, 92.4609375, 97.412109375, 102.36328125, 107.314453125, 112.265625, 117.216796875, 122.16796875, 127.119140625, 132.0703125, 137.021484375, 141.97265625, 146.923828125, 151.875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 3.0, 8.0, 16.0, 14.0, 21.0, 27.0, 39.0, 60.0, 65.0, 77.0, 81.0, 103.0, 83.0, 76.0, 74.0, 59.0, 49.0, 41.0, 30.0, 21.0, 15.0, 7.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.25, -81.1103515625, -78.970703125, -76.8310546875, -74.69140625, -72.5517578125, -70.412109375, -68.2724609375, -66.1328125, -63.9931640625, -61.853515625, -59.7138671875, -57.57421875, -55.4345703125, -53.294921875, -51.1552734375, -49.015625, -46.8759765625, -44.736328125, -42.5966796875, -40.45703125, -38.3173828125, -36.177734375, -34.0380859375, -31.8984375, -29.7587890625, -27.619140625, -25.4794921875, -23.33984375, -21.2001953125, -19.060546875, -16.9208984375, -14.78125, -12.6416015625, -10.501953125, -8.3623046875, -6.22265625, -4.0830078125, -1.943359375, 0.1962890625, 2.3359375, 4.4755859375, 6.615234375, 8.7548828125, 10.89453125, 13.0341796875, 15.173828125, 17.3134765625, 19.453125, 21.5927734375, 23.732421875, 25.8720703125, 28.01171875, 30.1513671875, 32.291015625, 34.4306640625, 36.5703125, 38.7099609375, 40.849609375, 42.9892578125, 45.12890625, 47.2685546875, 49.408203125, 51.5478515625, 53.6875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 5.0, 10.0, 9.0, 26.0, 46.0, 55.0, 72.0, 89.0, 150.0, 234.0, 451.0, 682.0, 1419.0, 3742.0, 18116.0, 531906.0, 467796.0, 16973.0, 3547.0, 1418.0, 697.0, 411.0, 224.0, 153.0, 97.0, 70.0, 40.0, 34.0, 15.0, 21.0, 6.0, 7.0, 6.0, 10.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5, -280.72265625, -271.9453125, -263.16796875, -254.390625, -245.61328125, -236.8359375, -228.05859375, -219.28125, -210.50390625, -201.7265625, -192.94921875, -184.171875, -175.39453125, -166.6171875, -157.83984375, -149.0625, -140.28515625, -131.5078125, -122.73046875, -113.953125, -105.17578125, -96.3984375, -87.62109375, -78.84375, -70.06640625, -61.2890625, -52.51171875, -43.734375, -34.95703125, -26.1796875, -17.40234375, -8.625, 0.15234375, 8.9296875, 17.70703125, 26.484375, 35.26171875, 44.0390625, 52.81640625, 61.59375, 70.37109375, 79.1484375, 87.92578125, 96.703125, 105.48046875, 114.2578125, 123.03515625, 131.8125, 140.58984375, 149.3671875, 158.14453125, 166.921875, 175.69921875, 184.4765625, 193.25390625, 202.03125, 210.80859375, 219.5859375, 228.36328125, 237.140625, 245.91796875, 254.6953125, 263.47265625, 272.25]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 13.0, 18.0, 27.0, 31.0, 51.0, 64.0, 64.0, 93.0, 112.0, 101.0, 83.0, 85.0, 84.0, 61.0, 35.0, 27.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-485.25, -474.462890625, -463.67578125, -452.888671875, -442.1015625, -431.314453125, -420.52734375, -409.740234375, -398.953125, -388.166015625, -377.37890625, -366.591796875, -355.8046875, -345.017578125, -334.23046875, -323.443359375, -312.65625, -301.869140625, -291.08203125, -280.294921875, -269.5078125, -258.720703125, -247.93359375, -237.146484375, -226.359375, -215.572265625, -204.78515625, -193.998046875, -183.2109375, -172.423828125, -161.63671875, -150.849609375, -140.0625, -129.275390625, -118.48828125, -107.701171875, -96.9140625, -86.126953125, -75.33984375, -64.552734375, -53.765625, -42.978515625, -32.19140625, -21.404296875, -10.6171875, 0.169921875, 10.95703125, 21.744140625, 32.53125, 43.318359375, 54.10546875, 64.892578125, 75.6796875, 86.466796875, 97.25390625, 108.041015625, 118.828125, 129.615234375, 140.40234375, 151.189453125, 161.9765625, 172.763671875, 183.55078125, 194.337890625, 205.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 9.0, 4.0, 8.0, 7.0, 13.0, 18.0, 12.0, 22.0, 32.0, 38.0, 55.0, 68.0, 96.0, 179.0, 342.0, 670.0, 1972.0, 10057.0, 221397.0, 785068.0, 23173.0, 3300.0, 926.0, 394.0, 206.0, 140.0, 75.0, 53.0, 54.0, 36.0, 20.0, 24.0, 16.0, 10.0, 10.0, 2.0, 6.0, 7.0, 6.0, 5.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-108.25, -104.9873046875, -101.724609375, -98.4619140625, -95.19921875, -91.9365234375, -88.673828125, -85.4111328125, -82.1484375, -78.8857421875, -75.623046875, -72.3603515625, -69.09765625, -65.8349609375, -62.572265625, -59.3095703125, -56.046875, -52.7841796875, -49.521484375, -46.2587890625, -42.99609375, -39.7333984375, -36.470703125, -33.2080078125, -29.9453125, -26.6826171875, -23.419921875, -20.1572265625, -16.89453125, -13.6318359375, -10.369140625, -7.1064453125, -3.84375, -0.5810546875, 2.681640625, 5.9443359375, 9.20703125, 12.4697265625, 15.732421875, 18.9951171875, 22.2578125, 25.5205078125, 28.783203125, 32.0458984375, 35.30859375, 38.5712890625, 41.833984375, 45.0966796875, 48.359375, 51.6220703125, 54.884765625, 58.1474609375, 61.41015625, 64.6728515625, 67.935546875, 71.1982421875, 74.4609375, 77.7236328125, 80.986328125, 84.2490234375, 87.51171875, 90.7744140625, 94.037109375, 97.2998046875, 100.5625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 0.0, 6.0, 7.0, 8.0, 6.0, 12.0, 17.0, 16.0, 22.0, 45.0, 59.0, 70.0, 82.0, 124.0, 113.0, 105.0, 78.0, 51.0, 44.0, 23.0, 31.0, 17.0, 18.0, 11.0, 4.0, 7.0, 3.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00843048095703125, -0.008150339126586914, -0.007870197296142578, -0.007590055465698242, -0.007309913635253906, -0.00702977180480957, -0.006749629974365234, -0.0064694881439208984, -0.0061893463134765625, -0.0059092044830322266, -0.005629062652587891, -0.005348920822143555, -0.005068778991699219, -0.004788637161254883, -0.004508495330810547, -0.004228353500366211, -0.003948211669921875, -0.003668069839477539, -0.003387928009033203, -0.003107786178588867, -0.0028276443481445312, -0.0025475025177001953, -0.0022673606872558594, -0.0019872188568115234, -0.0017070770263671875, -0.0014269351959228516, -0.0011467933654785156, -0.0008666515350341797, -0.0005865097045898438, -0.0003063678741455078, -2.6226043701171875e-05, 0.00025391578674316406, 0.0005340576171875, 0.0008141994476318359, 0.0010943412780761719, 0.0013744831085205078, 0.0016546249389648438, 0.0019347667694091797, 0.0022149085998535156, 0.0024950504302978516, 0.0027751922607421875, 0.0030553340911865234, 0.0033354759216308594, 0.0036156177520751953, 0.0038957595825195312, 0.004175901412963867, 0.004456043243408203, 0.004736185073852539, 0.005016326904296875, 0.005296468734741211, 0.005576610565185547, 0.005856752395629883, 0.006136894226074219, 0.006417036056518555, 0.006697177886962891, 0.0069773197174072266, 0.0072574615478515625, 0.0075376033782958984, 0.007817745208740234, 0.00809788703918457, 0.008378028869628906, 0.008658170700073242, 0.008938312530517578, 0.009218454360961914, 0.00949859619140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 8.0, 5.0, 6.0, 10.0, 17.0, 19.0, 49.0, 65.0, 111.0, 240.0, 448.0, 1016.0, 2542.0, 8130.0, 56474.0, 914908.0, 52286.0, 7779.0, 2475.0, 981.0, 450.0, 184.0, 118.0, 70.0, 43.0, 27.0, 18.0, 17.0, 8.0, 11.0, 5.0, 8.0, 4.0, 2.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-151.625, -147.580078125, -143.53515625, -139.490234375, -135.4453125, -131.400390625, -127.35546875, -123.310546875, -119.265625, -115.220703125, -111.17578125, -107.130859375, -103.0859375, -99.041015625, -94.99609375, -90.951171875, -86.90625, -82.861328125, -78.81640625, -74.771484375, -70.7265625, -66.681640625, -62.63671875, -58.591796875, -54.546875, -50.501953125, -46.45703125, -42.412109375, -38.3671875, -34.322265625, -30.27734375, -26.232421875, -22.1875, -18.142578125, -14.09765625, -10.052734375, -6.0078125, -1.962890625, 2.08203125, 6.126953125, 10.171875, 14.216796875, 18.26171875, 22.306640625, 26.3515625, 30.396484375, 34.44140625, 38.486328125, 42.53125, 46.576171875, 50.62109375, 54.666015625, 58.7109375, 62.755859375, 66.80078125, 70.845703125, 74.890625, 78.935546875, 82.98046875, 87.025390625, 91.0703125, 95.115234375, 99.16015625, 103.205078125, 107.25]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 7.0, 7.0, 19.0, 36.0, 62.0, 106.0, 180.0, 183.0, 136.0, 94.0, 60.0, 42.0, 13.0, 13.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.75, -84.15234375, -80.5546875, -76.95703125, -73.359375, -69.76171875, -66.1640625, -62.56640625, -58.96875, -55.37109375, -51.7734375, -48.17578125, -44.578125, -40.98046875, -37.3828125, -33.78515625, -30.1875, -26.58984375, -22.9921875, -19.39453125, -15.796875, -12.19921875, -8.6015625, -5.00390625, -1.40625, 2.19140625, 5.7890625, 9.38671875, 12.984375, 16.58203125, 20.1796875, 23.77734375, 27.375, 30.97265625, 34.5703125, 38.16796875, 41.765625, 45.36328125, 48.9609375, 52.55859375, 56.15625, 59.75390625, 63.3515625, 66.94921875, 70.546875, 74.14453125, 77.7421875, 81.33984375, 84.9375, 88.53515625, 92.1328125, 95.73046875, 99.328125, 102.92578125, 106.5234375, 110.12109375, 113.71875, 117.31640625, 120.9140625, 124.51171875, 128.109375, 131.70703125, 135.3046875, 138.90234375, 142.5]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 14.0, 44.0, 94.0, 219.0, 281.0, 180.0, 93.0, 33.0, 18.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3132.603515625, -3066.642822265625, -3000.681884765625, -2934.72119140625, -2868.76025390625, -2802.799560546875, -2736.838623046875, -2670.8779296875, -2604.9169921875, -2538.956298828125, -2472.995361328125, -2407.03466796875, -2341.07373046875, -2275.113037109375, -2209.152099609375, -2143.19140625, -2077.23046875, -2011.2696533203125, -1945.308837890625, -1879.3480224609375, -1813.38720703125, -1747.4263916015625, -1681.465576171875, -1615.5048828125, -1549.544189453125, -1483.5833740234375, -1417.62255859375, -1351.6617431640625, -1285.700927734375, -1219.7401123046875, -1153.779296875, -1087.818603515625, -1021.857666015625, -955.8968505859375, -889.93603515625, -823.9752197265625, -758.014404296875, -692.0535888671875, -626.0928344726562, -560.1320190429688, -494.17120361328125, -428.21038818359375, -362.24957275390625, -296.2887878417969, -230.32797241210938, -164.36715698242188, -98.4063720703125, -32.445556640625, 33.5152587890625, 99.47606658935547, 165.43687438964844, 231.39767456054688, 297.3584899902344, 363.3193054199219, 429.28009033203125, 495.24090576171875, 561.2017211914062, 627.1625366210938, 693.1233520507812, 759.0841064453125, 825.044921875, 891.0057373046875, 956.966552734375, 1022.9273681640625, 1088.88818359375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 7.0, 10.0, 11.0, 14.0, 23.0, 36.0, 41.0, 35.0, 56.0, 61.0, 60.0, 65.0, 75.0, 72.0, 56.0, 51.0, 53.0, 41.0, 43.0, 34.0, 37.0, 22.0, 23.0, 19.0, 9.0, 5.0, 10.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1139.2607421875, -1104.7119140625, -1070.1630859375, -1035.6141357421875, -1001.0653076171875, -966.5164794921875, -931.9675903320312, -897.418701171875, -862.869873046875, -828.321044921875, -793.7721557617188, -759.2232666015625, -724.6744384765625, -690.1256103515625, -655.5767211914062, -621.02783203125, -586.47900390625, -551.93017578125, -517.3812866210938, -482.8324279785156, -448.2835693359375, -413.7347106933594, -379.18585205078125, -344.6369934082031, -310.088134765625, -275.5392761230469, -240.99041748046875, -206.44155883789062, -171.8927001953125, -137.34384155273438, -102.79498291015625, -68.24612426757812, -33.6971435546875, 0.851715087890625, 35.40057373046875, 69.94943237304688, 104.498291015625, 139.04714965820312, 173.59600830078125, 208.14486694335938, 242.6937255859375, 277.2425842285156, 311.79144287109375, 346.3403015136719, 380.88916015625, 415.4380187988281, 449.98687744140625, 484.5357360839844, 519.0845947265625, 553.6334228515625, 588.1823120117188, 622.731201171875, 657.280029296875, 691.828857421875, 726.3777465820312, 760.9266357421875, 795.4754638671875, 830.0242919921875, 864.5731811523438, 899.1220703125, 933.6708984375, 968.2197265625, 1002.7686157226562, 1037.3175048828125, 1071.8663330078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 8.0, 4.0, 8.0, 12.0, 13.0, 11.0, 27.0, 30.0, 53.0, 76.0, 134.0, 216.0, 475.0, 1066.0, 3056.0, 11482.0, 72450.0, 3759963.0, 311821.0, 24527.0, 5647.0, 1700.0, 707.0, 317.0, 169.0, 99.0, 62.0, 36.0, 31.0, 17.0, 12.0, 6.0, 8.0, 6.0, 2.0, 6.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0], "bins": [-131.625, -127.197265625, -122.76953125, -118.341796875, -113.9140625, -109.486328125, -105.05859375, -100.630859375, -96.203125, -91.775390625, -87.34765625, -82.919921875, -78.4921875, -74.064453125, -69.63671875, -65.208984375, -60.78125, -56.353515625, -51.92578125, -47.498046875, -43.0703125, -38.642578125, -34.21484375, -29.787109375, -25.359375, -20.931640625, -16.50390625, -12.076171875, -7.6484375, -3.220703125, 1.20703125, 5.634765625, 10.0625, 14.490234375, 18.91796875, 23.345703125, 27.7734375, 32.201171875, 36.62890625, 41.056640625, 45.484375, 49.912109375, 54.33984375, 58.767578125, 63.1953125, 67.623046875, 72.05078125, 76.478515625, 80.90625, 85.333984375, 89.76171875, 94.189453125, 98.6171875, 103.044921875, 107.47265625, 111.900390625, 116.328125, 120.755859375, 125.18359375, 129.611328125, 134.0390625, 138.466796875, 142.89453125, 147.322265625, 151.75]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 6.0, 8.0, 5.0, 7.0, 23.0, 16.0, 23.0, 36.0, 32.0, 46.0, 49.0, 51.0, 47.0, 54.0, 67.0, 49.0, 51.0, 62.0, 50.0, 43.0, 49.0, 48.0, 31.0, 32.0, 29.0, 21.0, 14.0, 14.0, 10.0, 8.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.96875, -39.7138671875, -38.458984375, -37.2041015625, -35.94921875, -34.6943359375, -33.439453125, -32.1845703125, -30.9296875, -29.6748046875, -28.419921875, -27.1650390625, -25.91015625, -24.6552734375, -23.400390625, -22.1455078125, -20.890625, -19.6357421875, -18.380859375, -17.1259765625, -15.87109375, -14.6162109375, -13.361328125, -12.1064453125, -10.8515625, -9.5966796875, -8.341796875, -7.0869140625, -5.83203125, -4.5771484375, -3.322265625, -2.0673828125, -0.8125, 0.4423828125, 1.697265625, 2.9521484375, 4.20703125, 5.4619140625, 6.716796875, 7.9716796875, 9.2265625, 10.4814453125, 11.736328125, 12.9912109375, 14.24609375, 15.5009765625, 16.755859375, 18.0107421875, 19.265625, 20.5205078125, 21.775390625, 23.0302734375, 24.28515625, 25.5400390625, 26.794921875, 28.0498046875, 29.3046875, 30.5595703125, 31.814453125, 33.0693359375, 34.32421875, 35.5791015625, 36.833984375, 38.0888671875, 39.34375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 8.0, 17.0, 34.0, 48.0, 106.0, 186.0, 469.0, 1749.0, 10491.0, 174818.0, 3946128.0, 53394.0, 5230.0, 1020.0, 310.0, 111.0, 59.0, 30.0, 20.0, 10.0, 7.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.125, -121.494140625, -114.86328125, -108.232421875, -101.6015625, -94.970703125, -88.33984375, -81.708984375, -75.078125, -68.447265625, -61.81640625, -55.185546875, -48.5546875, -41.923828125, -35.29296875, -28.662109375, -22.03125, -15.400390625, -8.76953125, -2.138671875, 4.4921875, 11.123046875, 17.75390625, 24.384765625, 31.015625, 37.646484375, 44.27734375, 50.908203125, 57.5390625, 64.169921875, 70.80078125, 77.431640625, 84.0625, 90.693359375, 97.32421875, 103.955078125, 110.5859375, 117.216796875, 123.84765625, 130.478515625, 137.109375, 143.740234375, 150.37109375, 157.001953125, 163.6328125, 170.263671875, 176.89453125, 183.525390625, 190.15625, 196.787109375, 203.41796875, 210.048828125, 216.6796875, 223.310546875, 229.94140625, 236.572265625, 243.203125, 249.833984375, 256.46484375, 263.095703125, 269.7265625, 276.357421875, 282.98828125, 289.619140625, 296.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 10.0, 11.0, 15.0, 18.0, 21.0, 24.0, 50.0, 76.0, 122.0, 238.0, 718.0, 1598.0, 637.0, 206.0, 86.0, 70.0, 44.0, 44.0, 16.0, 11.0, 12.0, 11.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-133.5, -129.728515625, -125.95703125, -122.185546875, -118.4140625, -114.642578125, -110.87109375, -107.099609375, -103.328125, -99.556640625, -95.78515625, -92.013671875, -88.2421875, -84.470703125, -80.69921875, -76.927734375, -73.15625, -69.384765625, -65.61328125, -61.841796875, -58.0703125, -54.298828125, -50.52734375, -46.755859375, -42.984375, -39.212890625, -35.44140625, -31.669921875, -27.8984375, -24.126953125, -20.35546875, -16.583984375, -12.8125, -9.041015625, -5.26953125, -1.498046875, 2.2734375, 6.044921875, 9.81640625, 13.587890625, 17.359375, 21.130859375, 24.90234375, 28.673828125, 32.4453125, 36.216796875, 39.98828125, 43.759765625, 47.53125, 51.302734375, 55.07421875, 58.845703125, 62.6171875, 66.388671875, 70.16015625, 73.931640625, 77.703125, 81.474609375, 85.24609375, 89.017578125, 92.7890625, 96.560546875, 100.33203125, 104.103515625, 107.875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 12.0, 16.0, 54.0, 196.0, 411.0, 241.0, 41.0, 20.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3091.7822265625, -3024.01318359375, -2956.244384765625, -2888.475341796875, -2820.706298828125, -2752.9375, -2685.16845703125, -2617.3994140625, -2549.63037109375, -2481.861328125, -2414.092529296875, -2346.323486328125, -2278.554443359375, -2210.78564453125, -2143.0166015625, -2075.24755859375, -2007.478759765625, -1939.7098388671875, -1871.9407958984375, -1804.171875, -1736.40283203125, -1668.6339111328125, -1600.864990234375, -1533.095947265625, -1465.3270263671875, -1397.55810546875, -1329.7890625, -1262.0201416015625, -1194.251220703125, -1126.482177734375, -1058.7132568359375, -990.9442749023438, -923.175537109375, -855.4065551757812, -787.6375732421875, -719.86865234375, -652.0996704101562, -584.3306884765625, -516.561767578125, -448.79278564453125, -381.0238037109375, -313.25482177734375, -245.48587036132812, -177.71690368652344, -109.94793701171875, -42.178955078125, 25.589996337890625, 93.35894775390625, 161.1279296875, 228.8968963623047, 296.6658630371094, 364.434814453125, 432.20379638671875, 499.9727783203125, 567.74169921875, 635.5106811523438, 703.2796630859375, 771.0486450195312, 838.817626953125, 906.5865478515625, 974.3555297851562, 1042.12451171875, 1109.8934326171875, 1177.662353515625, 1245.431396484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 6.0, 2.0, 7.0, 14.0, 18.0, 17.0, 27.0, 23.0, 18.0, 24.0, 36.0, 33.0, 42.0, 39.0, 57.0, 44.0, 48.0, 44.0, 47.0, 51.0, 45.0, 39.0, 51.0, 32.0, 39.0, 38.0, 26.0, 23.0, 14.0, 24.0, 16.0, 12.0, 11.0, 5.0, 4.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0], "bins": [-602.1848754882812, -586.462646484375, -570.740478515625, -555.0182495117188, -539.2960205078125, -523.5737915039062, -507.8515930175781, -492.12939453125, -476.40716552734375, -460.6849670410156, -444.9627380371094, -429.24053955078125, -413.518310546875, -397.7961120605469, -382.0738830566406, -366.3516845703125, -350.62945556640625, -334.9072570800781, -319.1850280761719, -303.46282958984375, -287.7406005859375, -272.0184020996094, -256.2961730957031, -240.573974609375, -224.85177612304688, -209.1295623779297, -193.4073486328125, -177.6851348876953, -161.96292114257812, -146.24072265625, -130.51849365234375, -114.7962875366211, -99.07406616210938, -83.35185241699219, -67.629638671875, -51.90742874145508, -36.18521499633789, -20.46300506591797, -4.740791320800781, 10.981422424316406, 26.703636169433594, 42.42584991455078, 58.14806365966797, 73.87026977539062, 89.59248352050781, 105.314697265625, 121.03691101074219, 136.75912475585938, 152.48133850097656, 168.20355224609375, 183.92576599121094, 199.64797973632812, 215.3701934814453, 231.0924072265625, 246.81460571289062, 262.5368347167969, 278.259033203125, 293.9812316894531, 309.7034606933594, 325.4256591796875, 341.14788818359375, 356.8700866699219, 372.5923156738281, 388.31451416015625, 404.0367431640625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 18.0, 38.0, 69.0, 125.0, 246.0, 552.0, 1396.0, 4870.0, 28061.0, 379187.0, 582439.0, 42034.0, 6460.0, 1766.0, 654.0, 300.0, 142.0, 67.0, 29.0, 26.0, 16.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.125, -212.296875, -205.46875, -198.640625, -191.8125, -184.984375, -178.15625, -171.328125, -164.5, -157.671875, -150.84375, -144.015625, -137.1875, -130.359375, -123.53125, -116.703125, -109.875, -103.046875, -96.21875, -89.390625, -82.5625, -75.734375, -68.90625, -62.078125, -55.25, -48.421875, -41.59375, -34.765625, -27.9375, -21.109375, -14.28125, -7.453125, -0.625, 6.203125, 13.03125, 19.859375, 26.6875, 33.515625, 40.34375, 47.171875, 54.0, 60.828125, 67.65625, 74.484375, 81.3125, 88.140625, 94.96875, 101.796875, 108.625, 115.453125, 122.28125, 129.109375, 135.9375, 142.765625, 149.59375, 156.421875, 163.25, 170.078125, 176.90625, 183.734375, 190.5625, 197.390625, 204.21875, 211.046875, 217.875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 7.0, 5.0, 8.0, 11.0, 16.0, 22.0, 27.0, 30.0, 32.0, 30.0, 44.0, 60.0, 61.0, 58.0, 56.0, 55.0, 62.0, 53.0, 39.0, 51.0, 48.0, 47.0, 33.0, 22.0, 26.0, 16.0, 12.0, 16.0, 13.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.05712890625, -33.7705078125, -32.48388671875, -31.197265625, -29.91064453125, -28.6240234375, -27.33740234375, -26.05078125, -24.76416015625, -23.4775390625, -22.19091796875, -20.904296875, -19.61767578125, -18.3310546875, -17.04443359375, -15.7578125, -14.47119140625, -13.1845703125, -11.89794921875, -10.611328125, -9.32470703125, -8.0380859375, -6.75146484375, -5.46484375, -4.17822265625, -2.8916015625, -1.60498046875, -0.318359375, 0.96826171875, 2.2548828125, 3.54150390625, 4.828125, 6.11474609375, 7.4013671875, 8.68798828125, 9.974609375, 11.26123046875, 12.5478515625, 13.83447265625, 15.12109375, 16.40771484375, 17.6943359375, 18.98095703125, 20.267578125, 21.55419921875, 22.8408203125, 24.12744140625, 25.4140625, 26.70068359375, 27.9873046875, 29.27392578125, 30.560546875, 31.84716796875, 33.1337890625, 34.42041015625, 35.70703125, 36.99365234375, 38.2802734375, 39.56689453125, 40.853515625, 42.14013671875, 43.4267578125, 44.71337890625, 46.0]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 9.0, 6.0, 8.0, 20.0, 21.0, 29.0, 56.0, 85.0, 124.0, 258.0, 430.0, 830.0, 2172.0, 8703.0, 154857.0, 849077.0, 25320.0, 3881.0, 1281.0, 569.0, 308.0, 162.0, 117.0, 78.0, 47.0, 27.0, 25.0, 10.0, 12.0, 13.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-275.25, -265.50390625, -255.7578125, -246.01171875, -236.265625, -226.51953125, -216.7734375, -207.02734375, -197.28125, -187.53515625, -177.7890625, -168.04296875, -158.296875, -148.55078125, -138.8046875, -129.05859375, -119.3125, -109.56640625, -99.8203125, -90.07421875, -80.328125, -70.58203125, -60.8359375, -51.08984375, -41.34375, -31.59765625, -21.8515625, -12.10546875, -2.359375, 7.38671875, 17.1328125, 26.87890625, 36.625, 46.37109375, 56.1171875, 65.86328125, 75.609375, 85.35546875, 95.1015625, 104.84765625, 114.59375, 124.33984375, 134.0859375, 143.83203125, 153.578125, 163.32421875, 173.0703125, 182.81640625, 192.5625, 202.30859375, 212.0546875, 221.80078125, 231.546875, 241.29296875, 251.0390625, 260.78515625, 270.53125, 280.27734375, 290.0234375, 299.76953125, 309.515625, 319.26171875, 329.0078125, 338.75390625, 348.5]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 9.0, 5.0, 5.0, 12.0, 16.0, 16.0, 20.0, 19.0, 28.0, 28.0, 31.0, 40.0, 34.0, 55.0, 41.0, 44.0, 57.0, 44.0, 55.0, 49.0, 51.0, 49.0, 34.0, 30.0, 44.0, 30.0, 27.0, 19.0, 22.0, 16.0, 11.0, 11.0, 6.0, 7.0, 10.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-152.5, -147.4765625, -142.453125, -137.4296875, -132.40625, -127.3828125, -122.359375, -117.3359375, -112.3125, -107.2890625, -102.265625, -97.2421875, -92.21875, -87.1953125, -82.171875, -77.1484375, -72.125, -67.1015625, -62.078125, -57.0546875, -52.03125, -47.0078125, -41.984375, -36.9609375, -31.9375, -26.9140625, -21.890625, -16.8671875, -11.84375, -6.8203125, -1.796875, 3.2265625, 8.25, 13.2734375, 18.296875, 23.3203125, 28.34375, 33.3671875, 38.390625, 43.4140625, 48.4375, 53.4609375, 58.484375, 63.5078125, 68.53125, 73.5546875, 78.578125, 83.6015625, 88.625, 93.6484375, 98.671875, 103.6953125, 108.71875, 113.7421875, 118.765625, 123.7890625, 128.8125, 133.8359375, 138.859375, 143.8828125, 148.90625, 153.9296875, 158.953125, 163.9765625, 169.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 11.0, 8.0, 10.0, 17.0, 17.0, 29.0, 41.0, 62.0, 103.0, 210.0, 480.0, 1731.0, 12817.0, 1000879.0, 28516.0, 2380.0, 642.0, 268.0, 103.0, 69.0, 42.0, 24.0, 24.0, 17.0, 12.0, 12.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.75, -220.05859375, -212.3671875, -204.67578125, -196.984375, -189.29296875, -181.6015625, -173.91015625, -166.21875, -158.52734375, -150.8359375, -143.14453125, -135.453125, -127.76171875, -120.0703125, -112.37890625, -104.6875, -96.99609375, -89.3046875, -81.61328125, -73.921875, -66.23046875, -58.5390625, -50.84765625, -43.15625, -35.46484375, -27.7734375, -20.08203125, -12.390625, -4.69921875, 2.9921875, 10.68359375, 18.375, 26.06640625, 33.7578125, 41.44921875, 49.140625, 56.83203125, 64.5234375, 72.21484375, 79.90625, 87.59765625, 95.2890625, 102.98046875, 110.671875, 118.36328125, 126.0546875, 133.74609375, 141.4375, 149.12890625, 156.8203125, 164.51171875, 172.203125, 179.89453125, 187.5859375, 195.27734375, 202.96875, 210.66015625, 218.3515625, 226.04296875, 233.734375, 241.42578125, 249.1171875, 256.80859375, 264.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 17.0, 30.0, 55.0, 128.0, 263.0, 262.0, 129.0, 60.0, 21.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0266876220703125, -0.025855302810668945, -0.02502298355102539, -0.024190664291381836, -0.02335834503173828, -0.022526025772094727, -0.021693706512451172, -0.020861387252807617, -0.020029067993164062, -0.019196748733520508, -0.018364429473876953, -0.0175321102142334, -0.016699790954589844, -0.01586747169494629, -0.015035152435302734, -0.01420283317565918, -0.013370513916015625, -0.01253819465637207, -0.011705875396728516, -0.010873556137084961, -0.010041236877441406, -0.009208917617797852, -0.008376598358154297, -0.007544279098510742, -0.0067119598388671875, -0.005879640579223633, -0.005047321319580078, -0.0042150020599365234, -0.0033826828002929688, -0.002550363540649414, -0.0017180442810058594, -0.0008857250213623047, -5.340576171875e-05, 0.0007789134979248047, 0.0016112327575683594, 0.002443552017211914, 0.0032758712768554688, 0.0041081905364990234, 0.004940509796142578, 0.005772829055786133, 0.0066051483154296875, 0.007437467575073242, 0.008269786834716797, 0.009102106094360352, 0.009934425354003906, 0.010766744613647461, 0.011599063873291016, 0.01243138313293457, 0.013263702392578125, 0.01409602165222168, 0.014928340911865234, 0.01576066017150879, 0.016592979431152344, 0.0174252986907959, 0.018257617950439453, 0.019089937210083008, 0.019922256469726562, 0.020754575729370117, 0.021586894989013672, 0.022419214248657227, 0.02325153350830078, 0.024083852767944336, 0.02491617202758789, 0.025748491287231445, 0.026580810546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 13.0, 9.0, 18.0, 37.0, 29.0, 66.0, 86.0, 221.0, 480.0, 1260.0, 4983.0, 47196.0, 961710.0, 26760.0, 3736.0, 1057.0, 406.0, 176.0, 109.0, 67.0, 39.0, 21.0, 17.0, 9.0, 11.0, 9.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.625, -196.736328125, -190.84765625, -184.958984375, -179.0703125, -173.181640625, -167.29296875, -161.404296875, -155.515625, -149.626953125, -143.73828125, -137.849609375, -131.9609375, -126.072265625, -120.18359375, -114.294921875, -108.40625, -102.517578125, -96.62890625, -90.740234375, -84.8515625, -78.962890625, -73.07421875, -67.185546875, -61.296875, -55.408203125, -49.51953125, -43.630859375, -37.7421875, -31.853515625, -25.96484375, -20.076171875, -14.1875, -8.298828125, -2.41015625, 3.478515625, 9.3671875, 15.255859375, 21.14453125, 27.033203125, 32.921875, 38.810546875, 44.69921875, 50.587890625, 56.4765625, 62.365234375, 68.25390625, 74.142578125, 80.03125, 85.919921875, 91.80859375, 97.697265625, 103.5859375, 109.474609375, 115.36328125, 121.251953125, 127.140625, 133.029296875, 138.91796875, 144.806640625, 150.6953125, 156.583984375, 162.47265625, 168.361328125, 174.25]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 4.0, 10.0, 8.0, 11.0, 8.0, 17.0, 23.0, 24.0, 49.0, 93.0, 134.0, 135.0, 133.0, 114.0, 78.0, 44.0, 21.0, 19.0, 14.0, 6.0, 6.0, 11.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-109.75, -106.50390625, -103.2578125, -100.01171875, -96.765625, -93.51953125, -90.2734375, -87.02734375, -83.78125, -80.53515625, -77.2890625, -74.04296875, -70.796875, -67.55078125, -64.3046875, -61.05859375, -57.8125, -54.56640625, -51.3203125, -48.07421875, -44.828125, -41.58203125, -38.3359375, -35.08984375, -31.84375, -28.59765625, -25.3515625, -22.10546875, -18.859375, -15.61328125, -12.3671875, -9.12109375, -5.875, -2.62890625, 0.6171875, 3.86328125, 7.109375, 10.35546875, 13.6015625, 16.84765625, 20.09375, 23.33984375, 26.5859375, 29.83203125, 33.078125, 36.32421875, 39.5703125, 42.81640625, 46.0625, 49.30859375, 52.5546875, 55.80078125, 59.046875, 62.29296875, 65.5390625, 68.78515625, 72.03125, 75.27734375, 78.5234375, 81.76953125, 85.015625, 88.26171875, 91.5078125, 94.75390625, 98.0]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 12.0, 39.0, 127.0, 343.0, 313.0, 119.0, 33.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1218.513916015625, -1142.3702392578125, -1066.2266845703125, -990.0830078125, -913.939453125, -837.7957763671875, -761.6521606445312, -685.508544921875, -609.3649291992188, -533.2213134765625, -457.07769775390625, -380.9340515136719, -304.7904357910156, -228.64682006835938, -152.503173828125, -76.35955810546875, -0.2159423828125, 75.92768096923828, 152.07130432128906, 228.21493530273438, 304.3585510253906, 380.5021667480469, 456.64581298828125, 532.7894287109375, 608.9330444335938, 685.07666015625, 761.2202758789062, 837.3638916015625, 913.507568359375, 989.651123046875, 1065.7947998046875, 1141.9384765625, 1218.08203125, 1294.2257080078125, 1370.3692626953125, 1446.512939453125, 1522.656494140625, 1598.8001708984375, 1674.94384765625, 1751.08740234375, 1827.23095703125, 1903.3746337890625, 1979.5181884765625, 2055.661865234375, 2131.805419921875, 2207.948974609375, 2284.0927734375, 2360.236328125, 2436.3798828125, 2512.5234375, 2588.667236328125, 2664.810791015625, 2740.954345703125, 2817.097900390625, 2893.24169921875, 2969.38525390625, 3045.529052734375, 3121.672607421875, 3197.81640625, 3273.9599609375, 3350.103515625, 3426.2470703125, 3502.390869140625, 3578.534423828125, 3654.677978515625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 7.0, 4.0, 8.0, 12.0, 12.0, 14.0, 14.0, 21.0, 36.0, 18.0, 35.0, 39.0, 35.0, 51.0, 54.0, 62.0, 62.0, 69.0, 46.0, 60.0, 37.0, 56.0, 40.0, 29.0, 33.0, 26.0, 18.0, 24.0, 16.0, 11.0, 16.0, 5.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-765.71240234375, -741.8490600585938, -717.9856567382812, -694.122314453125, -670.2589111328125, -646.3955688476562, -622.5322265625, -598.6688232421875, -574.805419921875, -550.9420776367188, -527.0786743164062, -503.21533203125, -479.3519287109375, -455.48858642578125, -431.6252136230469, -407.7618408203125, -383.89849853515625, -360.0351257324219, -336.1717529296875, -312.30841064453125, -288.44500732421875, -264.5816650390625, -240.71829223632812, -216.85491943359375, -192.99154663085938, -169.128173828125, -145.26480102539062, -121.40144348144531, -97.53807067871094, -73.67469787597656, -49.81134033203125, -25.947967529296875, -2.08465576171875, 21.77871322631836, 45.64208221435547, 69.50544738769531, 93.36882019042969, 117.23219299316406, 141.09555053710938, 164.95892333984375, 188.82229614257812, 212.6856689453125, 236.54904174804688, 260.41241455078125, 284.2757568359375, 308.13916015625, 332.00250244140625, 355.8658752441406, 379.729248046875, 403.5926208496094, 427.45599365234375, 451.3193359375, 475.1827392578125, 499.04608154296875, 522.909423828125, 546.7728271484375, 570.63623046875, 594.4995727539062, 618.3629760742188, 642.226318359375, 666.0897216796875, 689.9530639648438, 713.81640625, 737.6798095703125, 761.5431518554688]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 8.0, 10.0, 10.0, 14.0, 17.0, 35.0, 55.0, 58.0, 98.0, 162.0, 282.0, 483.0, 1002.0, 2408.0, 7244.0, 32457.0, 577502.0, 3475254.0, 76796.0, 13405.0, 3927.0, 1484.0, 696.0, 333.0, 194.0, 110.0, 58.0, 64.0, 32.0, 24.0, 18.0, 7.0, 12.0, 6.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.5, -92.3388671875, -89.177734375, -86.0166015625, -82.85546875, -79.6943359375, -76.533203125, -73.3720703125, -70.2109375, -67.0498046875, -63.888671875, -60.7275390625, -57.56640625, -54.4052734375, -51.244140625, -48.0830078125, -44.921875, -41.7607421875, -38.599609375, -35.4384765625, -32.27734375, -29.1162109375, -25.955078125, -22.7939453125, -19.6328125, -16.4716796875, -13.310546875, -10.1494140625, -6.98828125, -3.8271484375, -0.666015625, 2.4951171875, 5.65625, 8.8173828125, 11.978515625, 15.1396484375, 18.30078125, 21.4619140625, 24.623046875, 27.7841796875, 30.9453125, 34.1064453125, 37.267578125, 40.4287109375, 43.58984375, 46.7509765625, 49.912109375, 53.0732421875, 56.234375, 59.3955078125, 62.556640625, 65.7177734375, 68.87890625, 72.0400390625, 75.201171875, 78.3623046875, 81.5234375, 84.6845703125, 87.845703125, 91.0068359375, 94.16796875, 97.3291015625, 100.490234375, 103.6513671875, 106.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 4.0, 9.0, 13.0, 28.0, 31.0, 40.0, 60.0, 64.0, 71.0, 91.0, 84.0, 91.0, 62.0, 66.0, 59.0, 55.0, 38.0, 40.0, 24.0, 20.0, 19.0, 5.0, 9.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.125, -60.3525390625, -58.580078125, -56.8076171875, -55.03515625, -53.2626953125, -51.490234375, -49.7177734375, -47.9453125, -46.1728515625, -44.400390625, -42.6279296875, -40.85546875, -39.0830078125, -37.310546875, -35.5380859375, -33.765625, -31.9931640625, -30.220703125, -28.4482421875, -26.67578125, -24.9033203125, -23.130859375, -21.3583984375, -19.5859375, -17.8134765625, -16.041015625, -14.2685546875, -12.49609375, -10.7236328125, -8.951171875, -7.1787109375, -5.40625, -3.6337890625, -1.861328125, -0.0888671875, 1.68359375, 3.4560546875, 5.228515625, 7.0009765625, 8.7734375, 10.5458984375, 12.318359375, 14.0908203125, 15.86328125, 17.6357421875, 19.408203125, 21.1806640625, 22.953125, 24.7255859375, 26.498046875, 28.2705078125, 30.04296875, 31.8154296875, 33.587890625, 35.3603515625, 37.1328125, 38.9052734375, 40.677734375, 42.4501953125, 44.22265625, 45.9951171875, 47.767578125, 49.5400390625, 51.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 15.0, 17.0, 28.0, 48.0, 96.0, 138.0, 297.0, 924.0, 3580.0, 20039.0, 304146.0, 3771930.0, 79422.0, 10385.0, 2173.0, 599.0, 202.0, 92.0, 55.0, 29.0, 30.0, 15.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1875, -110.6337890625, -106.080078125, -101.5263671875, -96.97265625, -92.4189453125, -87.865234375, -83.3115234375, -78.7578125, -74.2041015625, -69.650390625, -65.0966796875, -60.54296875, -55.9892578125, -51.435546875, -46.8818359375, -42.328125, -37.7744140625, -33.220703125, -28.6669921875, -24.11328125, -19.5595703125, -15.005859375, -10.4521484375, -5.8984375, -1.3447265625, 3.208984375, 7.7626953125, 12.31640625, 16.8701171875, 21.423828125, 25.9775390625, 30.53125, 35.0849609375, 39.638671875, 44.1923828125, 48.74609375, 53.2998046875, 57.853515625, 62.4072265625, 66.9609375, 71.5146484375, 76.068359375, 80.6220703125, 85.17578125, 89.7294921875, 94.283203125, 98.8369140625, 103.390625, 107.9443359375, 112.498046875, 117.0517578125, 121.60546875, 126.1591796875, 130.712890625, 135.2666015625, 139.8203125, 144.3740234375, 148.927734375, 153.4814453125, 158.03515625, 162.5888671875, 167.142578125, 171.6962890625, 176.25]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 2.0, 9.0, 12.0, 15.0, 39.0, 57.0, 121.0, 344.0, 1092.0, 1504.0, 491.0, 154.0, 85.0, 52.0, 31.0, 23.0, 15.0, 9.0, 4.0, 5.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-175.25, -171.0908203125, -166.931640625, -162.7724609375, -158.61328125, -154.4541015625, -150.294921875, -146.1357421875, -141.9765625, -137.8173828125, -133.658203125, -129.4990234375, -125.33984375, -121.1806640625, -117.021484375, -112.8623046875, -108.703125, -104.5439453125, -100.384765625, -96.2255859375, -92.06640625, -87.9072265625, -83.748046875, -79.5888671875, -75.4296875, -71.2705078125, -67.111328125, -62.9521484375, -58.79296875, -54.6337890625, -50.474609375, -46.3154296875, -42.15625, -37.9970703125, -33.837890625, -29.6787109375, -25.51953125, -21.3603515625, -17.201171875, -13.0419921875, -8.8828125, -4.7236328125, -0.564453125, 3.5947265625, 7.75390625, 11.9130859375, 16.072265625, 20.2314453125, 24.390625, 28.5498046875, 32.708984375, 36.8681640625, 41.02734375, 45.1865234375, 49.345703125, 53.5048828125, 57.6640625, 61.8232421875, 65.982421875, 70.1416015625, 74.30078125, 78.4599609375, 82.619140625, 86.7783203125, 90.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 9.0, 17.0, 29.0, 56.0, 107.0, 163.0, 196.0, 155.0, 124.0, 51.0, 25.0, 21.0, 5.0, 10.0, 5.0, 4.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-666.39501953125, -644.3047485351562, -622.2144165039062, -600.1241455078125, -578.0338134765625, -555.9435424804688, -533.853271484375, -511.762939453125, -489.6726379394531, -467.58233642578125, -445.4920349121094, -423.4017333984375, -401.31146240234375, -379.22113037109375, -357.130859375, -335.0405578613281, -312.95025634765625, -290.8599548339844, -268.7696533203125, -246.6793670654297, -224.5890655517578, -202.49876403808594, -180.40847778320312, -158.31817626953125, -136.22787475585938, -114.1375732421875, -92.04727935791016, -69.95698547363281, -47.86668395996094, -25.776382446289062, -3.68609619140625, 18.404205322265625, 40.4945068359375, 62.58480453491211, 84.67510223388672, 106.76539611816406, 128.85569763183594, 150.9459991455078, 173.03628540039062, 195.1265869140625, 217.21688842773438, 239.30718994140625, 261.3974914550781, 283.48779296875, 305.57806396484375, 327.66839599609375, 349.7586669921875, 371.8489685058594, 393.93927001953125, 416.0295715332031, 438.119873046875, 460.21014404296875, 482.30047607421875, 504.3907470703125, 526.4810791015625, 548.5713500976562, 570.66162109375, 592.7518920898438, 614.8422241210938, 636.9324951171875, 659.0228271484375, 681.1130981445312, 703.203369140625, 725.293701171875, 747.384033203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 10.0, 7.0, 15.0, 17.0, 12.0, 15.0, 30.0, 30.0, 35.0, 37.0, 35.0, 41.0, 49.0, 43.0, 40.0, 46.0, 50.0, 43.0, 52.0, 45.0, 41.0, 37.0, 47.0, 41.0, 32.0, 28.0, 20.0, 13.0, 18.0, 19.0, 9.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-409.6883850097656, -398.821044921875, -387.9537353515625, -377.0863952636719, -366.21905517578125, -355.35174560546875, -344.4844055175781, -333.6170654296875, -322.749755859375, -311.8824157714844, -301.0151062011719, -290.14776611328125, -279.2804260253906, -268.4130859375, -257.5457763671875, -246.67843627929688, -235.81109619140625, -224.9437713623047, -214.07643127441406, -203.2091064453125, -192.34176635742188, -181.4744415283203, -170.60711669921875, -159.73977661132812, -148.87245178222656, -138.005126953125, -127.13778686523438, -116.27046203613281, -105.40312957763672, -94.53579711914062, -83.66847229003906, -72.80113983154297, -61.93377685546875, -51.066444396972656, -40.19911575317383, -29.331787109375, -18.464454650878906, -7.5971221923828125, 3.27020263671875, 14.137535095214844, 25.004867553710938, 35.87220001220703, 46.73952865600586, 57.60685729980469, 68.47418975830078, 79.34152221679688, 90.20884704589844, 101.07617950439453, 111.94351196289062, 122.81084442138672, 133.6781768798828, 144.54550170898438, 155.412841796875, 166.28016662597656, 177.14749145507812, 188.01483154296875, 198.8821563720703, 209.74948120117188, 220.6168212890625, 231.48414611816406, 242.35147094726562, 253.21881103515625, 264.08612060546875, 274.9534606933594, 285.82080078125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 9.0, 3.0, 12.0, 11.0, 13.0, 23.0, 29.0, 25.0, 39.0, 70.0, 78.0, 130.0, 196.0, 316.0, 512.0, 925.0, 1889.0, 3750.0, 8413.0, 20089.0, 52341.0, 148511.0, 373817.0, 278684.0, 97312.0, 35154.0, 14009.0, 6062.0, 2714.0, 1389.0, 698.0, 402.0, 296.0, 181.0, 124.0, 100.0, 50.0, 47.0, 40.0, 22.0, 15.0, 14.0, 11.0, 8.0, 4.0, 4.0, 5.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.75, -69.5625, -67.375, -65.1875, -63.0, -60.8125, -58.625, -56.4375, -54.25, -52.0625, -49.875, -47.6875, -45.5, -43.3125, -41.125, -38.9375, -36.75, -34.5625, -32.375, -30.1875, -28.0, -25.8125, -23.625, -21.4375, -19.25, -17.0625, -14.875, -12.6875, -10.5, -8.3125, -6.125, -3.9375, -1.75, 0.4375, 2.625, 4.8125, 7.0, 9.1875, 11.375, 13.5625, 15.75, 17.9375, 20.125, 22.3125, 24.5, 26.6875, 28.875, 31.0625, 33.25, 35.4375, 37.625, 39.8125, 42.0, 44.1875, 46.375, 48.5625, 50.75, 52.9375, 55.125, 57.3125, 59.5, 61.6875, 63.875, 66.0625, 68.25]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 7.0, 17.0, 15.0, 39.0, 29.0, 48.0, 60.0, 63.0, 74.0, 75.0, 75.0, 65.0, 83.0, 73.0, 45.0, 53.0, 36.0, 26.0, 22.0, 27.0, 21.0, 15.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.28125, -52.63134765625, -50.9814453125, -49.33154296875, -47.681640625, -46.03173828125, -44.3818359375, -42.73193359375, -41.08203125, -39.43212890625, -37.7822265625, -36.13232421875, -34.482421875, -32.83251953125, -31.1826171875, -29.53271484375, -27.8828125, -26.23291015625, -24.5830078125, -22.93310546875, -21.283203125, -19.63330078125, -17.9833984375, -16.33349609375, -14.68359375, -13.03369140625, -11.3837890625, -9.73388671875, -8.083984375, -6.43408203125, -4.7841796875, -3.13427734375, -1.484375, 0.16552734375, 1.8154296875, 3.46533203125, 5.115234375, 6.76513671875, 8.4150390625, 10.06494140625, 11.71484375, 13.36474609375, 15.0146484375, 16.66455078125, 18.314453125, 19.96435546875, 21.6142578125, 23.26416015625, 24.9140625, 26.56396484375, 28.2138671875, 29.86376953125, 31.513671875, 33.16357421875, 34.8134765625, 36.46337890625, 38.11328125, 39.76318359375, 41.4130859375, 43.06298828125, 44.712890625, 46.36279296875, 48.0126953125, 49.66259765625, 51.3125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 15.0, 13.0, 21.0, 34.0, 55.0, 86.0, 129.0, 239.0, 443.0, 899.0, 2372.0, 8759.0, 67491.0, 799276.0, 148815.0, 14216.0, 3275.0, 1171.0, 518.0, 272.0, 154.0, 94.0, 54.0, 38.0, 32.0, 21.0, 6.0, 9.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-224.375, -218.080078125, -211.78515625, -205.490234375, -199.1953125, -192.900390625, -186.60546875, -180.310546875, -174.015625, -167.720703125, -161.42578125, -155.130859375, -148.8359375, -142.541015625, -136.24609375, -129.951171875, -123.65625, -117.361328125, -111.06640625, -104.771484375, -98.4765625, -92.181640625, -85.88671875, -79.591796875, -73.296875, -67.001953125, -60.70703125, -54.412109375, -48.1171875, -41.822265625, -35.52734375, -29.232421875, -22.9375, -16.642578125, -10.34765625, -4.052734375, 2.2421875, 8.537109375, 14.83203125, 21.126953125, 27.421875, 33.716796875, 40.01171875, 46.306640625, 52.6015625, 58.896484375, 65.19140625, 71.486328125, 77.78125, 84.076171875, 90.37109375, 96.666015625, 102.9609375, 109.255859375, 115.55078125, 121.845703125, 128.140625, 134.435546875, 140.73046875, 147.025390625, 153.3203125, 159.615234375, 165.91015625, 172.205078125, 178.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 4.0, 7.0, 9.0, 14.0, 24.0, 18.0, 21.0, 38.0, 40.0, 39.0, 40.0, 65.0, 55.0, 60.0, 64.0, 60.0, 59.0, 47.0, 43.0, 64.0, 42.0, 46.0, 30.0, 22.0, 20.0, 18.0, 10.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.125, -185.3203125, -179.515625, -173.7109375, -167.90625, -162.1015625, -156.296875, -150.4921875, -144.6875, -138.8828125, -133.078125, -127.2734375, -121.46875, -115.6640625, -109.859375, -104.0546875, -98.25, -92.4453125, -86.640625, -80.8359375, -75.03125, -69.2265625, -63.421875, -57.6171875, -51.8125, -46.0078125, -40.203125, -34.3984375, -28.59375, -22.7890625, -16.984375, -11.1796875, -5.375, 0.4296875, 6.234375, 12.0390625, 17.84375, 23.6484375, 29.453125, 35.2578125, 41.0625, 46.8671875, 52.671875, 58.4765625, 64.28125, 70.0859375, 75.890625, 81.6953125, 87.5, 93.3046875, 99.109375, 104.9140625, 110.71875, 116.5234375, 122.328125, 128.1328125, 133.9375, 139.7421875, 145.546875, 151.3515625, 157.15625, 162.9609375, 168.765625, 174.5703125, 180.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 9.0, 15.0, 29.0, 39.0, 101.0, 202.0, 478.0, 1563.0, 8282.0, 174766.0, 831401.0, 27173.0, 3100.0, 840.0, 277.0, 137.0, 61.0, 32.0, 18.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.125, -72.26171875, -69.3984375, -66.53515625, -63.671875, -60.80859375, -57.9453125, -55.08203125, -52.21875, -49.35546875, -46.4921875, -43.62890625, -40.765625, -37.90234375, -35.0390625, -32.17578125, -29.3125, -26.44921875, -23.5859375, -20.72265625, -17.859375, -14.99609375, -12.1328125, -9.26953125, -6.40625, -3.54296875, -0.6796875, 2.18359375, 5.046875, 7.91015625, 10.7734375, 13.63671875, 16.5, 19.36328125, 22.2265625, 25.08984375, 27.953125, 30.81640625, 33.6796875, 36.54296875, 39.40625, 42.26953125, 45.1328125, 47.99609375, 50.859375, 53.72265625, 56.5859375, 59.44921875, 62.3125, 65.17578125, 68.0390625, 70.90234375, 73.765625, 76.62890625, 79.4921875, 82.35546875, 85.21875, 88.08203125, 90.9453125, 93.80859375, 96.671875, 99.53515625, 102.3984375, 105.26171875, 108.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 9.0, 14.0, 20.0, 10.0, 26.0, 28.0, 33.0, 64.0, 75.0, 106.0, 108.0, 85.0, 86.0, 61.0, 53.0, 50.0, 30.0, 25.0, 25.0, 12.0, 11.0, 11.0, 5.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008575439453125, -0.00830686092376709, -0.00803828239440918, -0.0077697038650512695, -0.007501125335693359, -0.007232546806335449, -0.006963968276977539, -0.006695389747619629, -0.006426811218261719, -0.006158232688903809, -0.0058896541595458984, -0.005621075630187988, -0.005352497100830078, -0.005083918571472168, -0.004815340042114258, -0.004546761512756348, -0.0042781829833984375, -0.004009604454040527, -0.003741025924682617, -0.003472447395324707, -0.003203868865966797, -0.0029352903366088867, -0.0026667118072509766, -0.0023981332778930664, -0.0021295547485351562, -0.001860976219177246, -0.001592397689819336, -0.0013238191604614258, -0.0010552406311035156, -0.0007866621017456055, -0.0005180835723876953, -0.00024950504302978516, 1.9073486328125e-05, 0.00028765201568603516, 0.0005562305450439453, 0.0008248090744018555, 0.0010933876037597656, 0.0013619661331176758, 0.001630544662475586, 0.001899123191833496, 0.0021677017211914062, 0.0024362802505493164, 0.0027048587799072266, 0.0029734373092651367, 0.003242015838623047, 0.003510594367980957, 0.003779172897338867, 0.004047751426696777, 0.0043163299560546875, 0.004584908485412598, 0.004853487014770508, 0.005122065544128418, 0.005390644073486328, 0.005659222602844238, 0.0059278011322021484, 0.006196379661560059, 0.006464958190917969, 0.006733536720275879, 0.007002115249633789, 0.007270693778991699, 0.007539272308349609, 0.0078078508377075195, 0.00807642936706543, 0.00834500789642334, 0.00861358642578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 12.0, 12.0, 15.0, 19.0, 31.0, 38.0, 60.0, 97.0, 171.0, 270.0, 512.0, 852.0, 1955.0, 4532.0, 14900.0, 101154.0, 783036.0, 116047.0, 15813.0, 4863.0, 1918.0, 944.0, 506.0, 312.0, 158.0, 90.0, 73.0, 41.0, 40.0, 23.0, 18.0, 7.0, 6.0, 7.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.125, -59.18603515625, -57.2470703125, -55.30810546875, -53.369140625, -51.43017578125, -49.4912109375, -47.55224609375, -45.61328125, -43.67431640625, -41.7353515625, -39.79638671875, -37.857421875, -35.91845703125, -33.9794921875, -32.04052734375, -30.1015625, -28.16259765625, -26.2236328125, -24.28466796875, -22.345703125, -20.40673828125, -18.4677734375, -16.52880859375, -14.58984375, -12.65087890625, -10.7119140625, -8.77294921875, -6.833984375, -4.89501953125, -2.9560546875, -1.01708984375, 0.921875, 2.86083984375, 4.7998046875, 6.73876953125, 8.677734375, 10.61669921875, 12.5556640625, 14.49462890625, 16.43359375, 18.37255859375, 20.3115234375, 22.25048828125, 24.189453125, 26.12841796875, 28.0673828125, 30.00634765625, 31.9453125, 33.88427734375, 35.8232421875, 37.76220703125, 39.701171875, 41.64013671875, 43.5791015625, 45.51806640625, 47.45703125, 49.39599609375, 51.3349609375, 53.27392578125, 55.212890625, 57.15185546875, 59.0908203125, 61.02978515625, 62.96875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 13.0, 18.0, 23.0, 34.0, 39.0, 65.0, 79.0, 84.0, 102.0, 126.0, 102.0, 100.0, 62.0, 36.0, 31.0, 24.0, 16.0, 7.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.181640625, -52.23828125, -50.294921875, -48.3515625, -46.408203125, -44.46484375, -42.521484375, -40.578125, -38.634765625, -36.69140625, -34.748046875, -32.8046875, -30.861328125, -28.91796875, -26.974609375, -25.03125, -23.087890625, -21.14453125, -19.201171875, -17.2578125, -15.314453125, -13.37109375, -11.427734375, -9.484375, -7.541015625, -5.59765625, -3.654296875, -1.7109375, 0.232421875, 2.17578125, 4.119140625, 6.0625, 8.005859375, 9.94921875, 11.892578125, 13.8359375, 15.779296875, 17.72265625, 19.666015625, 21.609375, 23.552734375, 25.49609375, 27.439453125, 29.3828125, 31.326171875, 33.26953125, 35.212890625, 37.15625, 39.099609375, 41.04296875, 42.986328125, 44.9296875, 46.873046875, 48.81640625, 50.759765625, 52.703125, 54.646484375, 56.58984375, 58.533203125, 60.4765625, 62.419921875, 64.36328125, 66.306640625, 68.25]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 5.0, 26.0, 60.0, 127.0, 204.0, 251.0, 165.0, 68.0, 34.0, 21.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1095.5286865234375, -1055.3272705078125, -1015.1258544921875, -974.9244384765625, -934.7230224609375, -894.5216064453125, -854.3201904296875, -814.1187744140625, -773.9173583984375, -733.7159423828125, -693.5145263671875, -653.3131103515625, -613.1116943359375, -572.9102783203125, -532.7088623046875, -492.5074768066406, -452.30609130859375, -412.10467529296875, -371.90325927734375, -331.70184326171875, -291.50042724609375, -251.2990264892578, -211.09762573242188, -170.89620971679688, -130.69479370117188, -90.49337768554688, -50.291969299316406, -10.090560913085938, 30.110855102539062, 70.31227111816406, 110.513671875, 150.715087890625, 190.91650390625, 231.117919921875, 271.3193359375, 311.520751953125, 351.72216796875, 391.923583984375, 432.1249694824219, 472.3263854980469, 512.52783203125, 552.729248046875, 592.9306640625, 633.132080078125, 673.33349609375, 713.534912109375, 753.736328125, 793.937744140625, 834.1390991210938, 874.3405151367188, 914.5419311523438, 954.7433471679688, 994.9447631835938, 1035.1461181640625, 1075.3475341796875, 1115.5489501953125, 1155.7503662109375, 1195.9517822265625, 1236.1531982421875, 1276.3546142578125, 1316.5560302734375, 1356.7574462890625, 1396.9588623046875, 1437.1602783203125, 1477.3616943359375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 2.0, 15.0, 14.0, 14.0, 22.0, 22.0, 25.0, 26.0, 46.0, 17.0, 29.0, 49.0, 42.0, 43.0, 58.0, 67.0, 78.0, 44.0, 55.0, 40.0, 42.0, 37.0, 34.0, 25.0, 30.0, 20.0, 18.0, 12.0, 17.0, 5.0, 9.0, 13.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-673.5874633789062, -652.2804565429688, -630.9734497070312, -609.66650390625, -588.3594970703125, -567.052490234375, -545.7454833984375, -524.4384765625, -503.1315002441406, -481.8244934082031, -460.51751708984375, -439.21051025390625, -417.90350341796875, -396.5965270996094, -375.2895202636719, -353.9825439453125, -332.675537109375, -311.3685302734375, -290.0615539550781, -268.7545471191406, -247.4475555419922, -226.14056396484375, -204.83355712890625, -183.5265655517578, -162.21957397460938, -140.91258239746094, -119.60558319091797, -98.298583984375, -76.99159240722656, -55.684600830078125, -34.377601623535156, -13.070602416992188, 8.23638916015625, 29.543384552001953, 50.850379943847656, 72.15737915039062, 93.46437072753906, 114.7713623046875, 136.078369140625, 157.38536071777344, 178.69235229492188, 199.9993438720703, 221.30633544921875, 242.61334228515625, 263.92034912109375, 285.2273254394531, 306.5343322753906, 327.84130859375, 349.1483154296875, 370.455322265625, 391.7622985839844, 413.0693054199219, 434.37628173828125, 455.68328857421875, 476.99029541015625, 498.29730224609375, 519.604248046875, 540.9112548828125, 562.21826171875, 583.5252075195312, 604.8322143554688, 626.1392211914062, 647.4462280273438, 668.7532348632812, 690.0602416992188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 19.0, 11.0, 25.0, 28.0, 40.0, 47.0, 77.0, 109.0, 213.0, 392.0, 842.0, 2333.0, 9306.0, 61095.0, 1785306.0, 2249464.0, 69632.0, 10738.0, 2668.0, 888.0, 372.0, 197.0, 134.0, 88.0, 57.0, 33.0, 35.0, 34.0, 22.0, 17.0, 16.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.0625, -95.763671875, -92.46484375, -89.166015625, -85.8671875, -82.568359375, -79.26953125, -75.970703125, -72.671875, -69.373046875, -66.07421875, -62.775390625, -59.4765625, -56.177734375, -52.87890625, -49.580078125, -46.28125, -42.982421875, -39.68359375, -36.384765625, -33.0859375, -29.787109375, -26.48828125, -23.189453125, -19.890625, -16.591796875, -13.29296875, -9.994140625, -6.6953125, -3.396484375, -0.09765625, 3.201171875, 6.5, 9.798828125, 13.09765625, 16.396484375, 19.6953125, 22.994140625, 26.29296875, 29.591796875, 32.890625, 36.189453125, 39.48828125, 42.787109375, 46.0859375, 49.384765625, 52.68359375, 55.982421875, 59.28125, 62.580078125, 65.87890625, 69.177734375, 72.4765625, 75.775390625, 79.07421875, 82.373046875, 85.671875, 88.970703125, 92.26953125, 95.568359375, 98.8671875, 102.166015625, 105.46484375, 108.763671875, 112.0625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 11.0, 16.0, 23.0, 31.0, 40.0, 57.0, 60.0, 77.0, 103.0, 100.0, 101.0, 83.0, 62.0, 60.0, 45.0, 37.0, 25.0, 23.0, 15.0, 14.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-78.6875, -76.8515625, -75.015625, -73.1796875, -71.34375, -69.5078125, -67.671875, -65.8359375, -64.0, -62.1640625, -60.328125, -58.4921875, -56.65625, -54.8203125, -52.984375, -51.1484375, -49.3125, -47.4765625, -45.640625, -43.8046875, -41.96875, -40.1328125, -38.296875, -36.4609375, -34.625, -32.7890625, -30.953125, -29.1171875, -27.28125, -25.4453125, -23.609375, -21.7734375, -19.9375, -18.1015625, -16.265625, -14.4296875, -12.59375, -10.7578125, -8.921875, -7.0859375, -5.25, -3.4140625, -1.578125, 0.2578125, 2.09375, 3.9296875, 5.765625, 7.6015625, 9.4375, 11.2734375, 13.109375, 14.9453125, 16.78125, 18.6171875, 20.453125, 22.2890625, 24.125, 25.9609375, 27.796875, 29.6328125, 31.46875, 33.3046875, 35.140625, 36.9765625, 38.8125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 14.0, 20.0, 37.0, 57.0, 102.0, 172.0, 336.0, 753.0, 1925.0, 6151.0, 26757.0, 200115.0, 3445967.0, 455405.0, 43443.0, 8677.0, 2524.0, 936.0, 394.0, 184.0, 102.0, 77.0, 37.0, 23.0, 17.0, 18.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.375, -82.287109375, -79.19921875, -76.111328125, -73.0234375, -69.935546875, -66.84765625, -63.759765625, -60.671875, -57.583984375, -54.49609375, -51.408203125, -48.3203125, -45.232421875, -42.14453125, -39.056640625, -35.96875, -32.880859375, -29.79296875, -26.705078125, -23.6171875, -20.529296875, -17.44140625, -14.353515625, -11.265625, -8.177734375, -5.08984375, -2.001953125, 1.0859375, 4.173828125, 7.26171875, 10.349609375, 13.4375, 16.525390625, 19.61328125, 22.701171875, 25.7890625, 28.876953125, 31.96484375, 35.052734375, 38.140625, 41.228515625, 44.31640625, 47.404296875, 50.4921875, 53.580078125, 56.66796875, 59.755859375, 62.84375, 65.931640625, 69.01953125, 72.107421875, 75.1953125, 78.283203125, 81.37109375, 84.458984375, 87.546875, 90.634765625, 93.72265625, 96.810546875, 99.8984375, 102.986328125, 106.07421875, 109.162109375, 112.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 8.0, 10.0, 12.0, 16.0, 21.0, 25.0, 41.0, 55.0, 65.0, 100.0, 183.0, 267.0, 516.0, 768.0, 788.0, 497.0, 278.0, 124.0, 77.0, 63.0, 40.0, 32.0, 24.0, 13.0, 7.0, 12.0, 7.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.75, -94.8671875, -91.984375, -89.1015625, -86.21875, -83.3359375, -80.453125, -77.5703125, -74.6875, -71.8046875, -68.921875, -66.0390625, -63.15625, -60.2734375, -57.390625, -54.5078125, -51.625, -48.7421875, -45.859375, -42.9765625, -40.09375, -37.2109375, -34.328125, -31.4453125, -28.5625, -25.6796875, -22.796875, -19.9140625, -17.03125, -14.1484375, -11.265625, -8.3828125, -5.5, -2.6171875, 0.265625, 3.1484375, 6.03125, 8.9140625, 11.796875, 14.6796875, 17.5625, 20.4453125, 23.328125, 26.2109375, 29.09375, 31.9765625, 34.859375, 37.7421875, 40.625, 43.5078125, 46.390625, 49.2734375, 52.15625, 55.0390625, 57.921875, 60.8046875, 63.6875, 66.5703125, 69.453125, 72.3359375, 75.21875, 78.1015625, 80.984375, 83.8671875, 86.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 7.0, 8.0, 5.0, 22.0, 88.0, 265.0, 350.0, 180.0, 50.0, 14.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2868.54833984375, -2815.765869140625, -2762.9833984375, -2710.20068359375, -2657.418212890625, -2604.6357421875, -2551.853271484375, -2499.07080078125, -2446.2880859375, -2393.505615234375, -2340.72314453125, -2287.9404296875, -2235.157958984375, -2182.37548828125, -2129.593017578125, -2076.810546875, -2024.0279541015625, -1971.2454833984375, -1918.462890625, -1865.680419921875, -1812.8978271484375, -1760.1153564453125, -1707.332763671875, -1654.55029296875, -1601.767822265625, -1548.9853515625, -1496.2027587890625, -1443.4202880859375, -1390.6376953125, -1337.855224609375, -1285.07275390625, -1232.2901611328125, -1179.507568359375, -1126.72509765625, -1073.9425048828125, -1021.1600341796875, -968.37744140625, -915.594970703125, -862.8124389648438, -810.0299072265625, -757.247314453125, -704.4647827148438, -651.6822509765625, -598.8997802734375, -546.1171875, -493.3346862792969, -440.55218505859375, -387.7696533203125, -334.98712158203125, -282.20458984375, -229.4220733642578, -176.63955688476562, -123.85702514648438, -71.07449340820312, -18.2919921875, 34.49053955078125, 87.2730712890625, 140.05560302734375, 192.83811950683594, 245.62063598632812, 298.4031677246094, 351.1856994628906, 403.96820068359375, 456.750732421875, 509.53326416015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 4.0, 7.0, 15.0, 21.0, 15.0, 16.0, 27.0, 25.0, 26.0, 37.0, 36.0, 43.0, 55.0, 41.0, 52.0, 54.0, 55.0, 45.0, 58.0, 45.0, 41.0, 45.0, 35.0, 27.0, 16.0, 26.0, 20.0, 18.0, 12.0, 10.0, 8.0, 10.0, 10.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-407.34918212890625, -394.2499084472656, -381.150634765625, -368.0513610839844, -354.95208740234375, -341.852783203125, -328.7535095214844, -315.65423583984375, -302.5549621582031, -289.4556884765625, -276.3564147949219, -263.25714111328125, -250.15785217285156, -237.05857849121094, -223.95928955078125, -210.86001586914062, -197.7607421875, -184.66146850585938, -171.56219482421875, -158.46290588378906, -145.36363220214844, -132.2643585205078, -119.16507720947266, -106.0657958984375, -92.96652221679688, -79.86724853515625, -66.7679672241211, -53.6686897277832, -40.56941223144531, -27.470138549804688, -14.370857238769531, -1.271575927734375, 11.82769775390625, 24.92697525024414, 38.02625274658203, 51.12553024291992, 64.22480773925781, 77.32408142089844, 90.4233627319336, 103.52264404296875, 116.62191772460938, 129.72119140625, 142.82046508789062, 155.9197540283203, 169.01902770996094, 182.11830139160156, 195.21759033203125, 208.31686401367188, 221.4161376953125, 234.51541137695312, 247.61468505859375, 260.7139587402344, 273.813232421875, 286.91253662109375, 300.0118103027344, 313.111083984375, 326.2103576660156, 339.30963134765625, 352.4089050292969, 365.5081787109375, 378.60748291015625, 391.70672607421875, 404.8060302734375, 417.9053039550781, 431.00457763671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 7.0, 6.0, 13.0, 21.0, 26.0, 41.0, 43.0, 67.0, 114.0, 206.0, 280.0, 563.0, 1088.0, 2389.0, 7048.0, 25335.0, 98292.0, 372347.0, 393738.0, 107093.0, 27172.0, 7500.0, 2647.0, 1016.0, 607.0, 313.0, 191.0, 106.0, 98.0, 53.0, 34.0, 31.0, 20.0, 10.0, 8.0, 11.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.3125, -91.45703125, -88.6015625, -85.74609375, -82.890625, -80.03515625, -77.1796875, -74.32421875, -71.46875, -68.61328125, -65.7578125, -62.90234375, -60.046875, -57.19140625, -54.3359375, -51.48046875, -48.625, -45.76953125, -42.9140625, -40.05859375, -37.203125, -34.34765625, -31.4921875, -28.63671875, -25.78125, -22.92578125, -20.0703125, -17.21484375, -14.359375, -11.50390625, -8.6484375, -5.79296875, -2.9375, -0.08203125, 2.7734375, 5.62890625, 8.484375, 11.33984375, 14.1953125, 17.05078125, 19.90625, 22.76171875, 25.6171875, 28.47265625, 31.328125, 34.18359375, 37.0390625, 39.89453125, 42.75, 45.60546875, 48.4609375, 51.31640625, 54.171875, 57.02734375, 59.8828125, 62.73828125, 65.59375, 68.44921875, 71.3046875, 74.16015625, 77.015625, 79.87109375, 82.7265625, 85.58203125, 88.4375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 10.0, 14.0, 17.0, 30.0, 37.0, 43.0, 52.0, 69.0, 83.0, 92.0, 103.0, 96.0, 79.0, 66.0, 61.0, 48.0, 33.0, 21.0, 18.0, 15.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-78.25, -76.4560546875, -74.662109375, -72.8681640625, -71.07421875, -69.2802734375, -67.486328125, -65.6923828125, -63.8984375, -62.1044921875, -60.310546875, -58.5166015625, -56.72265625, -54.9287109375, -53.134765625, -51.3408203125, -49.546875, -47.7529296875, -45.958984375, -44.1650390625, -42.37109375, -40.5771484375, -38.783203125, -36.9892578125, -35.1953125, -33.4013671875, -31.607421875, -29.8134765625, -28.01953125, -26.2255859375, -24.431640625, -22.6376953125, -20.84375, -19.0498046875, -17.255859375, -15.4619140625, -13.66796875, -11.8740234375, -10.080078125, -8.2861328125, -6.4921875, -4.6982421875, -2.904296875, -1.1103515625, 0.68359375, 2.4775390625, 4.271484375, 6.0654296875, 7.859375, 9.6533203125, 11.447265625, 13.2412109375, 15.03515625, 16.8291015625, 18.623046875, 20.4169921875, 22.2109375, 24.0048828125, 25.798828125, 27.5927734375, 29.38671875, 31.1806640625, 32.974609375, 34.7685546875, 36.5625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 4.0, 11.0, 6.0, 16.0, 23.0, 37.0, 41.0, 71.0, 123.0, 169.0, 262.0, 448.0, 695.0, 1273.0, 2694.0, 8189.0, 55712.0, 741081.0, 210282.0, 18602.0, 4527.0, 1806.0, 932.0, 566.0, 361.0, 198.0, 135.0, 85.0, 66.0, 32.0, 38.0, 11.0, 14.0, 8.0, 12.0, 4.0, 10.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-146.0, -140.921875, -135.84375, -130.765625, -125.6875, -120.609375, -115.53125, -110.453125, -105.375, -100.296875, -95.21875, -90.140625, -85.0625, -79.984375, -74.90625, -69.828125, -64.75, -59.671875, -54.59375, -49.515625, -44.4375, -39.359375, -34.28125, -29.203125, -24.125, -19.046875, -13.96875, -8.890625, -3.8125, 1.265625, 6.34375, 11.421875, 16.5, 21.578125, 26.65625, 31.734375, 36.8125, 41.890625, 46.96875, 52.046875, 57.125, 62.203125, 67.28125, 72.359375, 77.4375, 82.515625, 87.59375, 92.671875, 97.75, 102.828125, 107.90625, 112.984375, 118.0625, 123.140625, 128.21875, 133.296875, 138.375, 143.453125, 148.53125, 153.609375, 158.6875, 163.765625, 168.84375, 173.921875, 179.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 10.0, 4.0, 9.0, 13.0, 8.0, 16.0, 23.0, 30.0, 33.0, 34.0, 43.0, 56.0, 67.0, 54.0, 60.0, 63.0, 54.0, 57.0, 51.0, 55.0, 48.0, 33.0, 31.0, 27.0, 20.0, 13.0, 20.0, 12.0, 14.0, 9.0, 6.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-162.625, -157.50390625, -152.3828125, -147.26171875, -142.140625, -137.01953125, -131.8984375, -126.77734375, -121.65625, -116.53515625, -111.4140625, -106.29296875, -101.171875, -96.05078125, -90.9296875, -85.80859375, -80.6875, -75.56640625, -70.4453125, -65.32421875, -60.203125, -55.08203125, -49.9609375, -44.83984375, -39.71875, -34.59765625, -29.4765625, -24.35546875, -19.234375, -14.11328125, -8.9921875, -3.87109375, 1.25, 6.37109375, 11.4921875, 16.61328125, 21.734375, 26.85546875, 31.9765625, 37.09765625, 42.21875, 47.33984375, 52.4609375, 57.58203125, 62.703125, 67.82421875, 72.9453125, 78.06640625, 83.1875, 88.30859375, 93.4296875, 98.55078125, 103.671875, 108.79296875, 113.9140625, 119.03515625, 124.15625, 129.27734375, 134.3984375, 139.51953125, 144.640625, 149.76171875, 154.8828125, 160.00390625, 165.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 7.0, 10.0, 16.0, 14.0, 34.0, 28.0, 30.0, 41.0, 70.0, 90.0, 156.0, 254.0, 713.0, 2500.0, 16453.0, 830380.0, 186802.0, 8211.0, 1601.0, 430.0, 183.0, 150.0, 93.0, 62.0, 37.0, 25.0, 22.0, 20.0, 12.0, 13.0, 17.0, 10.0, 11.0, 4.0, 10.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-86.6875, -83.96484375, -81.2421875, -78.51953125, -75.796875, -73.07421875, -70.3515625, -67.62890625, -64.90625, -62.18359375, -59.4609375, -56.73828125, -54.015625, -51.29296875, -48.5703125, -45.84765625, -43.125, -40.40234375, -37.6796875, -34.95703125, -32.234375, -29.51171875, -26.7890625, -24.06640625, -21.34375, -18.62109375, -15.8984375, -13.17578125, -10.453125, -7.73046875, -5.0078125, -2.28515625, 0.4375, 3.16015625, 5.8828125, 8.60546875, 11.328125, 14.05078125, 16.7734375, 19.49609375, 22.21875, 24.94140625, 27.6640625, 30.38671875, 33.109375, 35.83203125, 38.5546875, 41.27734375, 44.0, 46.72265625, 49.4453125, 52.16796875, 54.890625, 57.61328125, 60.3359375, 63.05859375, 65.78125, 68.50390625, 71.2265625, 73.94921875, 76.671875, 79.39453125, 82.1171875, 84.83984375, 87.5625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 1.0, 8.0, 9.0, 10.0, 20.0, 19.0, 32.0, 41.0, 51.0, 73.0, 104.0, 158.0, 121.0, 99.0, 72.0, 41.0, 34.0, 26.0, 24.0, 11.0, 8.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01403045654296875, -0.013669848442077637, -0.013309240341186523, -0.01294863224029541, -0.012588024139404297, -0.012227416038513184, -0.01186680793762207, -0.011506199836730957, -0.011145591735839844, -0.01078498363494873, -0.010424375534057617, -0.010063767433166504, -0.00970315933227539, -0.009342551231384277, -0.008981943130493164, -0.00862133502960205, -0.008260726928710938, -0.007900118827819824, -0.007539510726928711, -0.007178902626037598, -0.006818294525146484, -0.006457686424255371, -0.006097078323364258, -0.0057364702224731445, -0.005375862121582031, -0.005015254020690918, -0.004654645919799805, -0.004294037818908691, -0.003933429718017578, -0.003572821617126465, -0.0032122135162353516, -0.0028516054153442383, -0.002490997314453125, -0.0021303892135620117, -0.0017697811126708984, -0.0014091730117797852, -0.0010485649108886719, -0.0006879568099975586, -0.0003273487091064453, 3.325939178466797e-05, 0.00039386749267578125, 0.0007544755935668945, 0.0011150836944580078, 0.001475691795349121, 0.0018362998962402344, 0.0021969079971313477, 0.002557516098022461, 0.0029181241989135742, 0.0032787322998046875, 0.0036393404006958008, 0.003999948501586914, 0.004360556602478027, 0.004721164703369141, 0.005081772804260254, 0.005442380905151367, 0.0058029890060424805, 0.006163597106933594, 0.006524205207824707, 0.00688481330871582, 0.007245421409606934, 0.007606029510498047, 0.00796663761138916, 0.008327245712280273, 0.008687853813171387, 0.0090484619140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 2.0, 13.0, 8.0, 14.0, 19.0, 28.0, 40.0, 84.0, 106.0, 224.0, 500.0, 1215.0, 4067.0, 23006.0, 929454.0, 79430.0, 7054.0, 1898.0, 665.0, 295.0, 145.0, 95.0, 57.0, 34.0, 30.0, 22.0, 11.0, 14.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.75, -87.5869140625, -84.423828125, -81.2607421875, -78.09765625, -74.9345703125, -71.771484375, -68.6083984375, -65.4453125, -62.2822265625, -59.119140625, -55.9560546875, -52.79296875, -49.6298828125, -46.466796875, -43.3037109375, -40.140625, -36.9775390625, -33.814453125, -30.6513671875, -27.48828125, -24.3251953125, -21.162109375, -17.9990234375, -14.8359375, -11.6728515625, -8.509765625, -5.3466796875, -2.18359375, 0.9794921875, 4.142578125, 7.3056640625, 10.46875, 13.6318359375, 16.794921875, 19.9580078125, 23.12109375, 26.2841796875, 29.447265625, 32.6103515625, 35.7734375, 38.9365234375, 42.099609375, 45.2626953125, 48.42578125, 51.5888671875, 54.751953125, 57.9150390625, 61.078125, 64.2412109375, 67.404296875, 70.5673828125, 73.73046875, 76.8935546875, 80.056640625, 83.2197265625, 86.3828125, 89.5458984375, 92.708984375, 95.8720703125, 99.03515625, 102.1982421875, 105.361328125, 108.5244140625, 111.6875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 7.0, 19.0, 49.0, 107.0, 223.0, 243.0, 182.0, 73.0, 38.0, 18.0, 12.0, 3.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5, -70.193359375, -66.88671875, -63.580078125, -60.2734375, -56.966796875, -53.66015625, -50.353515625, -47.046875, -43.740234375, -40.43359375, -37.126953125, -33.8203125, -30.513671875, -27.20703125, -23.900390625, -20.59375, -17.287109375, -13.98046875, -10.673828125, -7.3671875, -4.060546875, -0.75390625, 2.552734375, 5.859375, 9.166015625, 12.47265625, 15.779296875, 19.0859375, 22.392578125, 25.69921875, 29.005859375, 32.3125, 35.619140625, 38.92578125, 42.232421875, 45.5390625, 48.845703125, 52.15234375, 55.458984375, 58.765625, 62.072265625, 65.37890625, 68.685546875, 71.9921875, 75.298828125, 78.60546875, 81.912109375, 85.21875, 88.525390625, 91.83203125, 95.138671875, 98.4453125, 101.751953125, 105.05859375, 108.365234375, 111.671875, 114.978515625, 118.28515625, 121.591796875, 124.8984375, 128.205078125, 131.51171875, 134.818359375, 138.125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 18.0, 18.0, 49.0, 119.0, 190.0, 296.0, 155.0, 67.0, 37.0, 16.0, 11.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1079.8812255859375, -1046.6134033203125, -1013.345703125, -980.0779418945312, -946.8101806640625, -913.5423583984375, -880.2745971679688, -847.0068359375, -813.7390747070312, -780.4713134765625, -747.2035522460938, -713.935791015625, -680.66796875, -647.4002685546875, -614.1324462890625, -580.8646850585938, -547.596923828125, -514.3291625976562, -481.0614013671875, -447.7936096191406, -414.5258483886719, -381.2580871582031, -347.99029541015625, -314.7225341796875, -281.45477294921875, -248.18701171875, -214.9192352294922, -181.65145874023438, -148.38369750976562, -115.11593627929688, -81.84815979003906, -48.58038330078125, -15.312744140625, 17.95502471923828, 51.22279357910156, 84.49056243896484, 117.75833129882812, 151.02609252929688, 184.2938690185547, 217.5616455078125, 250.82940673828125, 284.09716796875, 317.36492919921875, 350.6327209472656, 383.9004821777344, 417.1682434082031, 450.43603515625, 483.70379638671875, 516.9715576171875, 550.2393188476562, 583.507080078125, 616.7748413085938, 650.0426025390625, 683.3104248046875, 716.5781860351562, 749.845947265625, 783.1137084960938, 816.3814697265625, 849.6492309570312, 882.9169921875, 916.184814453125, 949.4525146484375, 982.7203369140625, 1015.9880981445312, 1049.255859375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 16.0, 22.0, 29.0, 31.0, 38.0, 41.0, 52.0, 65.0, 85.0, 98.0, 112.0, 76.0, 46.0, 58.0, 65.0, 26.0, 23.0, 26.0, 20.0, 19.0, 11.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-686.9322509765625, -661.5528564453125, -636.1734619140625, -610.7941284179688, -585.4147338867188, -560.0353393554688, -534.6559448242188, -509.2765808105469, -483.897216796875, -458.517822265625, -433.1384582519531, -407.7590637207031, -382.37969970703125, -357.00030517578125, -331.62091064453125, -306.2415466308594, -280.8621520996094, -255.48277282714844, -230.1033935546875, -204.7239990234375, -179.34463500976562, -153.96524047851562, -128.5858612060547, -103.20648193359375, -77.82710266113281, -52.447723388671875, -27.068340301513672, -1.6889572143554688, 23.69042205810547, 49.069801330566406, 74.44918823242188, 99.82856750488281, 125.20794677734375, 150.5873260498047, 175.96670532226562, 201.34609985351562, 226.7254638671875, 252.1048583984375, 277.4842529296875, 302.8636169433594, 328.24298095703125, 353.62237548828125, 379.0017395019531, 404.3811340332031, 429.760498046875, 455.139892578125, 480.519287109375, 505.8986511230469, 531.278076171875, 556.657470703125, 582.036865234375, 607.4161987304688, 632.7955932617188, 658.1749877929688, 683.5543823242188, 708.9337158203125, 734.3131103515625, 759.6925048828125, 785.0718994140625, 810.4512329101562, 835.8306274414062, 861.2100219726562, 886.5894165039062, 911.96875, 937.34814453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 16.0, 19.0, 40.0, 48.0, 62.0, 126.0, 221.0, 491.0, 1612.0, 9873.0, 393830.0, 3739358.0, 43076.0, 3724.0, 838.0, 347.0, 225.0, 118.0, 85.0, 47.0, 37.0, 21.0, 17.0, 13.0, 3.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.5625, -106.3525390625, -102.142578125, -97.9326171875, -93.72265625, -89.5126953125, -85.302734375, -81.0927734375, -76.8828125, -72.6728515625, -68.462890625, -64.2529296875, -60.04296875, -55.8330078125, -51.623046875, -47.4130859375, -43.203125, -38.9931640625, -34.783203125, -30.5732421875, -26.36328125, -22.1533203125, -17.943359375, -13.7333984375, -9.5234375, -5.3134765625, -1.103515625, 3.1064453125, 7.31640625, 11.5263671875, 15.736328125, 19.9462890625, 24.15625, 28.3662109375, 32.576171875, 36.7861328125, 40.99609375, 45.2060546875, 49.416015625, 53.6259765625, 57.8359375, 62.0458984375, 66.255859375, 70.4658203125, 74.67578125, 78.8857421875, 83.095703125, 87.3056640625, 91.515625, 95.7255859375, 99.935546875, 104.1455078125, 108.35546875, 112.5654296875, 116.775390625, 120.9853515625, 125.1953125, 129.4052734375, 133.615234375, 137.8251953125, 142.03515625, 146.2451171875, 150.455078125, 154.6650390625, 158.875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 5.0, 5.0, 10.0, 17.0, 14.0, 11.0, 15.0, 21.0, 29.0, 41.0, 33.0, 28.0, 48.0, 60.0, 35.0, 53.0, 56.0, 58.0, 29.0, 52.0, 43.0, 45.0, 53.0, 37.0, 26.0, 36.0, 31.0, 19.0, 24.0, 17.0, 13.0, 9.0, 6.0, 8.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.021240234375, -24.99560546875, -23.969970703125, -22.9443359375, -21.918701171875, -20.89306640625, -19.867431640625, -18.841796875, -17.816162109375, -16.79052734375, -15.764892578125, -14.7392578125, -13.713623046875, -12.68798828125, -11.662353515625, -10.63671875, -9.611083984375, -8.58544921875, -7.559814453125, -6.5341796875, -5.508544921875, -4.48291015625, -3.457275390625, -2.431640625, -1.406005859375, -0.38037109375, 0.645263671875, 1.6708984375, 2.696533203125, 3.72216796875, 4.747802734375, 5.7734375, 6.799072265625, 7.82470703125, 8.850341796875, 9.8759765625, 10.901611328125, 11.92724609375, 12.952880859375, 13.978515625, 15.004150390625, 16.02978515625, 17.055419921875, 18.0810546875, 19.106689453125, 20.13232421875, 21.157958984375, 22.18359375, 23.209228515625, 24.23486328125, 25.260498046875, 26.2861328125, 27.311767578125, 28.33740234375, 29.363037109375, 30.388671875, 31.414306640625, 32.43994140625, 33.465576171875, 34.4912109375, 35.516845703125, 36.54248046875, 37.568115234375, 38.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 15.0, 17.0, 23.0, 34.0, 58.0, 106.0, 214.0, 445.0, 1173.0, 3358.0, 12758.0, 77189.0, 1986288.0, 2010719.0, 80964.0, 14048.0, 4073.0, 1461.0, 666.0, 322.0, 136.0, 76.0, 51.0, 35.0, 10.0, 16.0, 10.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.6875, -82.041015625, -79.39453125, -76.748046875, -74.1015625, -71.455078125, -68.80859375, -66.162109375, -63.515625, -60.869140625, -58.22265625, -55.576171875, -52.9296875, -50.283203125, -47.63671875, -44.990234375, -42.34375, -39.697265625, -37.05078125, -34.404296875, -31.7578125, -29.111328125, -26.46484375, -23.818359375, -21.171875, -18.525390625, -15.87890625, -13.232421875, -10.5859375, -7.939453125, -5.29296875, -2.646484375, 0.0, 2.646484375, 5.29296875, 7.939453125, 10.5859375, 13.232421875, 15.87890625, 18.525390625, 21.171875, 23.818359375, 26.46484375, 29.111328125, 31.7578125, 34.404296875, 37.05078125, 39.697265625, 42.34375, 44.990234375, 47.63671875, 50.283203125, 52.9296875, 55.576171875, 58.22265625, 60.869140625, 63.515625, 66.162109375, 68.80859375, 71.455078125, 74.1015625, 76.748046875, 79.39453125, 82.041015625, 84.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 18.0, 22.0, 29.0, 47.0, 78.0, 118.0, 202.0, 340.0, 694.0, 877.0, 635.0, 386.0, 232.0, 132.0, 66.0, 39.0, 39.0, 27.0, 20.0, 12.0, 7.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.125, -66.515625, -63.90625, -61.296875, -58.6875, -56.078125, -53.46875, -50.859375, -48.25, -45.640625, -43.03125, -40.421875, -37.8125, -35.203125, -32.59375, -29.984375, -27.375, -24.765625, -22.15625, -19.546875, -16.9375, -14.328125, -11.71875, -9.109375, -6.5, -3.890625, -1.28125, 1.328125, 3.9375, 6.546875, 9.15625, 11.765625, 14.375, 16.984375, 19.59375, 22.203125, 24.8125, 27.421875, 30.03125, 32.640625, 35.25, 37.859375, 40.46875, 43.078125, 45.6875, 48.296875, 50.90625, 53.515625, 56.125, 58.734375, 61.34375, 63.953125, 66.5625, 69.171875, 71.78125, 74.390625, 77.0, 79.609375, 82.21875, 84.828125, 87.4375, 90.046875, 92.65625, 95.265625, 97.875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 3.0, 8.0, 15.0, 23.0, 57.0, 127.0, 224.0, 270.0, 156.0, 60.0, 25.0, 13.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-657.460205078125, -627.7137451171875, -597.9672241210938, -568.2207641601562, -538.4743041992188, -508.7278137207031, -478.9813232421875, -449.23486328125, -419.4883728027344, -389.74188232421875, -359.99542236328125, -330.2489318847656, -300.50244140625, -270.7559814453125, -241.00949096679688, -211.2630157470703, -181.51654052734375, -151.7700653076172, -122.0235824584961, -92.277099609375, -62.53062438964844, -32.784149169921875, -3.03765869140625, 26.708816528320312, 56.455291748046875, 86.20176696777344, 115.94824981689453, 145.69473266601562, 175.4412078857422, 205.18768310546875, 234.93417358398438, 264.6806640625, 294.4271240234375, 324.1736145019531, 353.9200744628906, 383.66656494140625, 413.41302490234375, 443.1595153808594, 472.906005859375, 502.6524658203125, 532.39892578125, 562.1453857421875, 591.8919067382812, 621.6383666992188, 651.3848266601562, 681.13134765625, 710.8778076171875, 740.624267578125, 770.3707885742188, 800.1172485351562, 829.86376953125, 859.6102294921875, 889.356689453125, 919.1031494140625, 948.8496704101562, 978.5961303710938, 1008.3426513671875, 1038.089111328125, 1067.8355712890625, 1097.58203125, 1127.32861328125, 1157.0750732421875, 1186.821533203125, 1216.5679931640625, 1246.314453125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 11.0, 11.0, 7.0, 14.0, 9.0, 15.0, 35.0, 22.0, 26.0, 48.0, 49.0, 55.0, 67.0, 63.0, 50.0, 53.0, 49.0, 57.0, 49.0, 38.0, 44.0, 39.0, 34.0, 28.0, 26.0, 23.0, 14.0, 11.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-426.2154541015625, -414.5389709472656, -402.86248779296875, -391.18597412109375, -379.5094909667969, -367.8330078125, -356.1565246582031, -344.48004150390625, -332.80352783203125, -321.1270446777344, -309.4505615234375, -297.7740478515625, -286.0975646972656, -274.42108154296875, -262.7445983886719, -251.06809997558594, -239.39161682128906, -227.7151336669922, -216.03863525390625, -204.36215209960938, -192.68565368652344, -181.00917053222656, -169.33267211914062, -157.65618896484375, -145.97970581054688, -134.30322265625, -122.62672424316406, -110.95024108886719, -99.27374267578125, -87.59725952148438, -75.92076873779297, -64.24427795410156, -52.567779541015625, -40.89128875732422, -29.214799880981445, -17.538311004638672, -5.861820220947266, 5.814670562744141, 17.49115753173828, 29.167648315429688, 40.844139099121094, 52.5206298828125, 64.1971206665039, 75.87361145019531, 87.55009460449219, 99.22659301757812, 110.903076171875, 122.5795669555664, 134.2560577392578, 145.9325408935547, 157.60903930664062, 169.2855224609375, 180.96202087402344, 192.6385040283203, 204.31500244140625, 215.99148559570312, 227.66796875, 239.34445190429688, 251.0209503173828, 262.69744873046875, 274.3739318847656, 286.0504150390625, 297.7268981933594, 309.40338134765625, 321.07989501953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 4.0, 8.0, 9.0, 25.0, 25.0, 31.0, 31.0, 63.0, 90.0, 127.0, 183.0, 313.0, 544.0, 1058.0, 2075.0, 4609.0, 11896.0, 34788.0, 117439.0, 402453.0, 334228.0, 92629.0, 28231.0, 9622.0, 3861.0, 1847.0, 954.0, 486.0, 309.0, 185.0, 108.0, 85.0, 50.0, 33.0, 40.0, 23.0, 18.0, 17.0, 10.0, 12.0, 9.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-74.1875, -71.8623046875, -69.537109375, -67.2119140625, -64.88671875, -62.5615234375, -60.236328125, -57.9111328125, -55.5859375, -53.2607421875, -50.935546875, -48.6103515625, -46.28515625, -43.9599609375, -41.634765625, -39.3095703125, -36.984375, -34.6591796875, -32.333984375, -30.0087890625, -27.68359375, -25.3583984375, -23.033203125, -20.7080078125, -18.3828125, -16.0576171875, -13.732421875, -11.4072265625, -9.08203125, -6.7568359375, -4.431640625, -2.1064453125, 0.21875, 2.5439453125, 4.869140625, 7.1943359375, 9.51953125, 11.8447265625, 14.169921875, 16.4951171875, 18.8203125, 21.1455078125, 23.470703125, 25.7958984375, 28.12109375, 30.4462890625, 32.771484375, 35.0966796875, 37.421875, 39.7470703125, 42.072265625, 44.3974609375, 46.72265625, 49.0478515625, 51.373046875, 53.6982421875, 56.0234375, 58.3486328125, 60.673828125, 62.9990234375, 65.32421875, 67.6494140625, 69.974609375, 72.2998046875, 74.625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 6.0, 7.0, 7.0, 13.0, 14.0, 14.0, 23.0, 24.0, 24.0, 27.0, 41.0, 43.0, 52.0, 51.0, 58.0, 51.0, 56.0, 41.0, 39.0, 55.0, 44.0, 48.0, 40.0, 27.0, 41.0, 33.0, 23.0, 20.0, 19.0, 19.0, 6.0, 9.0, 11.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.109375, -29.073974609375, -28.03857421875, -27.003173828125, -25.9677734375, -24.932373046875, -23.89697265625, -22.861572265625, -21.826171875, -20.790771484375, -19.75537109375, -18.719970703125, -17.6845703125, -16.649169921875, -15.61376953125, -14.578369140625, -13.54296875, -12.507568359375, -11.47216796875, -10.436767578125, -9.4013671875, -8.365966796875, -7.33056640625, -6.295166015625, -5.259765625, -4.224365234375, -3.18896484375, -2.153564453125, -1.1181640625, -0.082763671875, 0.95263671875, 1.988037109375, 3.0234375, 4.058837890625, 5.09423828125, 6.129638671875, 7.1650390625, 8.200439453125, 9.23583984375, 10.271240234375, 11.306640625, 12.342041015625, 13.37744140625, 14.412841796875, 15.4482421875, 16.483642578125, 17.51904296875, 18.554443359375, 19.58984375, 20.625244140625, 21.66064453125, 22.696044921875, 23.7314453125, 24.766845703125, 25.80224609375, 26.837646484375, 27.873046875, 28.908447265625, 29.94384765625, 30.979248046875, 32.0146484375, 33.050048828125, 34.08544921875, 35.120849609375, 36.15625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 15.0, 17.0, 18.0, 30.0, 60.0, 93.0, 150.0, 237.0, 406.0, 777.0, 1676.0, 5004.0, 35318.0, 794701.0, 191909.0, 12793.0, 2882.0, 1129.0, 530.0, 307.0, 181.0, 103.0, 63.0, 47.0, 32.0, 21.0, 8.0, 12.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-243.625, -237.5, -231.375, -225.25, -219.125, -213.0, -206.875, -200.75, -194.625, -188.5, -182.375, -176.25, -170.125, -164.0, -157.875, -151.75, -145.625, -139.5, -133.375, -127.25, -121.125, -115.0, -108.875, -102.75, -96.625, -90.5, -84.375, -78.25, -72.125, -66.0, -59.875, -53.75, -47.625, -41.5, -35.375, -29.25, -23.125, -17.0, -10.875, -4.75, 1.375, 7.5, 13.625, 19.75, 25.875, 32.0, 38.125, 44.25, 50.375, 56.5, 62.625, 68.75, 74.875, 81.0, 87.125, 93.25, 99.375, 105.5, 111.625, 117.75, 123.875, 130.0, 136.125, 142.25, 148.375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 12.0, 8.0, 13.0, 9.0, 16.0, 18.0, 21.0, 30.0, 30.0, 26.0, 24.0, 36.0, 42.0, 31.0, 48.0, 47.0, 57.0, 60.0, 30.0, 45.0, 53.0, 53.0, 37.0, 36.0, 30.0, 30.0, 31.0, 17.0, 16.0, 19.0, 14.0, 6.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.25, -109.62109375, -105.9921875, -102.36328125, -98.734375, -95.10546875, -91.4765625, -87.84765625, -84.21875, -80.58984375, -76.9609375, -73.33203125, -69.703125, -66.07421875, -62.4453125, -58.81640625, -55.1875, -51.55859375, -47.9296875, -44.30078125, -40.671875, -37.04296875, -33.4140625, -29.78515625, -26.15625, -22.52734375, -18.8984375, -15.26953125, -11.640625, -8.01171875, -4.3828125, -0.75390625, 2.875, 6.50390625, 10.1328125, 13.76171875, 17.390625, 21.01953125, 24.6484375, 28.27734375, 31.90625, 35.53515625, 39.1640625, 42.79296875, 46.421875, 50.05078125, 53.6796875, 57.30859375, 60.9375, 64.56640625, 68.1953125, 71.82421875, 75.453125, 79.08203125, 82.7109375, 86.33984375, 89.96875, 93.59765625, 97.2265625, 100.85546875, 104.484375, 108.11328125, 111.7421875, 115.37109375, 119.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 8.0, 5.0, 18.0, 17.0, 30.0, 37.0, 59.0, 85.0, 132.0, 217.0, 434.0, 1016.0, 3454.0, 20627.0, 663979.0, 337987.0, 15566.0, 2965.0, 889.0, 412.0, 207.0, 136.0, 83.0, 37.0, 44.0, 28.0, 25.0, 14.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-70.875, -68.90283203125, -66.9306640625, -64.95849609375, -62.986328125, -61.01416015625, -59.0419921875, -57.06982421875, -55.09765625, -53.12548828125, -51.1533203125, -49.18115234375, -47.208984375, -45.23681640625, -43.2646484375, -41.29248046875, -39.3203125, -37.34814453125, -35.3759765625, -33.40380859375, -31.431640625, -29.45947265625, -27.4873046875, -25.51513671875, -23.54296875, -21.57080078125, -19.5986328125, -17.62646484375, -15.654296875, -13.68212890625, -11.7099609375, -9.73779296875, -7.765625, -5.79345703125, -3.8212890625, -1.84912109375, 0.123046875, 2.09521484375, 4.0673828125, 6.03955078125, 8.01171875, 9.98388671875, 11.9560546875, 13.92822265625, 15.900390625, 17.87255859375, 19.8447265625, 21.81689453125, 23.7890625, 25.76123046875, 27.7333984375, 29.70556640625, 31.677734375, 33.64990234375, 35.6220703125, 37.59423828125, 39.56640625, 41.53857421875, 43.5107421875, 45.48291015625, 47.455078125, 49.42724609375, 51.3994140625, 53.37158203125, 55.34375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 7.0, 8.0, 7.0, 5.0, 12.0, 13.0, 16.0, 17.0, 38.0, 41.0, 67.0, 60.0, 93.0, 112.0, 106.0, 84.0, 69.0, 44.0, 36.0, 33.0, 24.0, 18.0, 13.0, 18.0, 9.0, 9.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00897216796875, -0.008716464042663574, -0.008460760116577148, -0.008205056190490723, -0.007949352264404297, -0.007693648338317871, -0.007437944412231445, -0.0071822404861450195, -0.006926536560058594, -0.006670832633972168, -0.006415128707885742, -0.006159424781799316, -0.005903720855712891, -0.005648016929626465, -0.005392313003540039, -0.005136609077453613, -0.0048809051513671875, -0.004625201225280762, -0.004369497299194336, -0.00411379337310791, -0.0038580894470214844, -0.0036023855209350586, -0.003346681594848633, -0.003090977668762207, -0.0028352737426757812, -0.0025795698165893555, -0.0023238658905029297, -0.002068161964416504, -0.0018124580383300781, -0.0015567541122436523, -0.0013010501861572266, -0.0010453462600708008, -0.000789642333984375, -0.0005339384078979492, -0.00027823448181152344, -2.2530555725097656e-05, 0.00023317337036132812, 0.0004888772964477539, 0.0007445812225341797, 0.0010002851486206055, 0.0012559890747070312, 0.001511693000793457, 0.0017673969268798828, 0.0020231008529663086, 0.0022788047790527344, 0.00253450870513916, 0.002790212631225586, 0.0030459165573120117, 0.0033016204833984375, 0.0035573244094848633, 0.003813028335571289, 0.004068732261657715, 0.004324436187744141, 0.004580140113830566, 0.004835844039916992, 0.005091547966003418, 0.005347251892089844, 0.0056029558181762695, 0.005858659744262695, 0.006114363670349121, 0.006370067596435547, 0.006625771522521973, 0.0068814754486083984, 0.007137179374694824, 0.00739288330078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 2.0, 14.0, 16.0, 15.0, 27.0, 46.0, 73.0, 89.0, 143.0, 256.0, 437.0, 974.0, 2334.0, 7015.0, 34978.0, 663351.0, 306183.0, 23443.0, 5341.0, 1953.0, 805.0, 397.0, 234.0, 124.0, 84.0, 56.0, 42.0, 32.0, 15.0, 13.0, 8.0, 16.0, 3.0, 3.0, 11.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.96875, -35.48388671875, -33.9990234375, -32.51416015625, -31.029296875, -29.54443359375, -28.0595703125, -26.57470703125, -25.08984375, -23.60498046875, -22.1201171875, -20.63525390625, -19.150390625, -17.66552734375, -16.1806640625, -14.69580078125, -13.2109375, -11.72607421875, -10.2412109375, -8.75634765625, -7.271484375, -5.78662109375, -4.3017578125, -2.81689453125, -1.33203125, 0.15283203125, 1.6376953125, 3.12255859375, 4.607421875, 6.09228515625, 7.5771484375, 9.06201171875, 10.546875, 12.03173828125, 13.5166015625, 15.00146484375, 16.486328125, 17.97119140625, 19.4560546875, 20.94091796875, 22.42578125, 23.91064453125, 25.3955078125, 26.88037109375, 28.365234375, 29.85009765625, 31.3349609375, 32.81982421875, 34.3046875, 35.78955078125, 37.2744140625, 38.75927734375, 40.244140625, 41.72900390625, 43.2138671875, 44.69873046875, 46.18359375, 47.66845703125, 49.1533203125, 50.63818359375, 52.123046875, 53.60791015625, 55.0927734375, 56.57763671875, 58.0625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 3.0, 11.0, 14.0, 18.0, 41.0, 57.0, 86.0, 131.0, 160.0, 149.0, 125.0, 69.0, 43.0, 25.0, 16.0, 8.0, 5.0, 6.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.3125, -51.6318359375, -49.951171875, -48.2705078125, -46.58984375, -44.9091796875, -43.228515625, -41.5478515625, -39.8671875, -38.1865234375, -36.505859375, -34.8251953125, -33.14453125, -31.4638671875, -29.783203125, -28.1025390625, -26.421875, -24.7412109375, -23.060546875, -21.3798828125, -19.69921875, -18.0185546875, -16.337890625, -14.6572265625, -12.9765625, -11.2958984375, -9.615234375, -7.9345703125, -6.25390625, -4.5732421875, -2.892578125, -1.2119140625, 0.46875, 2.1494140625, 3.830078125, 5.5107421875, 7.19140625, 8.8720703125, 10.552734375, 12.2333984375, 13.9140625, 15.5947265625, 17.275390625, 18.9560546875, 20.63671875, 22.3173828125, 23.998046875, 25.6787109375, 27.359375, 29.0400390625, 30.720703125, 32.4013671875, 34.08203125, 35.7626953125, 37.443359375, 39.1240234375, 40.8046875, 42.4853515625, 44.166015625, 45.8466796875, 47.52734375, 49.2080078125, 50.888671875, 52.5693359375, 54.25]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 10.0, 46.0, 185.0, 430.0, 209.0, 65.0, 19.0, 8.0, 5.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1132.900390625, -1082.6402587890625, -1032.380126953125, -982.1199340820312, -931.8598022460938, -881.5996704101562, -831.3394775390625, -781.079345703125, -730.8192138671875, -680.55908203125, -630.2989501953125, -580.0387573242188, -529.7786254882812, -479.51849365234375, -429.2583312988281, -378.9981689453125, -328.738037109375, -278.4779052734375, -228.21774291992188, -177.9575958251953, -127.69744873046875, -77.43730163574219, -27.177154541015625, 23.0830078125, 73.3431396484375, 123.60328674316406, 173.86343383789062, 224.1235809326172, 274.38372802734375, 324.64385986328125, 374.9040222167969, 425.1641845703125, 475.42431640625, 525.6844482421875, 575.944580078125, 626.2047729492188, 676.4649047851562, 726.7250366210938, 776.9852294921875, 827.245361328125, 877.5054931640625, 927.765625, 978.0257568359375, 1028.285888671875, 1078.546142578125, 1128.8062744140625, 1179.06640625, 1229.3265380859375, 1279.586669921875, 1329.8468017578125, 1380.10693359375, 1430.3670654296875, 1480.627197265625, 1530.887451171875, 1581.1475830078125, 1631.40771484375, 1681.6678466796875, 1731.927978515625, 1782.1881103515625, 1832.4482421875, 1882.70849609375, 1932.9686279296875, 1983.228759765625, 2033.4888916015625, 2083.7490234375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 9.0, 4.0, 10.0, 21.0, 16.0, 17.0, 25.0, 34.0, 24.0, 22.0, 31.0, 37.0, 34.0, 45.0, 59.0, 71.0, 69.0, 70.0, 40.0, 42.0, 41.0, 27.0, 31.0, 22.0, 35.0, 20.0, 15.0, 13.0, 14.0, 18.0, 14.0, 16.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-459.073486328125, -444.3462829589844, -429.61907958984375, -414.891845703125, -400.1646423339844, -385.43743896484375, -370.710205078125, -355.9830017089844, -341.25579833984375, -326.5285949707031, -311.8013916015625, -297.07415771484375, -282.3469543457031, -267.6197509765625, -252.8925323486328, -238.16531372070312, -223.4381103515625, -208.71090698242188, -193.9836883544922, -179.2564697265625, -164.52926635742188, -149.80206298828125, -135.07484436035156, -120.3476333618164, -105.62042236328125, -90.8932113647461, -76.16600036621094, -61.43878936767578, -46.711578369140625, -31.98436737060547, -17.257156372070312, -2.5299453735351562, 12.197265625, 26.924476623535156, 41.65168762207031, 56.37889862060547, 71.10610961914062, 85.83332061767578, 100.56053161621094, 115.2877426147461, 130.01495361328125, 144.74215698242188, 159.46937561035156, 174.19659423828125, 188.92379760742188, 203.6510009765625, 218.3782196044922, 233.10543823242188, 247.8326416015625, 262.5598449707031, 277.28704833984375, 292.0142822265625, 306.7414855957031, 321.46868896484375, 336.1959228515625, 350.9231262207031, 365.65032958984375, 380.3775329589844, 395.104736328125, 409.83197021484375, 424.5591735839844, 439.286376953125, 454.01361083984375, 468.7408142089844, 483.468017578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 11.0, 10.0, 15.0, 34.0, 60.0, 112.0, 235.0, 483.0, 1364.0, 7247.0, 135502.0, 3964843.0, 76888.0, 5287.0, 1259.0, 440.0, 199.0, 114.0, 68.0, 23.0, 29.0, 15.0, 11.0, 5.0, 9.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.9375, -100.0068359375, -96.076171875, -92.1455078125, -88.21484375, -84.2841796875, -80.353515625, -76.4228515625, -72.4921875, -68.5615234375, -64.630859375, -60.7001953125, -56.76953125, -52.8388671875, -48.908203125, -44.9775390625, -41.046875, -37.1162109375, -33.185546875, -29.2548828125, -25.32421875, -21.3935546875, -17.462890625, -13.5322265625, -9.6015625, -5.6708984375, -1.740234375, 2.1904296875, 6.12109375, 10.0517578125, 13.982421875, 17.9130859375, 21.84375, 25.7744140625, 29.705078125, 33.6357421875, 37.56640625, 41.4970703125, 45.427734375, 49.3583984375, 53.2890625, 57.2197265625, 61.150390625, 65.0810546875, 69.01171875, 72.9423828125, 76.873046875, 80.8037109375, 84.734375, 88.6650390625, 92.595703125, 96.5263671875, 100.45703125, 104.3876953125, 108.318359375, 112.2490234375, 116.1796875, 120.1103515625, 124.041015625, 127.9716796875, 131.90234375, 135.8330078125, 139.763671875, 143.6943359375, 147.625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 13.0, 7.0, 23.0, 24.0, 37.0, 35.0, 46.0, 47.0, 64.0, 51.0, 77.0, 70.0, 63.0, 66.0, 62.0, 52.0, 44.0, 45.0, 37.0, 31.0, 23.0, 16.0, 18.0, 12.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.3125, -32.041015625, -30.76953125, -29.498046875, -28.2265625, -26.955078125, -25.68359375, -24.412109375, -23.140625, -21.869140625, -20.59765625, -19.326171875, -18.0546875, -16.783203125, -15.51171875, -14.240234375, -12.96875, -11.697265625, -10.42578125, -9.154296875, -7.8828125, -6.611328125, -5.33984375, -4.068359375, -2.796875, -1.525390625, -0.25390625, 1.017578125, 2.2890625, 3.560546875, 4.83203125, 6.103515625, 7.375, 8.646484375, 9.91796875, 11.189453125, 12.4609375, 13.732421875, 15.00390625, 16.275390625, 17.546875, 18.818359375, 20.08984375, 21.361328125, 22.6328125, 23.904296875, 25.17578125, 26.447265625, 27.71875, 28.990234375, 30.26171875, 31.533203125, 32.8046875, 34.076171875, 35.34765625, 36.619140625, 37.890625, 39.162109375, 40.43359375, 41.705078125, 42.9765625, 44.248046875, 45.51953125, 46.791015625, 48.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 11.0, 13.0, 24.0, 32.0, 53.0, 94.0, 153.0, 320.0, 595.0, 1358.0, 3441.0, 11791.0, 86355.0, 3630226.0, 426624.0, 23876.0, 5138.0, 1907.0, 1008.0, 547.0, 296.0, 169.0, 86.0, 53.0, 38.0, 20.0, 10.0, 6.0, 12.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.125, -105.0107421875, -101.896484375, -98.7822265625, -95.66796875, -92.5537109375, -89.439453125, -86.3251953125, -83.2109375, -80.0966796875, -76.982421875, -73.8681640625, -70.75390625, -67.6396484375, -64.525390625, -61.4111328125, -58.296875, -55.1826171875, -52.068359375, -48.9541015625, -45.83984375, -42.7255859375, -39.611328125, -36.4970703125, -33.3828125, -30.2685546875, -27.154296875, -24.0400390625, -20.92578125, -17.8115234375, -14.697265625, -11.5830078125, -8.46875, -5.3544921875, -2.240234375, 0.8740234375, 3.98828125, 7.1025390625, 10.216796875, 13.3310546875, 16.4453125, 19.5595703125, 22.673828125, 25.7880859375, 28.90234375, 32.0166015625, 35.130859375, 38.2451171875, 41.359375, 44.4736328125, 47.587890625, 50.7021484375, 53.81640625, 56.9306640625, 60.044921875, 63.1591796875, 66.2734375, 69.3876953125, 72.501953125, 75.6162109375, 78.73046875, 81.8447265625, 84.958984375, 88.0732421875, 91.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 14.0, 14.0, 18.0, 53.0, 108.0, 226.0, 598.0, 1466.0, 965.0, 335.0, 131.0, 61.0, 22.0, 21.0, 11.0, 9.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.875, -93.904296875, -89.93359375, -85.962890625, -81.9921875, -78.021484375, -74.05078125, -70.080078125, -66.109375, -62.138671875, -58.16796875, -54.197265625, -50.2265625, -46.255859375, -42.28515625, -38.314453125, -34.34375, -30.373046875, -26.40234375, -22.431640625, -18.4609375, -14.490234375, -10.51953125, -6.548828125, -2.578125, 1.392578125, 5.36328125, 9.333984375, 13.3046875, 17.275390625, 21.24609375, 25.216796875, 29.1875, 33.158203125, 37.12890625, 41.099609375, 45.0703125, 49.041015625, 53.01171875, 56.982421875, 60.953125, 64.923828125, 68.89453125, 72.865234375, 76.8359375, 80.806640625, 84.77734375, 88.748046875, 92.71875, 96.689453125, 100.66015625, 104.630859375, 108.6015625, 112.572265625, 116.54296875, 120.513671875, 124.484375, 128.455078125, 132.42578125, 136.396484375, 140.3671875, 144.337890625, 148.30859375, 152.279296875, 156.25]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 8.0, 15.0, 33.0, 118.0, 266.0, 315.0, 147.0, 43.0, 23.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-700.1126708984375, -666.9328002929688, -633.7528686523438, -600.572998046875, -567.39306640625, -534.2131958007812, -501.0333251953125, -467.8534240722656, -434.67352294921875, -401.4936218261719, -368.313720703125, -335.13385009765625, -301.9539489746094, -268.7740478515625, -235.5941619873047, -202.41427612304688, -169.234375, -136.05447387695312, -102.87458801269531, -69.69469451904297, -36.514801025390625, -3.33489990234375, 29.844985961914062, 63.024871826171875, 96.20477294921875, 129.38467407226562, 162.56455993652344, 195.74444580078125, 228.92434692382812, 262.104248046875, 295.28411865234375, 328.4640197753906, 361.64404296875, 394.8239440917969, 428.00384521484375, 461.1837158203125, 494.3636169433594, 527.5435180664062, 560.723388671875, 593.9033203125, 627.0831909179688, 660.2630615234375, 693.4429931640625, 726.6228637695312, 759.802734375, 792.982666015625, 826.1625366210938, 859.3424072265625, 892.5223388671875, 925.7022094726562, 958.8821411132812, 992.06201171875, 1025.241943359375, 1058.421875, 1091.6016845703125, 1124.7816162109375, 1157.96142578125, 1191.141357421875, 1224.3211669921875, 1257.5010986328125, 1290.6810302734375, 1323.86083984375, 1357.040771484375, 1390.220703125, 1423.400634765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 14.0, 16.0, 20.0, 22.0, 26.0, 33.0, 55.0, 48.0, 55.0, 50.0, 65.0, 68.0, 68.0, 68.0, 66.0, 72.0, 47.0, 32.0, 39.0, 25.0, 27.0, 19.0, 13.0, 12.0, 7.0, 5.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-532.0860595703125, -518.8864135742188, -505.6867370605469, -492.4870910644531, -479.28741455078125, -466.0877685546875, -452.88812255859375, -439.6884765625, -426.4888000488281, -413.2891540527344, -400.0894775390625, -386.88983154296875, -373.690185546875, -360.4905090332031, -347.2908630371094, -334.0911865234375, -320.89154052734375, -307.69189453125, -294.4922180175781, -281.2925720214844, -268.0928955078125, -254.89324951171875, -241.693603515625, -228.4939422607422, -215.29428100585938, -202.09461975097656, -188.89495849609375, -175.6953125, -162.4956512451172, -149.29598999023438, -136.09634399414062, -122.89668273925781, -109.697021484375, -96.49736022949219, -83.2977066040039, -70.09805297851562, -56.89839172363281, -43.69873046875, -30.49907684326172, -17.299423217773438, -4.099761962890625, 9.099895477294922, 22.29955291748047, 35.499210357666016, 48.69886779785156, 61.898529052734375, 75.09818267822266, 88.29783630371094, 101.49749755859375, 114.69715881347656, 127.89681243896484, 141.09646606445312, 154.29612731933594, 167.49578857421875, 180.6954345703125, 193.8950958251953, 207.09475708007812, 220.29441833496094, 233.49407958984375, 246.6937255859375, 259.89337158203125, 273.0930480957031, 286.2926940917969, 299.49237060546875, 312.6920166015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 18.0, 24.0, 28.0, 45.0, 58.0, 81.0, 166.0, 254.0, 444.0, 866.0, 1882.0, 4664.0, 13965.0, 50298.0, 206771.0, 479600.0, 213899.0, 52109.0, 14473.0, 4902.0, 1928.0, 910.0, 447.0, 253.0, 133.0, 93.0, 58.0, 40.0, 28.0, 25.0, 20.0, 11.0, 7.0, 9.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.15625, -57.15185546875, -55.1474609375, -53.14306640625, -51.138671875, -49.13427734375, -47.1298828125, -45.12548828125, -43.12109375, -41.11669921875, -39.1123046875, -37.10791015625, -35.103515625, -33.09912109375, -31.0947265625, -29.09033203125, -27.0859375, -25.08154296875, -23.0771484375, -21.07275390625, -19.068359375, -17.06396484375, -15.0595703125, -13.05517578125, -11.05078125, -9.04638671875, -7.0419921875, -5.03759765625, -3.033203125, -1.02880859375, 0.9755859375, 2.97998046875, 4.984375, 6.98876953125, 8.9931640625, 10.99755859375, 13.001953125, 15.00634765625, 17.0107421875, 19.01513671875, 21.01953125, 23.02392578125, 25.0283203125, 27.03271484375, 29.037109375, 31.04150390625, 33.0458984375, 35.05029296875, 37.0546875, 39.05908203125, 41.0634765625, 43.06787109375, 45.072265625, 47.07666015625, 49.0810546875, 51.08544921875, 53.08984375, 55.09423828125, 57.0986328125, 59.10302734375, 61.107421875, 63.11181640625, 65.1162109375, 67.12060546875, 69.125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3.0, 9.0, 19.0, 20.0, 29.0, 36.0, 52.0, 60.0, 69.0, 62.0, 79.0, 77.0, 96.0, 92.0, 64.0, 67.0, 37.0, 36.0, 22.0, 17.0, 15.0, 14.0, 10.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.375, -40.84033203125, -39.3056640625, -37.77099609375, -36.236328125, -34.70166015625, -33.1669921875, -31.63232421875, -30.09765625, -28.56298828125, -27.0283203125, -25.49365234375, -23.958984375, -22.42431640625, -20.8896484375, -19.35498046875, -17.8203125, -16.28564453125, -14.7509765625, -13.21630859375, -11.681640625, -10.14697265625, -8.6123046875, -7.07763671875, -5.54296875, -4.00830078125, -2.4736328125, -0.93896484375, 0.595703125, 2.13037109375, 3.6650390625, 5.19970703125, 6.734375, 8.26904296875, 9.8037109375, 11.33837890625, 12.873046875, 14.40771484375, 15.9423828125, 17.47705078125, 19.01171875, 20.54638671875, 22.0810546875, 23.61572265625, 25.150390625, 26.68505859375, 28.2197265625, 29.75439453125, 31.2890625, 32.82373046875, 34.3583984375, 35.89306640625, 37.427734375, 38.96240234375, 40.4970703125, 42.03173828125, 43.56640625, 45.10107421875, 46.6357421875, 48.17041015625, 49.705078125, 51.23974609375, 52.7744140625, 54.30908203125, 55.84375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 10.0, 8.0, 6.0, 13.0, 13.0, 27.0, 26.0, 46.0, 59.0, 88.0, 133.0, 207.0, 349.0, 759.0, 1789.0, 5760.0, 23274.0, 130440.0, 653404.0, 187969.0, 32460.0, 7520.0, 2236.0, 855.0, 418.0, 211.0, 133.0, 95.0, 70.0, 49.0, 33.0, 29.0, 13.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-76.9375, -74.5029296875, -72.068359375, -69.6337890625, -67.19921875, -64.7646484375, -62.330078125, -59.8955078125, -57.4609375, -55.0263671875, -52.591796875, -50.1572265625, -47.72265625, -45.2880859375, -42.853515625, -40.4189453125, -37.984375, -35.5498046875, -33.115234375, -30.6806640625, -28.24609375, -25.8115234375, -23.376953125, -20.9423828125, -18.5078125, -16.0732421875, -13.638671875, -11.2041015625, -8.76953125, -6.3349609375, -3.900390625, -1.4658203125, 0.96875, 3.4033203125, 5.837890625, 8.2724609375, 10.70703125, 13.1416015625, 15.576171875, 18.0107421875, 20.4453125, 22.8798828125, 25.314453125, 27.7490234375, 30.18359375, 32.6181640625, 35.052734375, 37.4873046875, 39.921875, 42.3564453125, 44.791015625, 47.2255859375, 49.66015625, 52.0947265625, 54.529296875, 56.9638671875, 59.3984375, 61.8330078125, 64.267578125, 66.7021484375, 69.13671875, 71.5712890625, 74.005859375, 76.4404296875, 78.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 5.0, 6.0, 8.0, 15.0, 14.0, 14.0, 14.0, 17.0, 20.0, 24.0, 28.0, 28.0, 35.0, 39.0, 36.0, 39.0, 48.0, 32.0, 35.0, 53.0, 43.0, 42.0, 35.0, 43.0, 37.0, 37.0, 33.0, 24.0, 20.0, 18.0, 30.0, 16.0, 16.0, 11.0, 9.0, 12.0, 10.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0], "bins": [-93.25, -90.46875, -87.6875, -84.90625, -82.125, -79.34375, -76.5625, -73.78125, -71.0, -68.21875, -65.4375, -62.65625, -59.875, -57.09375, -54.3125, -51.53125, -48.75, -45.96875, -43.1875, -40.40625, -37.625, -34.84375, -32.0625, -29.28125, -26.5, -23.71875, -20.9375, -18.15625, -15.375, -12.59375, -9.8125, -7.03125, -4.25, -1.46875, 1.3125, 4.09375, 6.875, 9.65625, 12.4375, 15.21875, 18.0, 20.78125, 23.5625, 26.34375, 29.125, 31.90625, 34.6875, 37.46875, 40.25, 43.03125, 45.8125, 48.59375, 51.375, 54.15625, 56.9375, 59.71875, 62.5, 65.28125, 68.0625, 70.84375, 73.625, 76.40625, 79.1875, 81.96875, 84.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 12.0, 15.0, 23.0, 28.0, 29.0, 67.0, 122.0, 197.0, 345.0, 790.0, 1988.0, 5586.0, 18254.0, 71599.0, 322242.0, 515648.0, 80988.0, 20570.0, 6174.0, 2107.0, 858.0, 390.0, 193.0, 107.0, 68.0, 37.0, 34.0, 14.0, 15.0, 18.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.0625, -19.47314453125, -18.8837890625, -18.29443359375, -17.705078125, -17.11572265625, -16.5263671875, -15.93701171875, -15.34765625, -14.75830078125, -14.1689453125, -13.57958984375, -12.990234375, -12.40087890625, -11.8115234375, -11.22216796875, -10.6328125, -10.04345703125, -9.4541015625, -8.86474609375, -8.275390625, -7.68603515625, -7.0966796875, -6.50732421875, -5.91796875, -5.32861328125, -4.7392578125, -4.14990234375, -3.560546875, -2.97119140625, -2.3818359375, -1.79248046875, -1.203125, -0.61376953125, -0.0244140625, 0.56494140625, 1.154296875, 1.74365234375, 2.3330078125, 2.92236328125, 3.51171875, 4.10107421875, 4.6904296875, 5.27978515625, 5.869140625, 6.45849609375, 7.0478515625, 7.63720703125, 8.2265625, 8.81591796875, 9.4052734375, 9.99462890625, 10.583984375, 11.17333984375, 11.7626953125, 12.35205078125, 12.94140625, 13.53076171875, 14.1201171875, 14.70947265625, 15.298828125, 15.88818359375, 16.4775390625, 17.06689453125, 17.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 9.0, 8.0, 17.0, 17.0, 21.0, 22.0, 20.0, 31.0, 46.0, 63.0, 57.0, 57.0, 74.0, 73.0, 76.0, 80.0, 63.0, 45.0, 36.0, 37.0, 20.0, 19.0, 25.0, 13.0, 7.0, 9.0, 13.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0054931640625, -0.005337417125701904, -0.005181670188903809, -0.005025923252105713, -0.004870176315307617, -0.0047144293785095215, -0.004558682441711426, -0.00440293550491333, -0.004247188568115234, -0.004091441631317139, -0.003935694694519043, -0.0037799477577209473, -0.0036242008209228516, -0.003468453884124756, -0.00331270694732666, -0.0031569600105285645, -0.0030012130737304688, -0.002845466136932373, -0.0026897192001342773, -0.0025339722633361816, -0.002378225326538086, -0.0022224783897399902, -0.0020667314529418945, -0.0019109845161437988, -0.0017552375793457031, -0.0015994906425476074, -0.0014437437057495117, -0.001287996768951416, -0.0011322498321533203, -0.0009765028953552246, -0.0008207559585571289, -0.0006650090217590332, -0.0005092620849609375, -0.0003535151481628418, -0.0001977682113647461, -4.202127456665039e-05, 0.00011372566223144531, 0.000269472599029541, 0.0004252195358276367, 0.0005809664726257324, 0.0007367134094238281, 0.0008924603462219238, 0.0010482072830200195, 0.0012039542198181152, 0.001359701156616211, 0.0015154480934143066, 0.0016711950302124023, 0.001826941967010498, 0.0019826889038085938, 0.0021384358406066895, 0.002294182777404785, 0.002449929714202881, 0.0026056766510009766, 0.0027614235877990723, 0.002917170524597168, 0.0030729174613952637, 0.0032286643981933594, 0.003384411334991455, 0.0035401582717895508, 0.0036959052085876465, 0.003851652145385742, 0.004007399082183838, 0.004163146018981934, 0.004318892955780029, 0.004474639892578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 9.0, 16.0, 20.0, 33.0, 49.0, 80.0, 143.0, 287.0, 531.0, 1180.0, 2959.0, 9164.0, 37150.0, 195331.0, 644081.0, 122053.0, 24757.0, 6579.0, 2265.0, 900.0, 418.0, 204.0, 113.0, 81.0, 40.0, 34.0, 24.0, 19.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.0819091796875, -13.390380859375, -12.6988525390625, -12.00732421875, -11.3157958984375, -10.624267578125, -9.9327392578125, -9.2412109375, -8.5496826171875, -7.858154296875, -7.1666259765625, -6.47509765625, -5.7835693359375, -5.092041015625, -4.4005126953125, -3.708984375, -3.0174560546875, -2.325927734375, -1.6343994140625, -0.94287109375, -0.2513427734375, 0.440185546875, 1.1317138671875, 1.8232421875, 2.5147705078125, 3.206298828125, 3.8978271484375, 4.58935546875, 5.2808837890625, 5.972412109375, 6.6639404296875, 7.35546875, 8.0469970703125, 8.738525390625, 9.4300537109375, 10.12158203125, 10.8131103515625, 11.504638671875, 12.1961669921875, 12.8876953125, 13.5792236328125, 14.270751953125, 14.9622802734375, 15.65380859375, 16.3453369140625, 17.036865234375, 17.7283935546875, 18.419921875, 19.1114501953125, 19.802978515625, 20.4945068359375, 21.18603515625, 21.8775634765625, 22.569091796875, 23.2606201171875, 23.9521484375, 24.6436767578125, 25.335205078125, 26.0267333984375, 26.71826171875, 27.4097900390625, 28.101318359375, 28.7928466796875, 29.484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 11.0, 10.0, 18.0, 16.0, 24.0, 37.0, 42.0, 60.0, 85.0, 91.0, 85.0, 92.0, 82.0, 88.0, 63.0, 46.0, 36.0, 34.0, 13.0, 19.0, 15.0, 9.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.603759765625, -15.81689453125, -15.030029296875, -14.2431640625, -13.456298828125, -12.66943359375, -11.882568359375, -11.095703125, -10.308837890625, -9.52197265625, -8.735107421875, -7.9482421875, -7.161376953125, -6.37451171875, -5.587646484375, -4.80078125, -4.013916015625, -3.22705078125, -2.440185546875, -1.6533203125, -0.866455078125, -0.07958984375, 0.707275390625, 1.494140625, 2.281005859375, 3.06787109375, 3.854736328125, 4.6416015625, 5.428466796875, 6.21533203125, 7.002197265625, 7.7890625, 8.575927734375, 9.36279296875, 10.149658203125, 10.9365234375, 11.723388671875, 12.51025390625, 13.297119140625, 14.083984375, 14.870849609375, 15.65771484375, 16.444580078125, 17.2314453125, 18.018310546875, 18.80517578125, 19.592041015625, 20.37890625, 21.165771484375, 21.95263671875, 22.739501953125, 23.5263671875, 24.313232421875, 25.10009765625, 25.886962890625, 26.673828125, 27.460693359375, 28.24755859375, 29.034423828125, 29.8212890625, 30.608154296875, 31.39501953125, 32.181884765625, 32.96875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 18.0, 47.0, 186.0, 448.0, 197.0, 55.0, 20.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-725.009033203125, -687.73828125, -650.467529296875, -613.19677734375, -575.926025390625, -538.6552734375, -501.38458251953125, -464.11383056640625, -426.84307861328125, -389.57232666015625, -352.30157470703125, -315.0308532714844, -277.7601013183594, -240.48934936523438, -203.21861267089844, -165.9478759765625, -128.6771240234375, -91.40637969970703, -54.13563537597656, -16.864891052246094, 20.405853271484375, 57.676605224609375, 94.94734191894531, 132.21807861328125, 169.48883056640625, 206.75958251953125, 244.0303192138672, 281.3010559082031, 318.5718078613281, 355.8425598144531, 393.11328125, 430.384033203125, 467.6546630859375, 504.9254150390625, 542.1961669921875, 579.4669189453125, 616.7376708984375, 654.0084228515625, 691.2791137695312, 728.5498657226562, 765.8206176757812, 803.0913696289062, 840.3621215820312, 877.6328735351562, 914.903564453125, 952.17431640625, 989.445068359375, 1026.7158203125, 1063.986572265625, 1101.25732421875, 1138.528076171875, 1175.798828125, 1213.069580078125, 1250.34033203125, 1287.611083984375, 1324.8818359375, 1362.152587890625, 1399.42333984375, 1436.694091796875, 1473.96484375, 1511.235595703125, 1548.50634765625, 1585.777099609375, 1623.0478515625, 1660.3184814453125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 4.0, 8.0, 11.0, 18.0, 14.0, 14.0, 26.0, 16.0, 27.0, 26.0, 25.0, 33.0, 56.0, 45.0, 84.0, 98.0, 96.0, 59.0, 47.0, 23.0, 23.0, 43.0, 19.0, 28.0, 18.0, 22.0, 28.0, 20.0, 10.0, 5.0, 8.0, 6.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-422.7027893066406, -410.2447814941406, -397.7867736816406, -385.3287658691406, -372.8707580566406, -360.4127502441406, -347.9547424316406, -335.4967346191406, -323.0387268066406, -310.5807189941406, -298.1227111816406, -285.6647033691406, -273.2066955566406, -260.7486877441406, -248.29067993164062, -235.83267211914062, -223.3746795654297, -210.9166717529297, -198.4586639404297, -186.0006561279297, -173.5426483154297, -161.0846405029297, -148.62664794921875, -136.16864013671875, -123.71062469482422, -111.25261688232422, -98.79460906982422, -86.33660888671875, -73.87860107421875, -61.420589447021484, -48.96258544921875, -36.50457763671875, -24.04656982421875, -11.588562965393066, 0.8694438934326172, 13.327449798583984, 25.785457611083984, 38.243465423583984, 50.70146942138672, 63.15947723388672, 75.61748504638672, 88.07549285888672, 100.53350067138672, 112.99150085449219, 125.44950866699219, 137.9075164794922, 150.3655242919922, 162.8235321044922, 175.2815399169922, 187.7395477294922, 200.1975555419922, 212.6555633544922, 225.1135711669922, 237.5715789794922, 250.02957153320312, 262.4875793457031, 274.9455871582031, 287.4035949707031, 299.8616027832031, 312.3196105957031, 324.7776184082031, 337.2356262207031, 349.6936340332031, 362.1516418457031, 374.6096496582031]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 7.0, 17.0, 15.0, 27.0, 32.0, 66.0, 89.0, 186.0, 433.0, 1006.0, 3503.0, 19732.0, 482022.0, 3561855.0, 112405.0, 9255.0, 2134.0, 733.0, 311.0, 161.0, 104.0, 47.0, 31.0, 29.0, 13.0, 14.0, 16.0, 7.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.9375, -62.470703125, -60.00390625, -57.537109375, -55.0703125, -52.603515625, -50.13671875, -47.669921875, -45.203125, -42.736328125, -40.26953125, -37.802734375, -35.3359375, -32.869140625, -30.40234375, -27.935546875, -25.46875, -23.001953125, -20.53515625, -18.068359375, -15.6015625, -13.134765625, -10.66796875, -8.201171875, -5.734375, -3.267578125, -0.80078125, 1.666015625, 4.1328125, 6.599609375, 9.06640625, 11.533203125, 14.0, 16.466796875, 18.93359375, 21.400390625, 23.8671875, 26.333984375, 28.80078125, 31.267578125, 33.734375, 36.201171875, 38.66796875, 41.134765625, 43.6015625, 46.068359375, 48.53515625, 51.001953125, 53.46875, 55.935546875, 58.40234375, 60.869140625, 63.3359375, 65.802734375, 68.26953125, 70.736328125, 73.203125, 75.669921875, 78.13671875, 80.603515625, 83.0703125, 85.537109375, 88.00390625, 90.470703125, 92.9375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 8.0, 12.0, 15.0, 21.0, 24.0, 28.0, 35.0, 46.0, 41.0, 62.0, 67.0, 50.0, 67.0, 65.0, 73.0, 64.0, 67.0, 56.0, 50.0, 29.0, 30.0, 16.0, 13.0, 13.0, 12.0, 10.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.40625, -32.21142578125, -31.0166015625, -29.82177734375, -28.626953125, -27.43212890625, -26.2373046875, -25.04248046875, -23.84765625, -22.65283203125, -21.4580078125, -20.26318359375, -19.068359375, -17.87353515625, -16.6787109375, -15.48388671875, -14.2890625, -13.09423828125, -11.8994140625, -10.70458984375, -9.509765625, -8.31494140625, -7.1201171875, -5.92529296875, -4.73046875, -3.53564453125, -2.3408203125, -1.14599609375, 0.048828125, 1.24365234375, 2.4384765625, 3.63330078125, 4.828125, 6.02294921875, 7.2177734375, 8.41259765625, 9.607421875, 10.80224609375, 11.9970703125, 13.19189453125, 14.38671875, 15.58154296875, 16.7763671875, 17.97119140625, 19.166015625, 20.36083984375, 21.5556640625, 22.75048828125, 23.9453125, 25.14013671875, 26.3349609375, 27.52978515625, 28.724609375, 29.91943359375, 31.1142578125, 32.30908203125, 33.50390625, 34.69873046875, 35.8935546875, 37.08837890625, 38.283203125, 39.47802734375, 40.6728515625, 41.86767578125, 43.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 12.0, 8.0, 15.0, 16.0, 23.0, 35.0, 48.0, 96.0, 161.0, 370.0, 793.0, 2026.0, 5929.0, 22771.0, 148028.0, 2976504.0, 954356.0, 63681.0, 12875.0, 3908.0, 1398.0, 573.0, 253.0, 147.0, 67.0, 60.0, 33.0, 27.0, 18.0, 12.0, 13.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-59.0, -57.25439453125, -55.5087890625, -53.76318359375, -52.017578125, -50.27197265625, -48.5263671875, -46.78076171875, -45.03515625, -43.28955078125, -41.5439453125, -39.79833984375, -38.052734375, -36.30712890625, -34.5615234375, -32.81591796875, -31.0703125, -29.32470703125, -27.5791015625, -25.83349609375, -24.087890625, -22.34228515625, -20.5966796875, -18.85107421875, -17.10546875, -15.35986328125, -13.6142578125, -11.86865234375, -10.123046875, -8.37744140625, -6.6318359375, -4.88623046875, -3.140625, -1.39501953125, 0.3505859375, 2.09619140625, 3.841796875, 5.58740234375, 7.3330078125, 9.07861328125, 10.82421875, 12.56982421875, 14.3154296875, 16.06103515625, 17.806640625, 19.55224609375, 21.2978515625, 23.04345703125, 24.7890625, 26.53466796875, 28.2802734375, 30.02587890625, 31.771484375, 33.51708984375, 35.2626953125, 37.00830078125, 38.75390625, 40.49951171875, 42.2451171875, 43.99072265625, 45.736328125, 47.48193359375, 49.2275390625, 50.97314453125, 52.71875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 11.0, 12.0, 12.0, 13.0, 18.0, 28.0, 40.0, 55.0, 102.0, 140.0, 150.0, 243.0, 377.0, 567.0, 595.0, 505.0, 380.0, 217.0, 186.0, 107.0, 71.0, 61.0, 35.0, 32.0, 22.0, 18.0, 14.0, 6.0, 11.0, 10.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-45.71875, -44.34423828125, -42.9697265625, -41.59521484375, -40.220703125, -38.84619140625, -37.4716796875, -36.09716796875, -34.72265625, -33.34814453125, -31.9736328125, -30.59912109375, -29.224609375, -27.85009765625, -26.4755859375, -25.10107421875, -23.7265625, -22.35205078125, -20.9775390625, -19.60302734375, -18.228515625, -16.85400390625, -15.4794921875, -14.10498046875, -12.73046875, -11.35595703125, -9.9814453125, -8.60693359375, -7.232421875, -5.85791015625, -4.4833984375, -3.10888671875, -1.734375, -0.35986328125, 1.0146484375, 2.38916015625, 3.763671875, 5.13818359375, 6.5126953125, 7.88720703125, 9.26171875, 10.63623046875, 12.0107421875, 13.38525390625, 14.759765625, 16.13427734375, 17.5087890625, 18.88330078125, 20.2578125, 21.63232421875, 23.0068359375, 24.38134765625, 25.755859375, 27.13037109375, 28.5048828125, 29.87939453125, 31.25390625, 32.62841796875, 34.0029296875, 35.37744140625, 36.751953125, 38.12646484375, 39.5009765625, 40.87548828125, 42.25]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 14.0, 19.0, 44.0, 92.0, 153.0, 191.0, 184.0, 133.0, 84.0, 29.0, 16.0, 8.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-402.8458251953125, -385.7581787109375, -368.6705322265625, -351.5828857421875, -334.4952392578125, -317.4075927734375, -300.3199462890625, -283.2322998046875, -266.1446533203125, -249.0570068359375, -231.9693603515625, -214.8817138671875, -197.7940673828125, -180.7064208984375, -163.61878967285156, -146.53114318847656, -129.44351196289062, -112.35586547851562, -95.26821899414062, -78.18058013916016, -61.092933654785156, -44.005287170410156, -26.917648315429688, -9.830001831054688, 7.2576446533203125, 24.34528923034668, 41.43293380737305, 58.52057647705078, 75.60822296142578, 92.69586944580078, 109.78350830078125, 126.87115478515625, 143.95880126953125, 161.04644775390625, 178.13409423828125, 195.22174072265625, 212.30938720703125, 229.39703369140625, 246.4846649169922, 263.57232666015625, 280.65997314453125, 297.74761962890625, 314.83526611328125, 331.92291259765625, 349.01055908203125, 366.09820556640625, 383.18585205078125, 400.27349853515625, 417.3611145019531, 434.4487609863281, 451.5364074707031, 468.6240539550781, 485.7117004394531, 502.7993469238281, 519.886962890625, 536.974609375, 554.062255859375, 571.14990234375, 588.237548828125, 605.3251953125, 622.412841796875, 639.50048828125, 656.588134765625, 673.67578125, 690.763427734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 9.0, 8.0, 5.0, 10.0, 14.0, 18.0, 18.0, 32.0, 30.0, 31.0, 32.0, 32.0, 40.0, 42.0, 50.0, 32.0, 48.0, 39.0, 35.0, 52.0, 35.0, 37.0, 47.0, 29.0, 23.0, 49.0, 33.0, 27.0, 33.0, 27.0, 17.0, 18.0, 16.0, 11.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-288.9852600097656, -281.2853698730469, -273.58544921875, -265.88555908203125, -258.1856689453125, -250.48577880859375, -242.78587341308594, -235.08596801757812, -227.38607788085938, -219.68618774414062, -211.9862823486328, -204.286376953125, -196.58648681640625, -188.8865966796875, -181.1866912841797, -173.48678588867188, -165.78689575195312, -158.08700561523438, -150.38710021972656, -142.68719482421875, -134.9873046875, -127.28740692138672, -119.58750915527344, -111.88761138916016, -104.18771362304688, -96.4878158569336, -88.78791809082031, -81.08802032470703, -73.38812255859375, -65.68822479248047, -57.98832702636719, -50.288429260253906, -42.58854675292969, -34.888648986816406, -27.188751220703125, -19.488853454589844, -11.788955688476562, -4.089057922363281, 3.61083984375, 11.310737609863281, 19.010635375976562, 26.710533142089844, 34.410430908203125, 42.110328674316406, 49.81022644042969, 57.51012420654297, 65.21002197265625, 72.90991973876953, 80.60981750488281, 88.3097152709961, 96.00961303710938, 103.70951080322266, 111.40940856933594, 119.10930633544922, 126.8092041015625, 134.50909423828125, 142.20899963378906, 149.90890502929688, 157.60879516601562, 165.30868530273438, 173.0085906982422, 180.70849609375, 188.40838623046875, 196.1082763671875, 203.8081817626953]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 14.0, 14.0, 16.0, 31.0, 41.0, 78.0, 108.0, 193.0, 383.0, 799.0, 1842.0, 5409.0, 18370.0, 75790.0, 336399.0, 453142.0, 116650.0, 27262.0, 7418.0, 2547.0, 973.0, 469.0, 229.0, 133.0, 70.0, 71.0, 35.0, 19.0, 15.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-72.0, -70.0615234375, -68.123046875, -66.1845703125, -64.24609375, -62.3076171875, -60.369140625, -58.4306640625, -56.4921875, -54.5537109375, -52.615234375, -50.6767578125, -48.73828125, -46.7998046875, -44.861328125, -42.9228515625, -40.984375, -39.0458984375, -37.107421875, -35.1689453125, -33.23046875, -31.2919921875, -29.353515625, -27.4150390625, -25.4765625, -23.5380859375, -21.599609375, -19.6611328125, -17.72265625, -15.7841796875, -13.845703125, -11.9072265625, -9.96875, -8.0302734375, -6.091796875, -4.1533203125, -2.21484375, -0.2763671875, 1.662109375, 3.6005859375, 5.5390625, 7.4775390625, 9.416015625, 11.3544921875, 13.29296875, 15.2314453125, 17.169921875, 19.1083984375, 21.046875, 22.9853515625, 24.923828125, 26.8623046875, 28.80078125, 30.7392578125, 32.677734375, 34.6162109375, 36.5546875, 38.4931640625, 40.431640625, 42.3701171875, 44.30859375, 46.2470703125, 48.185546875, 50.1240234375, 52.0625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 11.0, 12.0, 15.0, 25.0, 30.0, 34.0, 35.0, 45.0, 56.0, 68.0, 60.0, 67.0, 63.0, 70.0, 54.0, 69.0, 48.0, 47.0, 38.0, 32.0, 23.0, 26.0, 17.0, 10.0, 13.0, 5.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28125, -33.07470703125, -31.8681640625, -30.66162109375, -29.455078125, -28.24853515625, -27.0419921875, -25.83544921875, -24.62890625, -23.42236328125, -22.2158203125, -21.00927734375, -19.802734375, -18.59619140625, -17.3896484375, -16.18310546875, -14.9765625, -13.77001953125, -12.5634765625, -11.35693359375, -10.150390625, -8.94384765625, -7.7373046875, -6.53076171875, -5.32421875, -4.11767578125, -2.9111328125, -1.70458984375, -0.498046875, 0.70849609375, 1.9150390625, 3.12158203125, 4.328125, 5.53466796875, 6.7412109375, 7.94775390625, 9.154296875, 10.36083984375, 11.5673828125, 12.77392578125, 13.98046875, 15.18701171875, 16.3935546875, 17.60009765625, 18.806640625, 20.01318359375, 21.2197265625, 22.42626953125, 23.6328125, 24.83935546875, 26.0458984375, 27.25244140625, 28.458984375, 29.66552734375, 30.8720703125, 32.07861328125, 33.28515625, 34.49169921875, 35.6982421875, 36.90478515625, 38.111328125, 39.31787109375, 40.5244140625, 41.73095703125, 42.9375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 12.0, 20.0, 33.0, 57.0, 78.0, 84.0, 186.0, 262.0, 461.0, 929.0, 2567.0, 12376.0, 139136.0, 812446.0, 68484.0, 7733.0, 1811.0, 783.0, 397.0, 252.0, 128.0, 101.0, 61.0, 39.0, 23.0, 16.0, 13.0, 16.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.1875, -111.8359375, -108.484375, -105.1328125, -101.78125, -98.4296875, -95.078125, -91.7265625, -88.375, -85.0234375, -81.671875, -78.3203125, -74.96875, -71.6171875, -68.265625, -64.9140625, -61.5625, -58.2109375, -54.859375, -51.5078125, -48.15625, -44.8046875, -41.453125, -38.1015625, -34.75, -31.3984375, -28.046875, -24.6953125, -21.34375, -17.9921875, -14.640625, -11.2890625, -7.9375, -4.5859375, -1.234375, 2.1171875, 5.46875, 8.8203125, 12.171875, 15.5234375, 18.875, 22.2265625, 25.578125, 28.9296875, 32.28125, 35.6328125, 38.984375, 42.3359375, 45.6875, 49.0390625, 52.390625, 55.7421875, 59.09375, 62.4453125, 65.796875, 69.1484375, 72.5, 75.8515625, 79.203125, 82.5546875, 85.90625, 89.2578125, 92.609375, 95.9609375, 99.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 5.0, 3.0, 12.0, 10.0, 12.0, 15.0, 22.0, 19.0, 21.0, 35.0, 41.0, 36.0, 46.0, 52.0, 60.0, 49.0, 59.0, 50.0, 64.0, 47.0, 52.0, 42.0, 42.0, 39.0, 36.0, 28.0, 18.0, 13.0, 20.0, 7.0, 6.0, 3.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.4375, -100.8896484375, -97.341796875, -93.7939453125, -90.24609375, -86.6982421875, -83.150390625, -79.6025390625, -76.0546875, -72.5068359375, -68.958984375, -65.4111328125, -61.86328125, -58.3154296875, -54.767578125, -51.2197265625, -47.671875, -44.1240234375, -40.576171875, -37.0283203125, -33.48046875, -29.9326171875, -26.384765625, -22.8369140625, -19.2890625, -15.7412109375, -12.193359375, -8.6455078125, -5.09765625, -1.5498046875, 1.998046875, 5.5458984375, 9.09375, 12.6416015625, 16.189453125, 19.7373046875, 23.28515625, 26.8330078125, 30.380859375, 33.9287109375, 37.4765625, 41.0244140625, 44.572265625, 48.1201171875, 51.66796875, 55.2158203125, 58.763671875, 62.3115234375, 65.859375, 69.4072265625, 72.955078125, 76.5029296875, 80.05078125, 83.5986328125, 87.146484375, 90.6943359375, 94.2421875, 97.7900390625, 101.337890625, 104.8857421875, 108.43359375, 111.9814453125, 115.529296875, 119.0771484375, 122.625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 7.0, 8.0, 9.0, 10.0, 10.0, 14.0, 14.0, 19.0, 33.0, 51.0, 65.0, 113.0, 205.0, 399.0, 908.0, 2731.0, 11236.0, 72302.0, 793535.0, 141911.0, 18691.0, 3921.0, 1155.0, 526.0, 256.0, 132.0, 78.0, 61.0, 36.0, 30.0, 31.0, 11.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -27.13037109375, -26.2451171875, -25.35986328125, -24.474609375, -23.58935546875, -22.7041015625, -21.81884765625, -20.93359375, -20.04833984375, -19.1630859375, -18.27783203125, -17.392578125, -16.50732421875, -15.6220703125, -14.73681640625, -13.8515625, -12.96630859375, -12.0810546875, -11.19580078125, -10.310546875, -9.42529296875, -8.5400390625, -7.65478515625, -6.76953125, -5.88427734375, -4.9990234375, -4.11376953125, -3.228515625, -2.34326171875, -1.4580078125, -0.57275390625, 0.3125, 1.19775390625, 2.0830078125, 2.96826171875, 3.853515625, 4.73876953125, 5.6240234375, 6.50927734375, 7.39453125, 8.27978515625, 9.1650390625, 10.05029296875, 10.935546875, 11.82080078125, 12.7060546875, 13.59130859375, 14.4765625, 15.36181640625, 16.2470703125, 17.13232421875, 18.017578125, 18.90283203125, 19.7880859375, 20.67333984375, 21.55859375, 22.44384765625, 23.3291015625, 24.21435546875, 25.099609375, 25.98486328125, 26.8701171875, 27.75537109375, 28.640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 2.0, 5.0, 7.0, 8.0, 9.0, 10.0, 10.0, 12.0, 12.0, 25.0, 21.0, 43.0, 42.0, 48.0, 72.0, 93.0, 111.0, 101.0, 73.0, 56.0, 45.0, 42.0, 25.0, 23.0, 19.0, 17.0, 12.0, 15.0, 7.0, 11.0, 5.0, 2.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004932403564453125, -0.0047754645347595215, -0.004618525505065918, -0.0044615864753723145, -0.004304647445678711, -0.004147708415985107, -0.003990769386291504, -0.0038338303565979004, -0.003676891326904297, -0.0035199522972106934, -0.00336301326751709, -0.0032060742378234863, -0.003049135208129883, -0.0028921961784362793, -0.0027352571487426758, -0.0025783181190490723, -0.0024213790893554688, -0.0022644400596618652, -0.0021075010299682617, -0.0019505620002746582, -0.0017936229705810547, -0.0016366839408874512, -0.0014797449111938477, -0.0013228058815002441, -0.0011658668518066406, -0.0010089278221130371, -0.0008519887924194336, -0.0006950497627258301, -0.0005381107330322266, -0.00038117170333862305, -0.00022423267364501953, -6.729364395141602e-05, 8.96453857421875e-05, 0.000246584415435791, 0.00040352344512939453, 0.000560462474822998, 0.0007174015045166016, 0.0008743405342102051, 0.0010312795639038086, 0.0011882185935974121, 0.0013451576232910156, 0.0015020966529846191, 0.0016590356826782227, 0.0018159747123718262, 0.0019729137420654297, 0.002129852771759033, 0.0022867918014526367, 0.0024437308311462402, 0.0026006698608398438, 0.0027576088905334473, 0.0029145479202270508, 0.0030714869499206543, 0.003228425979614258, 0.0033853650093078613, 0.003542304039001465, 0.0036992430686950684, 0.003856182098388672, 0.004013121128082275, 0.004170060157775879, 0.004326999187469482, 0.004483938217163086, 0.0046408772468566895, 0.004797816276550293, 0.0049547553062438965, 0.0051116943359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 6.0, 3.0, 5.0, 7.0, 5.0, 6.0, 9.0, 17.0, 20.0, 34.0, 42.0, 73.0, 94.0, 151.0, 236.0, 390.0, 652.0, 1435.0, 3172.0, 9067.0, 32412.0, 165598.0, 696407.0, 103860.0, 22696.0, 6808.0, 2586.0, 1177.0, 606.0, 347.0, 202.0, 138.0, 90.0, 58.0, 48.0, 33.0, 20.0, 18.0, 10.0, 9.0, 4.0, 7.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.734375, -18.13720703125, -17.5400390625, -16.94287109375, -16.345703125, -15.74853515625, -15.1513671875, -14.55419921875, -13.95703125, -13.35986328125, -12.7626953125, -12.16552734375, -11.568359375, -10.97119140625, -10.3740234375, -9.77685546875, -9.1796875, -8.58251953125, -7.9853515625, -7.38818359375, -6.791015625, -6.19384765625, -5.5966796875, -4.99951171875, -4.40234375, -3.80517578125, -3.2080078125, -2.61083984375, -2.013671875, -1.41650390625, -0.8193359375, -0.22216796875, 0.375, 0.97216796875, 1.5693359375, 2.16650390625, 2.763671875, 3.36083984375, 3.9580078125, 4.55517578125, 5.15234375, 5.74951171875, 6.3466796875, 6.94384765625, 7.541015625, 8.13818359375, 8.7353515625, 9.33251953125, 9.9296875, 10.52685546875, 11.1240234375, 11.72119140625, 12.318359375, 12.91552734375, 13.5126953125, 14.10986328125, 14.70703125, 15.30419921875, 15.9013671875, 16.49853515625, 17.095703125, 17.69287109375, 18.2900390625, 18.88720703125, 19.484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 12.0, 6.0, 11.0, 18.0, 20.0, 28.0, 44.0, 49.0, 68.0, 88.0, 105.0, 134.0, 97.0, 77.0, 69.0, 35.0, 27.0, 38.0, 21.0, 13.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.265625, -22.492919921875, -21.72021484375, -20.947509765625, -20.1748046875, -19.402099609375, -18.62939453125, -17.856689453125, -17.083984375, -16.311279296875, -15.53857421875, -14.765869140625, -13.9931640625, -13.220458984375, -12.44775390625, -11.675048828125, -10.90234375, -10.129638671875, -9.35693359375, -8.584228515625, -7.8115234375, -7.038818359375, -6.26611328125, -5.493408203125, -4.720703125, -3.947998046875, -3.17529296875, -2.402587890625, -1.6298828125, -0.857177734375, -0.08447265625, 0.688232421875, 1.4609375, 2.233642578125, 3.00634765625, 3.779052734375, 4.5517578125, 5.324462890625, 6.09716796875, 6.869873046875, 7.642578125, 8.415283203125, 9.18798828125, 9.960693359375, 10.7333984375, 11.506103515625, 12.27880859375, 13.051513671875, 13.82421875, 14.596923828125, 15.36962890625, 16.142333984375, 16.9150390625, 17.687744140625, 18.46044921875, 19.233154296875, 20.005859375, 20.778564453125, 21.55126953125, 22.323974609375, 23.0966796875, 23.869384765625, 24.64208984375, 25.414794921875, 26.1875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 11.0, 16.0, 31.0, 39.0, 98.0, 174.0, 302.0, 157.0, 76.0, 38.0, 25.0, 11.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-782.902587890625, -764.0009155273438, -745.0992431640625, -726.1976318359375, -707.2959594726562, -688.394287109375, -669.4926147460938, -650.5909423828125, -631.6893310546875, -612.7876586914062, -593.885986328125, -574.984375, -556.0827026367188, -537.1810302734375, -518.2793579101562, -499.377685546875, -480.47601318359375, -461.5743408203125, -442.6726989746094, -423.7710266113281, -404.869384765625, -385.96771240234375, -367.0660400390625, -348.16436767578125, -329.2627258300781, -310.3610534667969, -291.45941162109375, -272.5577392578125, -253.6560821533203, -234.75442504882812, -215.85275268554688, -196.9510955810547, -178.0494384765625, -159.1477813720703, -140.24612426757812, -121.34445190429688, -102.44279479980469, -83.5411376953125, -64.63947296142578, -45.73780822753906, -26.836151123046875, -7.934490203857422, 10.967170715332031, 29.868831634521484, 48.77049255371094, 67.67214965820312, 86.57381439208984, 105.47547912597656, 124.37713623046875, 143.27879333496094, 162.18045043945312, 181.08212280273438, 199.98377990722656, 218.88543701171875, 237.787109375, 256.68878173828125, 275.5904235839844, 294.4920959472656, 313.39373779296875, 332.29541015625, 351.19708251953125, 370.0987243652344, 389.0003967285156, 407.90203857421875, 426.8037109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 2.0, 3.0, 9.0, 6.0, 10.0, 8.0, 13.0, 15.0, 15.0, 26.0, 27.0, 30.0, 26.0, 31.0, 32.0, 34.0, 47.0, 67.0, 104.0, 97.0, 53.0, 46.0, 37.0, 30.0, 28.0, 28.0, 26.0, 20.0, 22.0, 16.0, 17.0, 13.0, 13.0, 12.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.5806884765625, -352.6942138671875, -340.8077392578125, -328.9212646484375, -317.0347900390625, -305.1483459472656, -293.2618713378906, -281.3753967285156, -269.4889221191406, -257.6024475097656, -245.71597290039062, -233.8295135498047, -221.9430389404297, -210.0565643310547, -198.17010498046875, -186.28363037109375, -174.39715576171875, -162.51068115234375, -150.62420654296875, -138.7377471923828, -126.85127258300781, -114.96479797363281, -103.07833099365234, -91.19186401367188, -79.30538940429688, -67.41891479492188, -55.532447814941406, -43.64597702026367, -31.759506225585938, -19.873035430908203, -7.986564636230469, 3.89990234375, 15.786376953125, 27.672847747802734, 39.55931854248047, 51.4457893371582, 63.33226013183594, 75.21873474121094, 87.1052017211914, 98.99166870117188, 110.87814331054688, 122.76461791992188, 134.65109252929688, 146.5375518798828, 158.4240264892578, 170.3105010986328, 182.19696044921875, 194.08343505859375, 205.96990966796875, 217.85638427734375, 229.74285888671875, 241.6293182373047, 253.5157928466797, 265.4022521972656, 277.2887268066406, 289.1752014160156, 301.0616760253906, 312.9481506347656, 324.8346252441406, 336.7210998535156, 348.6075439453125, 360.4940185546875, 372.3804931640625, 384.2669677734375, 396.1534423828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 12.0, 10.0, 16.0, 14.0, 33.0, 25.0, 49.0, 73.0, 132.0, 178.0, 357.0, 778.0, 2397.0, 10229.0, 89069.0, 2551905.0, 1480152.0, 48028.0, 7332.0, 1868.0, 676.0, 320.0, 193.0, 138.0, 74.0, 63.0, 36.0, 17.0, 24.0, 26.0, 11.0, 11.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-65.375, -63.1884765625, -61.001953125, -58.8154296875, -56.62890625, -54.4423828125, -52.255859375, -50.0693359375, -47.8828125, -45.6962890625, -43.509765625, -41.3232421875, -39.13671875, -36.9501953125, -34.763671875, -32.5771484375, -30.390625, -28.2041015625, -26.017578125, -23.8310546875, -21.64453125, -19.4580078125, -17.271484375, -15.0849609375, -12.8984375, -10.7119140625, -8.525390625, -6.3388671875, -4.15234375, -1.9658203125, 0.220703125, 2.4072265625, 4.59375, 6.7802734375, 8.966796875, 11.1533203125, 13.33984375, 15.5263671875, 17.712890625, 19.8994140625, 22.0859375, 24.2724609375, 26.458984375, 28.6455078125, 30.83203125, 33.0185546875, 35.205078125, 37.3916015625, 39.578125, 41.7646484375, 43.951171875, 46.1376953125, 48.32421875, 50.5107421875, 52.697265625, 54.8837890625, 57.0703125, 59.2568359375, 61.443359375, 63.6298828125, 65.81640625, 68.0029296875, 70.189453125, 72.3759765625, 74.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 5.0, 7.0, 12.0, 6.0, 10.0, 13.0, 16.0, 18.0, 30.0, 30.0, 45.0, 44.0, 41.0, 42.0, 57.0, 46.0, 53.0, 52.0, 36.0, 45.0, 48.0, 46.0, 37.0, 28.0, 37.0, 25.0, 23.0, 25.0, 16.0, 21.0, 19.0, 12.0, 12.0, 11.0, 5.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.265625, -24.356689453125, -23.44775390625, -22.538818359375, -21.6298828125, -20.720947265625, -19.81201171875, -18.903076171875, -17.994140625, -17.085205078125, -16.17626953125, -15.267333984375, -14.3583984375, -13.449462890625, -12.54052734375, -11.631591796875, -10.72265625, -9.813720703125, -8.90478515625, -7.995849609375, -7.0869140625, -6.177978515625, -5.26904296875, -4.360107421875, -3.451171875, -2.542236328125, -1.63330078125, -0.724365234375, 0.1845703125, 1.093505859375, 2.00244140625, 2.911376953125, 3.8203125, 4.729248046875, 5.63818359375, 6.547119140625, 7.4560546875, 8.364990234375, 9.27392578125, 10.182861328125, 11.091796875, 12.000732421875, 12.90966796875, 13.818603515625, 14.7275390625, 15.636474609375, 16.54541015625, 17.454345703125, 18.36328125, 19.272216796875, 20.18115234375, 21.090087890625, 21.9990234375, 22.907958984375, 23.81689453125, 24.725830078125, 25.634765625, 26.543701171875, 27.45263671875, 28.361572265625, 29.2705078125, 30.179443359375, 31.08837890625, 31.997314453125, 32.90625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 5.0, 9.0, 22.0, 25.0, 40.0, 55.0, 89.0, 154.0, 347.0, 1021.0, 3590.0, 20414.0, 359800.0, 3670385.0, 123828.0, 11000.0, 2263.0, 641.0, 254.0, 138.0, 61.0, 55.0, 20.0, 16.0, 5.0, 10.0, 8.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -67.8330078125, -65.353515625, -62.8740234375, -60.39453125, -57.9150390625, -55.435546875, -52.9560546875, -50.4765625, -47.9970703125, -45.517578125, -43.0380859375, -40.55859375, -38.0791015625, -35.599609375, -33.1201171875, -30.640625, -28.1611328125, -25.681640625, -23.2021484375, -20.72265625, -18.2431640625, -15.763671875, -13.2841796875, -10.8046875, -8.3251953125, -5.845703125, -3.3662109375, -0.88671875, 1.5927734375, 4.072265625, 6.5517578125, 9.03125, 11.5107421875, 13.990234375, 16.4697265625, 18.94921875, 21.4287109375, 23.908203125, 26.3876953125, 28.8671875, 31.3466796875, 33.826171875, 36.3056640625, 38.78515625, 41.2646484375, 43.744140625, 46.2236328125, 48.703125, 51.1826171875, 53.662109375, 56.1416015625, 58.62109375, 61.1005859375, 63.580078125, 66.0595703125, 68.5390625, 71.0185546875, 73.498046875, 75.9775390625, 78.45703125, 80.9365234375, 83.416015625, 85.8955078125, 88.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 14.0, 16.0, 18.0, 28.0, 36.0, 43.0, 75.0, 118.0, 185.0, 276.0, 472.0, 582.0, 718.0, 574.0, 306.0, 232.0, 135.0, 73.0, 50.0, 25.0, 18.0, 14.0, 17.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.55419921875, -56.6708984375, -54.78759765625, -52.904296875, -51.02099609375, -49.1376953125, -47.25439453125, -45.37109375, -43.48779296875, -41.6044921875, -39.72119140625, -37.837890625, -35.95458984375, -34.0712890625, -32.18798828125, -30.3046875, -28.42138671875, -26.5380859375, -24.65478515625, -22.771484375, -20.88818359375, -19.0048828125, -17.12158203125, -15.23828125, -13.35498046875, -11.4716796875, -9.58837890625, -7.705078125, -5.82177734375, -3.9384765625, -2.05517578125, -0.171875, 1.71142578125, 3.5947265625, 5.47802734375, 7.361328125, 9.24462890625, 11.1279296875, 13.01123046875, 14.89453125, 16.77783203125, 18.6611328125, 20.54443359375, 22.427734375, 24.31103515625, 26.1943359375, 28.07763671875, 29.9609375, 31.84423828125, 33.7275390625, 35.61083984375, 37.494140625, 39.37744140625, 41.2607421875, 43.14404296875, 45.02734375, 46.91064453125, 48.7939453125, 50.67724609375, 52.560546875, 54.44384765625, 56.3271484375, 58.21044921875, 60.09375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 14.0, 27.0, 51.0, 122.0, 231.0, 242.0, 187.0, 79.0, 20.0, 12.0, 6.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1182.080810546875, -1160.336669921875, -1138.5926513671875, -1116.8485107421875, -1095.1043701171875, -1073.3603515625, -1051.6162109375, -1029.8720703125, -1008.1279907226562, -986.3839111328125, -964.6397705078125, -942.8956909179688, -921.151611328125, -899.407470703125, -877.6633911132812, -855.9193115234375, -834.1751708984375, -812.4310913085938, -790.6869506835938, -768.94287109375, -747.19873046875, -725.4546508789062, -703.7105712890625, -681.9664306640625, -660.2223510742188, -638.478271484375, -616.734130859375, -594.9900512695312, -573.2459716796875, -551.5018310546875, -529.7577514648438, -508.0136413574219, -486.2695617675781, -464.52545166015625, -442.7813720703125, -421.0372619628906, -399.29315185546875, -377.5490417480469, -355.804931640625, -334.06085205078125, -312.3167419433594, -290.5726318359375, -268.82855224609375, -247.08444213867188, -225.34033203125, -203.59622192382812, -181.8521270751953, -160.1080322265625, -138.36392211914062, -116.61981964111328, -94.87571716308594, -73.1316146850586, -51.38751220703125, -29.643409729003906, -7.8993072509765625, 13.84478759765625, 35.588897705078125, 57.33300018310547, 79.07710266113281, 100.82120513916016, 122.5653076171875, 144.30941772460938, 166.0535125732422, 187.797607421875, 209.54171752929688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 5.0, 5.0, 16.0, 9.0, 15.0, 8.0, 20.0, 26.0, 20.0, 34.0, 26.0, 33.0, 38.0, 42.0, 34.0, 49.0, 54.0, 45.0, 45.0, 43.0, 36.0, 27.0, 38.0, 42.0, 32.0, 27.0, 29.0, 24.0, 28.0, 20.0, 9.0, 17.0, 18.0, 15.0, 11.0, 8.0, 5.0, 5.0, 7.0, 3.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-232.91329956054688, -225.816162109375, -218.71902465820312, -211.62188720703125, -204.52474975585938, -197.4276123046875, -190.33047485351562, -183.23333740234375, -176.13619995117188, -169.0390625, -161.94192504882812, -154.84478759765625, -147.74765014648438, -140.6505126953125, -133.55337524414062, -126.45623779296875, -119.35910034179688, -112.261962890625, -105.16482543945312, -98.06768798828125, -90.97055053710938, -83.8734130859375, -76.77627563476562, -69.67913818359375, -62.582000732421875, -55.48486328125, -48.387725830078125, -41.29058837890625, -34.193450927734375, -27.0963134765625, -19.999176025390625, -12.90203857421875, -5.8048858642578125, 1.2922515869140625, 8.389389038085938, 15.486526489257812, 22.583663940429688, 29.680801391601562, 36.77793884277344, 43.87507629394531, 50.97221374511719, 58.06935119628906, 65.16648864746094, 72.26362609863281, 79.36076354980469, 86.45790100097656, 93.55503845214844, 100.65217590332031, 107.74931335449219, 114.84645080566406, 121.94358825683594, 129.0407257080078, 136.1378631591797, 143.23500061035156, 150.33213806152344, 157.4292755126953, 164.5264129638672, 171.62355041503906, 178.72068786621094, 185.8178253173828, 192.9149627685547, 200.01210021972656, 207.10923767089844, 214.2063751220703, 221.3035125732422]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 10.0, 9.0, 11.0, 24.0, 39.0, 81.0, 155.0, 415.0, 1197.0, 3683.0, 13863.0, 66688.0, 442617.0, 435309.0, 65014.0, 13792.0, 3723.0, 1143.0, 407.0, 159.0, 93.0, 49.0, 20.0, 22.0, 8.0, 0.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.75, -82.015625, -79.28125, -76.546875, -73.8125, -71.078125, -68.34375, -65.609375, -62.875, -60.140625, -57.40625, -54.671875, -51.9375, -49.203125, -46.46875, -43.734375, -41.0, -38.265625, -35.53125, -32.796875, -30.0625, -27.328125, -24.59375, -21.859375, -19.125, -16.390625, -13.65625, -10.921875, -8.1875, -5.453125, -2.71875, 0.015625, 2.75, 5.484375, 8.21875, 10.953125, 13.6875, 16.421875, 19.15625, 21.890625, 24.625, 27.359375, 30.09375, 32.828125, 35.5625, 38.296875, 41.03125, 43.765625, 46.5, 49.234375, 51.96875, 54.703125, 57.4375, 60.171875, 62.90625, 65.640625, 68.375, 71.109375, 73.84375, 76.578125, 79.3125, 82.046875, 84.78125, 87.515625, 90.25]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 7.0, 6.0, 12.0, 15.0, 16.0, 18.0, 22.0, 15.0, 26.0, 29.0, 40.0, 47.0, 53.0, 39.0, 49.0, 42.0, 46.0, 56.0, 35.0, 51.0, 49.0, 43.0, 37.0, 37.0, 25.0, 28.0, 26.0, 28.0, 16.0, 18.0, 12.0, 14.0, 6.0, 5.0, 5.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -25.034423828125, -24.11572265625, -23.197021484375, -22.2783203125, -21.359619140625, -20.44091796875, -19.522216796875, -18.603515625, -17.684814453125, -16.76611328125, -15.847412109375, -14.9287109375, -14.010009765625, -13.09130859375, -12.172607421875, -11.25390625, -10.335205078125, -9.41650390625, -8.497802734375, -7.5791015625, -6.660400390625, -5.74169921875, -4.822998046875, -3.904296875, -2.985595703125, -2.06689453125, -1.148193359375, -0.2294921875, 0.689208984375, 1.60791015625, 2.526611328125, 3.4453125, 4.364013671875, 5.28271484375, 6.201416015625, 7.1201171875, 8.038818359375, 8.95751953125, 9.876220703125, 10.794921875, 11.713623046875, 12.63232421875, 13.551025390625, 14.4697265625, 15.388427734375, 16.30712890625, 17.225830078125, 18.14453125, 19.063232421875, 19.98193359375, 20.900634765625, 21.8193359375, 22.738037109375, 23.65673828125, 24.575439453125, 25.494140625, 26.412841796875, 27.33154296875, 28.250244140625, 29.1689453125, 30.087646484375, 31.00634765625, 31.925048828125, 32.84375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 1.0, 5.0, 12.0, 9.0, 22.0, 29.0, 33.0, 43.0, 89.0, 117.0, 150.0, 248.0, 398.0, 584.0, 1115.0, 2407.0, 8985.0, 79718.0, 860347.0, 80090.0, 8934.0, 2371.0, 1092.0, 598.0, 388.0, 235.0, 157.0, 112.0, 73.0, 56.0, 45.0, 25.0, 16.0, 10.0, 11.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-101.8125, -98.361328125, -94.91015625, -91.458984375, -88.0078125, -84.556640625, -81.10546875, -77.654296875, -74.203125, -70.751953125, -67.30078125, -63.849609375, -60.3984375, -56.947265625, -53.49609375, -50.044921875, -46.59375, -43.142578125, -39.69140625, -36.240234375, -32.7890625, -29.337890625, -25.88671875, -22.435546875, -18.984375, -15.533203125, -12.08203125, -8.630859375, -5.1796875, -1.728515625, 1.72265625, 5.173828125, 8.625, 12.076171875, 15.52734375, 18.978515625, 22.4296875, 25.880859375, 29.33203125, 32.783203125, 36.234375, 39.685546875, 43.13671875, 46.587890625, 50.0390625, 53.490234375, 56.94140625, 60.392578125, 63.84375, 67.294921875, 70.74609375, 74.197265625, 77.6484375, 81.099609375, 84.55078125, 88.001953125, 91.453125, 94.904296875, 98.35546875, 101.806640625, 105.2578125, 108.708984375, 112.16015625, 115.611328125, 119.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 3.0, 7.0, 4.0, 10.0, 11.0, 20.0, 16.0, 20.0, 26.0, 37.0, 28.0, 44.0, 57.0, 53.0, 49.0, 79.0, 60.0, 60.0, 61.0, 61.0, 43.0, 41.0, 30.0, 28.0, 29.0, 15.0, 21.0, 18.0, 15.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.625, -117.646484375, -113.66796875, -109.689453125, -105.7109375, -101.732421875, -97.75390625, -93.775390625, -89.796875, -85.818359375, -81.83984375, -77.861328125, -73.8828125, -69.904296875, -65.92578125, -61.947265625, -57.96875, -53.990234375, -50.01171875, -46.033203125, -42.0546875, -38.076171875, -34.09765625, -30.119140625, -26.140625, -22.162109375, -18.18359375, -14.205078125, -10.2265625, -6.248046875, -2.26953125, 1.708984375, 5.6875, 9.666015625, 13.64453125, 17.623046875, 21.6015625, 25.580078125, 29.55859375, 33.537109375, 37.515625, 41.494140625, 45.47265625, 49.451171875, 53.4296875, 57.408203125, 61.38671875, 65.365234375, 69.34375, 73.322265625, 77.30078125, 81.279296875, 85.2578125, 89.236328125, 93.21484375, 97.193359375, 101.171875, 105.150390625, 109.12890625, 113.107421875, 117.0859375, 121.064453125, 125.04296875, 129.021484375, 133.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 14.0, 12.0, 33.0, 28.0, 36.0, 79.0, 122.0, 212.0, 407.0, 782.0, 2032.0, 6478.0, 44538.0, 886047.0, 93470.0, 9554.0, 2629.0, 986.0, 447.0, 229.0, 125.0, 82.0, 50.0, 35.0, 26.0, 13.0, 17.0, 12.0, 14.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.703125, -30.633056640625, -29.56298828125, -28.492919921875, -27.4228515625, -26.352783203125, -25.28271484375, -24.212646484375, -23.142578125, -22.072509765625, -21.00244140625, -19.932373046875, -18.8623046875, -17.792236328125, -16.72216796875, -15.652099609375, -14.58203125, -13.511962890625, -12.44189453125, -11.371826171875, -10.3017578125, -9.231689453125, -8.16162109375, -7.091552734375, -6.021484375, -4.951416015625, -3.88134765625, -2.811279296875, -1.7412109375, -0.671142578125, 0.39892578125, 1.468994140625, 2.5390625, 3.609130859375, 4.67919921875, 5.749267578125, 6.8193359375, 7.889404296875, 8.95947265625, 10.029541015625, 11.099609375, 12.169677734375, 13.23974609375, 14.309814453125, 15.3798828125, 16.449951171875, 17.52001953125, 18.590087890625, 19.66015625, 20.730224609375, 21.80029296875, 22.870361328125, 23.9404296875, 25.010498046875, 26.08056640625, 27.150634765625, 28.220703125, 29.290771484375, 30.36083984375, 31.430908203125, 32.5009765625, 33.571044921875, 34.64111328125, 35.711181640625, 36.78125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 2.0, 8.0, 9.0, 13.0, 12.0, 14.0, 15.0, 35.0, 47.0, 61.0, 87.0, 144.0, 156.0, 115.0, 67.0, 52.0, 29.0, 33.0, 24.0, 14.0, 18.0, 6.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005748748779296875, -0.005529940128326416, -0.005311131477355957, -0.005092322826385498, -0.004873514175415039, -0.00465470552444458, -0.004435896873474121, -0.004217088222503662, -0.003998279571533203, -0.003779470920562744, -0.003560662269592285, -0.003341853618621826, -0.003123044967651367, -0.002904236316680908, -0.0026854276657104492, -0.0024666190147399902, -0.0022478103637695312, -0.0020290017127990723, -0.0018101930618286133, -0.0015913844108581543, -0.0013725757598876953, -0.0011537671089172363, -0.0009349584579467773, -0.0007161498069763184, -0.0004973411560058594, -0.0002785325050354004, -5.9723854064941406e-05, 0.00015908479690551758, 0.00037789344787597656, 0.0005967020988464355, 0.0008155107498168945, 0.0010343194007873535, 0.0012531280517578125, 0.0014719367027282715, 0.0016907453536987305, 0.0019095540046691895, 0.0021283626556396484, 0.0023471713066101074, 0.0025659799575805664, 0.0027847886085510254, 0.0030035972595214844, 0.0032224059104919434, 0.0034412145614624023, 0.0036600232124328613, 0.0038788318634033203, 0.004097640514373779, 0.004316449165344238, 0.004535257816314697, 0.004754066467285156, 0.004972875118255615, 0.005191683769226074, 0.005410492420196533, 0.005629301071166992, 0.005848109722137451, 0.00606691837310791, 0.006285727024078369, 0.006504535675048828, 0.006723344326019287, 0.006942152976989746, 0.007160961627960205, 0.007379770278930664, 0.007598578929901123, 0.007817387580871582, 0.008036196231842041, 0.0082550048828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 12.0, 13.0, 20.0, 11.0, 29.0, 26.0, 48.0, 60.0, 89.0, 122.0, 170.0, 240.0, 391.0, 731.0, 1300.0, 2721.0, 6852.0, 24499.0, 207295.0, 734738.0, 50904.0, 10450.0, 3749.0, 1711.0, 881.0, 491.0, 308.0, 204.0, 130.0, 86.0, 71.0, 45.0, 28.0, 33.0, 11.0, 10.0, 14.0, 14.0, 10.0, 4.0, 7.0, 3.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0], "bins": [-24.265625, -23.576171875, -22.88671875, -22.197265625, -21.5078125, -20.818359375, -20.12890625, -19.439453125, -18.75, -18.060546875, -17.37109375, -16.681640625, -15.9921875, -15.302734375, -14.61328125, -13.923828125, -13.234375, -12.544921875, -11.85546875, -11.166015625, -10.4765625, -9.787109375, -9.09765625, -8.408203125, -7.71875, -7.029296875, -6.33984375, -5.650390625, -4.9609375, -4.271484375, -3.58203125, -2.892578125, -2.203125, -1.513671875, -0.82421875, -0.134765625, 0.5546875, 1.244140625, 1.93359375, 2.623046875, 3.3125, 4.001953125, 4.69140625, 5.380859375, 6.0703125, 6.759765625, 7.44921875, 8.138671875, 8.828125, 9.517578125, 10.20703125, 10.896484375, 11.5859375, 12.275390625, 12.96484375, 13.654296875, 14.34375, 15.033203125, 15.72265625, 16.412109375, 17.1015625, 17.791015625, 18.48046875, 19.169921875, 19.859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 13.0, 11.0, 24.0, 33.0, 28.0, 47.0, 50.0, 56.0, 79.0, 89.0, 99.0, 111.0, 73.0, 70.0, 46.0, 28.0, 38.0, 20.0, 14.0, 10.0, 8.0, 8.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.59375, -20.97998046875, -20.3662109375, -19.75244140625, -19.138671875, -18.52490234375, -17.9111328125, -17.29736328125, -16.68359375, -16.06982421875, -15.4560546875, -14.84228515625, -14.228515625, -13.61474609375, -13.0009765625, -12.38720703125, -11.7734375, -11.15966796875, -10.5458984375, -9.93212890625, -9.318359375, -8.70458984375, -8.0908203125, -7.47705078125, -6.86328125, -6.24951171875, -5.6357421875, -5.02197265625, -4.408203125, -3.79443359375, -3.1806640625, -2.56689453125, -1.953125, -1.33935546875, -0.7255859375, -0.11181640625, 0.501953125, 1.11572265625, 1.7294921875, 2.34326171875, 2.95703125, 3.57080078125, 4.1845703125, 4.79833984375, 5.412109375, 6.02587890625, 6.6396484375, 7.25341796875, 7.8671875, 8.48095703125, 9.0947265625, 9.70849609375, 10.322265625, 10.93603515625, 11.5498046875, 12.16357421875, 12.77734375, 13.39111328125, 14.0048828125, 14.61865234375, 15.232421875, 15.84619140625, 16.4599609375, 17.07373046875, 17.6875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 12.0, 19.0, 80.0, 216.0, 488.0, 123.0, 40.0, 7.0, 8.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-560.6902465820312, -526.1357421875, -491.5812072753906, -457.02667236328125, -422.47216796875, -387.91766357421875, -353.3631286621094, -318.80859375, -284.25408935546875, -249.69956970214844, -215.14505004882812, -180.5905303955078, -146.0360107421875, -111.48149108886719, -76.92697143554688, -42.37245178222656, -7.81793212890625, 26.736587524414062, 61.291107177734375, 95.84562683105469, 130.400146484375, 164.9546661376953, 199.50918579101562, 234.06370544433594, 268.61822509765625, 303.1727294921875, 337.7272644042969, 372.28179931640625, 406.8363037109375, 441.39080810546875, 475.9453430175781, 510.4998779296875, 545.0543212890625, 579.6088256835938, 614.163330078125, 648.7178955078125, 683.2723999023438, 717.826904296875, 752.3814697265625, 786.9359741210938, 821.490478515625, 856.0449829101562, 890.5994873046875, 925.154052734375, 959.7085571289062, 994.2630615234375, 1028.817626953125, 1063.3720703125, 1097.9266357421875, 1132.481201171875, 1167.03564453125, 1201.5902099609375, 1236.144775390625, 1270.69921875, 1305.2537841796875, 1339.8082275390625, 1374.36279296875, 1408.9173583984375, 1443.4718017578125, 1478.0263671875, 1512.580810546875, 1547.1353759765625, 1581.68994140625, 1616.244384765625, 1650.7989501953125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 2.0, 7.0, 8.0, 6.0, 6.0, 12.0, 4.0, 5.0, 16.0, 12.0, 17.0, 26.0, 23.0, 19.0, 36.0, 36.0, 24.0, 39.0, 82.0, 130.0, 108.0, 65.0, 35.0, 39.0, 25.0, 25.0, 28.0, 23.0, 22.0, 28.0, 22.0, 7.0, 12.0, 10.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-390.56060791015625, -379.00103759765625, -367.4414978027344, -355.8819274902344, -344.3223876953125, -332.7628173828125, -321.2032470703125, -309.6437072753906, -298.08416748046875, -286.52459716796875, -274.9650573730469, -263.4054870605469, -251.845947265625, -240.286376953125, -228.72682189941406, -217.16726684570312, -205.60769653320312, -194.0481414794922, -182.48858642578125, -170.92901611328125, -159.36947631835938, -147.80990600585938, -136.25035095214844, -124.6907958984375, -113.13124084472656, -101.57168579101562, -90.01213073730469, -78.45256805419922, -66.89301300048828, -55.333457946777344, -43.773895263671875, -32.21434020996094, -20.654815673828125, -9.095258712768555, 2.4642982482910156, 14.023857116699219, 25.583412170410156, 37.142967224121094, 48.70252990722656, 60.2620849609375, 71.82164001464844, 83.38119506835938, 94.94075012207031, 106.50031280517578, 118.05986785888672, 129.61941528320312, 141.17898559570312, 152.73854064941406, 164.298095703125, 175.85765075683594, 187.41720581054688, 198.97677612304688, 210.53631591796875, 222.09588623046875, 233.6554412841797, 245.21499633789062, 256.7745361328125, 268.3341064453125, 279.8936462402344, 291.4532165527344, 303.01275634765625, 314.57232666015625, 326.13189697265625, 337.6914367675781, 349.2510070800781]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 14.0, 19.0, 30.0, 30.0, 47.0, 71.0, 107.0, 161.0, 280.0, 541.0, 1002.0, 2429.0, 7090.0, 33662.0, 411115.0, 2818302.0, 846221.0, 56641.0, 10053.0, 3275.0, 1404.0, 727.0, 411.0, 209.0, 140.0, 96.0, 64.0, 38.0, 21.0, 25.0, 15.0, 9.0, 5.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.25, -57.025390625, -54.80078125, -52.576171875, -50.3515625, -48.126953125, -45.90234375, -43.677734375, -41.453125, -39.228515625, -37.00390625, -34.779296875, -32.5546875, -30.330078125, -28.10546875, -25.880859375, -23.65625, -21.431640625, -19.20703125, -16.982421875, -14.7578125, -12.533203125, -10.30859375, -8.083984375, -5.859375, -3.634765625, -1.41015625, 0.814453125, 3.0390625, 5.263671875, 7.48828125, 9.712890625, 11.9375, 14.162109375, 16.38671875, 18.611328125, 20.8359375, 23.060546875, 25.28515625, 27.509765625, 29.734375, 31.958984375, 34.18359375, 36.408203125, 38.6328125, 40.857421875, 43.08203125, 45.306640625, 47.53125, 49.755859375, 51.98046875, 54.205078125, 56.4296875, 58.654296875, 60.87890625, 63.103515625, 65.328125, 67.552734375, 69.77734375, 72.001953125, 74.2265625, 76.451171875, 78.67578125, 80.900390625, 83.125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 12.0, 10.0, 16.0, 18.0, 15.0, 20.0, 15.0, 28.0, 36.0, 43.0, 44.0, 49.0, 43.0, 61.0, 67.0, 52.0, 51.0, 49.0, 47.0, 65.0, 43.0, 33.0, 24.0, 19.0, 22.0, 32.0, 19.0, 16.0, 12.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.5, -32.529541015625, -31.55908203125, -30.588623046875, -29.6181640625, -28.647705078125, -27.67724609375, -26.706787109375, -25.736328125, -24.765869140625, -23.79541015625, -22.824951171875, -21.8544921875, -20.884033203125, -19.91357421875, -18.943115234375, -17.97265625, -17.002197265625, -16.03173828125, -15.061279296875, -14.0908203125, -13.120361328125, -12.14990234375, -11.179443359375, -10.208984375, -9.238525390625, -8.26806640625, -7.297607421875, -6.3271484375, -5.356689453125, -4.38623046875, -3.415771484375, -2.4453125, -1.474853515625, -0.50439453125, 0.466064453125, 1.4365234375, 2.406982421875, 3.37744140625, 4.347900390625, 5.318359375, 6.288818359375, 7.25927734375, 8.229736328125, 9.2001953125, 10.170654296875, 11.14111328125, 12.111572265625, 13.08203125, 14.052490234375, 15.02294921875, 15.993408203125, 16.9638671875, 17.934326171875, 18.90478515625, 19.875244140625, 20.845703125, 21.816162109375, 22.78662109375, 23.757080078125, 24.7275390625, 25.697998046875, 26.66845703125, 27.638916015625, 28.609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 10.0, 11.0, 24.0, 27.0, 49.0, 65.0, 129.0, 188.0, 363.0, 779.0, 2027.0, 9205.0, 436631.0, 3712477.0, 25631.0, 3968.0, 1385.0, 563.0, 299.0, 160.0, 98.0, 60.0, 31.0, 32.0, 15.0, 15.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-187.75, -182.560546875, -177.37109375, -172.181640625, -166.9921875, -161.802734375, -156.61328125, -151.423828125, -146.234375, -141.044921875, -135.85546875, -130.666015625, -125.4765625, -120.287109375, -115.09765625, -109.908203125, -104.71875, -99.529296875, -94.33984375, -89.150390625, -83.9609375, -78.771484375, -73.58203125, -68.392578125, -63.203125, -58.013671875, -52.82421875, -47.634765625, -42.4453125, -37.255859375, -32.06640625, -26.876953125, -21.6875, -16.498046875, -11.30859375, -6.119140625, -0.9296875, 4.259765625, 9.44921875, 14.638671875, 19.828125, 25.017578125, 30.20703125, 35.396484375, 40.5859375, 45.775390625, 50.96484375, 56.154296875, 61.34375, 66.533203125, 71.72265625, 76.912109375, 82.1015625, 87.291015625, 92.48046875, 97.669921875, 102.859375, 108.048828125, 113.23828125, 118.427734375, 123.6171875, 128.806640625, 133.99609375, 139.185546875, 144.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 11.0, 18.0, 26.0, 45.0, 90.0, 145.0, 226.0, 405.0, 507.0, 665.0, 610.0, 400.0, 313.0, 181.0, 113.0, 87.0, 59.0, 46.0, 20.0, 26.0, 19.0, 16.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.5625, -92.4150390625, -89.267578125, -86.1201171875, -82.97265625, -79.8251953125, -76.677734375, -73.5302734375, -70.3828125, -67.2353515625, -64.087890625, -60.9404296875, -57.79296875, -54.6455078125, -51.498046875, -48.3505859375, -45.203125, -42.0556640625, -38.908203125, -35.7607421875, -32.61328125, -29.4658203125, -26.318359375, -23.1708984375, -20.0234375, -16.8759765625, -13.728515625, -10.5810546875, -7.43359375, -4.2861328125, -1.138671875, 2.0087890625, 5.15625, 8.3037109375, 11.451171875, 14.5986328125, 17.74609375, 20.8935546875, 24.041015625, 27.1884765625, 30.3359375, 33.4833984375, 36.630859375, 39.7783203125, 42.92578125, 46.0732421875, 49.220703125, 52.3681640625, 55.515625, 58.6630859375, 61.810546875, 64.9580078125, 68.10546875, 71.2529296875, 74.400390625, 77.5478515625, 80.6953125, 83.8427734375, 86.990234375, 90.1376953125, 93.28515625, 96.4326171875, 99.580078125, 102.7275390625, 105.875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 15.0, 24.0, 195.0, 584.0, 134.0, 33.0, 13.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2136.615234375, -2025.388427734375, -1914.16162109375, -1802.9349365234375, -1691.7081298828125, -1580.4813232421875, -1469.254638671875, -1358.02783203125, -1246.801025390625, -1135.57421875, -1024.347412109375, -913.1207275390625, -801.8939208984375, -690.6671142578125, -579.4403686523438, -468.213623046875, -356.98681640625, -245.76004028320312, -134.53326416015625, -23.306488037109375, 87.9202880859375, 199.1470947265625, 310.37384033203125, 421.6005859375, 532.827392578125, 644.05419921875, 755.2809448242188, 866.5076904296875, 977.7344970703125, 1088.9613037109375, 1200.18798828125, 1311.414794921875, 1422.6416015625, 1533.868408203125, 1645.09521484375, 1756.3218994140625, 1867.5487060546875, 1978.7755126953125, 2090.002197265625, 2201.22900390625, 2312.455810546875, 2423.6826171875, 2534.909423828125, 2646.13623046875, 2757.36279296875, 2868.58984375, 2979.81640625, 3091.043212890625, 3202.27001953125, 3313.496826171875, 3424.7236328125, 3535.950439453125, 3647.17724609375, 3758.40380859375, 3869.630615234375, 3980.857421875, 4092.084228515625, 4203.31103515625, 4314.53759765625, 4425.7646484375, 4536.9912109375, 4648.21826171875, 4759.44482421875, 4870.671875, 4981.8984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 8.0, 2.0, 6.0, 9.0, 8.0, 10.0, 15.0, 15.0, 23.0, 22.0, 31.0, 34.0, 31.0, 48.0, 49.0, 66.0, 63.0, 77.0, 77.0, 94.0, 56.0, 43.0, 50.0, 25.0, 35.0, 17.0, 21.0, 16.0, 10.0, 12.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-747.901611328125, -723.1615600585938, -698.4215698242188, -673.6815185546875, -648.9414672851562, -624.201416015625, -599.46142578125, -574.7213745117188, -549.9813232421875, -525.2412719726562, -500.5012512207031, -475.76123046875, -451.02117919921875, -426.2811584472656, -401.5411376953125, -376.80108642578125, -352.0610656738281, -327.321044921875, -302.58099365234375, -277.8409729003906, -253.10092163085938, -228.36090087890625, -203.62086486816406, -178.88082885742188, -154.1407928466797, -129.4007568359375, -104.66072082519531, -79.92069244384766, -55.18065643310547, -30.44062042236328, -5.700592041015625, 19.039443969726562, 43.77947998046875, 68.51951599121094, 93.25955200195312, 117.99958038330078, 142.7396240234375, 167.47964477539062, 192.2196807861328, 216.959716796875, 241.6997528076172, 266.4397888183594, 291.1798095703125, 315.91986083984375, 340.6598815917969, 365.3999328613281, 390.13995361328125, 414.8800048828125, 439.6200256347656, 464.36004638671875, 489.10009765625, 513.8401489257812, 538.5801391601562, 563.3201904296875, 588.0602416992188, 612.80029296875, 637.540283203125, 662.2803344726562, 687.0203247070312, 711.7603759765625, 736.5004272460938, 761.240478515625, 785.98046875, 810.7205200195312, 835.4605712890625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 10.0, 13.0, 12.0, 13.0, 18.0, 30.0, 40.0, 63.0, 101.0, 150.0, 230.0, 321.0, 592.0, 1012.0, 2227.0, 5333.0, 14673.0, 50348.0, 245975.0, 589773.0, 97276.0, 25253.0, 8208.0, 3413.0, 1493.0, 780.0, 453.0, 240.0, 153.0, 118.0, 69.0, 50.0, 32.0, 16.0, 10.0, 10.0, 10.0, 8.0, 9.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-58.15625, -56.2939453125, -54.431640625, -52.5693359375, -50.70703125, -48.8447265625, -46.982421875, -45.1201171875, -43.2578125, -41.3955078125, -39.533203125, -37.6708984375, -35.80859375, -33.9462890625, -32.083984375, -30.2216796875, -28.359375, -26.4970703125, -24.634765625, -22.7724609375, -20.91015625, -19.0478515625, -17.185546875, -15.3232421875, -13.4609375, -11.5986328125, -9.736328125, -7.8740234375, -6.01171875, -4.1494140625, -2.287109375, -0.4248046875, 1.4375, 3.2998046875, 5.162109375, 7.0244140625, 8.88671875, 10.7490234375, 12.611328125, 14.4736328125, 16.3359375, 18.1982421875, 20.060546875, 21.9228515625, 23.78515625, 25.6474609375, 27.509765625, 29.3720703125, 31.234375, 33.0966796875, 34.958984375, 36.8212890625, 38.68359375, 40.5458984375, 42.408203125, 44.2705078125, 46.1328125, 47.9951171875, 49.857421875, 51.7197265625, 53.58203125, 55.4443359375, 57.306640625, 59.1689453125, 61.03125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 17.0, 19.0, 22.0, 27.0, 33.0, 50.0, 73.0, 58.0, 88.0, 87.0, 88.0, 77.0, 83.0, 74.0, 58.0, 36.0, 29.0, 19.0, 20.0, 11.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.125, -57.2158203125, -55.306640625, -53.3974609375, -51.48828125, -49.5791015625, -47.669921875, -45.7607421875, -43.8515625, -41.9423828125, -40.033203125, -38.1240234375, -36.21484375, -34.3056640625, -32.396484375, -30.4873046875, -28.578125, -26.6689453125, -24.759765625, -22.8505859375, -20.94140625, -19.0322265625, -17.123046875, -15.2138671875, -13.3046875, -11.3955078125, -9.486328125, -7.5771484375, -5.66796875, -3.7587890625, -1.849609375, 0.0595703125, 1.96875, 3.8779296875, 5.787109375, 7.6962890625, 9.60546875, 11.5146484375, 13.423828125, 15.3330078125, 17.2421875, 19.1513671875, 21.060546875, 22.9697265625, 24.87890625, 26.7880859375, 28.697265625, 30.6064453125, 32.515625, 34.4248046875, 36.333984375, 38.2431640625, 40.15234375, 42.0615234375, 43.970703125, 45.8798828125, 47.7890625, 49.6982421875, 51.607421875, 53.5166015625, 55.42578125, 57.3349609375, 59.244140625, 61.1533203125, 63.0625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 5.0, 12.0, 30.0, 43.0, 59.0, 91.0, 148.0, 244.0, 527.0, 1061.0, 3726.0, 33186.0, 942593.0, 59119.0, 5168.0, 1308.0, 552.0, 272.0, 152.0, 86.0, 55.0, 29.0, 35.0, 15.0, 6.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.75, -110.3642578125, -106.978515625, -103.5927734375, -100.20703125, -96.8212890625, -93.435546875, -90.0498046875, -86.6640625, -83.2783203125, -79.892578125, -76.5068359375, -73.12109375, -69.7353515625, -66.349609375, -62.9638671875, -59.578125, -56.1923828125, -52.806640625, -49.4208984375, -46.03515625, -42.6494140625, -39.263671875, -35.8779296875, -32.4921875, -29.1064453125, -25.720703125, -22.3349609375, -18.94921875, -15.5634765625, -12.177734375, -8.7919921875, -5.40625, -2.0205078125, 1.365234375, 4.7509765625, 8.13671875, 11.5224609375, 14.908203125, 18.2939453125, 21.6796875, 25.0654296875, 28.451171875, 31.8369140625, 35.22265625, 38.6083984375, 41.994140625, 45.3798828125, 48.765625, 52.1513671875, 55.537109375, 58.9228515625, 62.30859375, 65.6943359375, 69.080078125, 72.4658203125, 75.8515625, 79.2373046875, 82.623046875, 86.0087890625, 89.39453125, 92.7802734375, 96.166015625, 99.5517578125, 102.9375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 13.0, 15.0, 13.0, 15.0, 26.0, 48.0, 37.0, 54.0, 59.0, 93.0, 95.0, 100.0, 108.0, 77.0, 61.0, 42.0, 27.0, 26.0, 24.0, 15.0, 9.0, 10.0, 5.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-239.75, -233.109375, -226.46875, -219.828125, -213.1875, -206.546875, -199.90625, -193.265625, -186.625, -179.984375, -173.34375, -166.703125, -160.0625, -153.421875, -146.78125, -140.140625, -133.5, -126.859375, -120.21875, -113.578125, -106.9375, -100.296875, -93.65625, -87.015625, -80.375, -73.734375, -67.09375, -60.453125, -53.8125, -47.171875, -40.53125, -33.890625, -27.25, -20.609375, -13.96875, -7.328125, -0.6875, 5.953125, 12.59375, 19.234375, 25.875, 32.515625, 39.15625, 45.796875, 52.4375, 59.078125, 65.71875, 72.359375, 79.0, 85.640625, 92.28125, 98.921875, 105.5625, 112.203125, 118.84375, 125.484375, 132.125, 138.765625, 145.40625, 152.046875, 158.6875, 165.328125, 171.96875, 178.609375, 185.25]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 8.0, 10.0, 13.0, 11.0, 14.0, 12.0, 20.0, 21.0, 29.0, 41.0, 75.0, 127.0, 230.0, 544.0, 1549.0, 6642.0, 59734.0, 939250.0, 33294.0, 4628.0, 1236.0, 434.0, 209.0, 129.0, 63.0, 43.0, 45.0, 20.0, 18.0, 14.0, 10.0, 11.0, 9.0, 8.0, 9.0, 0.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.703125, -24.933349609375, -24.16357421875, -23.393798828125, -22.6240234375, -21.854248046875, -21.08447265625, -20.314697265625, -19.544921875, -18.775146484375, -18.00537109375, -17.235595703125, -16.4658203125, -15.696044921875, -14.92626953125, -14.156494140625, -13.38671875, -12.616943359375, -11.84716796875, -11.077392578125, -10.3076171875, -9.537841796875, -8.76806640625, -7.998291015625, -7.228515625, -6.458740234375, -5.68896484375, -4.919189453125, -4.1494140625, -3.379638671875, -2.60986328125, -1.840087890625, -1.0703125, -0.300537109375, 0.46923828125, 1.239013671875, 2.0087890625, 2.778564453125, 3.54833984375, 4.318115234375, 5.087890625, 5.857666015625, 6.62744140625, 7.397216796875, 8.1669921875, 8.936767578125, 9.70654296875, 10.476318359375, 11.24609375, 12.015869140625, 12.78564453125, 13.555419921875, 14.3251953125, 15.094970703125, 15.86474609375, 16.634521484375, 17.404296875, 18.174072265625, 18.94384765625, 19.713623046875, 20.4833984375, 21.253173828125, 22.02294921875, 22.792724609375, 23.5625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 11.0, 6.0, 14.0, 10.0, 19.0, 27.0, 30.0, 50.0, 76.0, 95.0, 139.0, 119.0, 105.0, 80.0, 42.0, 36.0, 24.0, 18.0, 17.0, 10.0, 12.0, 7.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00357818603515625, -0.0034590959548950195, -0.003340005874633789, -0.0032209157943725586, -0.003101825714111328, -0.0029827356338500977, -0.002863645553588867, -0.0027445554733276367, -0.0026254653930664062, -0.0025063753128051758, -0.0023872852325439453, -0.002268195152282715, -0.0021491050720214844, -0.002030014991760254, -0.0019109249114990234, -0.001791834831237793, -0.0016727447509765625, -0.001553654670715332, -0.0014345645904541016, -0.001315474510192871, -0.0011963844299316406, -0.0010772943496704102, -0.0009582042694091797, -0.0008391141891479492, -0.0007200241088867188, -0.0006009340286254883, -0.0004818439483642578, -0.00036275386810302734, -0.00024366378784179688, -0.0001245737075805664, -5.4836273193359375e-06, 0.00011360645294189453, 0.000232696533203125, 0.00035178661346435547, 0.00047087669372558594, 0.0005899667739868164, 0.0007090568542480469, 0.0008281469345092773, 0.0009472370147705078, 0.0010663270950317383, 0.0011854171752929688, 0.0013045072555541992, 0.0014235973358154297, 0.0015426874160766602, 0.0016617774963378906, 0.001780867576599121, 0.0018999576568603516, 0.002019047737121582, 0.0021381378173828125, 0.002257227897644043, 0.0023763179779052734, 0.002495408058166504, 0.0026144981384277344, 0.002733588218688965, 0.0028526782989501953, 0.0029717683792114258, 0.0030908584594726562, 0.0032099485397338867, 0.003329038619995117, 0.0034481287002563477, 0.003567218780517578, 0.0036863088607788086, 0.003805398941040039, 0.0039244890213012695, 0.0040435791015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 5.0, 8.0, 17.0, 23.0, 39.0, 45.0, 84.0, 185.0, 392.0, 1218.0, 5879.0, 59354.0, 943852.0, 31844.0, 4005.0, 952.0, 307.0, 159.0, 65.0, 42.0, 24.0, 13.0, 7.0, 13.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.859375, -28.162109375, -27.46484375, -26.767578125, -26.0703125, -25.373046875, -24.67578125, -23.978515625, -23.28125, -22.583984375, -21.88671875, -21.189453125, -20.4921875, -19.794921875, -19.09765625, -18.400390625, -17.703125, -17.005859375, -16.30859375, -15.611328125, -14.9140625, -14.216796875, -13.51953125, -12.822265625, -12.125, -11.427734375, -10.73046875, -10.033203125, -9.3359375, -8.638671875, -7.94140625, -7.244140625, -6.546875, -5.849609375, -5.15234375, -4.455078125, -3.7578125, -3.060546875, -2.36328125, -1.666015625, -0.96875, -0.271484375, 0.42578125, 1.123046875, 1.8203125, 2.517578125, 3.21484375, 3.912109375, 4.609375, 5.306640625, 6.00390625, 6.701171875, 7.3984375, 8.095703125, 8.79296875, 9.490234375, 10.1875, 10.884765625, 11.58203125, 12.279296875, 12.9765625, 13.673828125, 14.37109375, 15.068359375, 15.765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 7.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 12.0, 15.0, 28.0, 34.0, 63.0, 109.0, 112.0, 143.0, 114.0, 110.0, 79.0, 35.0, 30.0, 22.0, 12.0, 14.0, 8.0, 6.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.570556640625, -16.93798828125, -16.305419921875, -15.6728515625, -15.040283203125, -14.40771484375, -13.775146484375, -13.142578125, -12.510009765625, -11.87744140625, -11.244873046875, -10.6123046875, -9.979736328125, -9.34716796875, -8.714599609375, -8.08203125, -7.449462890625, -6.81689453125, -6.184326171875, -5.5517578125, -4.919189453125, -4.28662109375, -3.654052734375, -3.021484375, -2.388916015625, -1.75634765625, -1.123779296875, -0.4912109375, 0.141357421875, 0.77392578125, 1.406494140625, 2.0390625, 2.671630859375, 3.30419921875, 3.936767578125, 4.5693359375, 5.201904296875, 5.83447265625, 6.467041015625, 7.099609375, 7.732177734375, 8.36474609375, 8.997314453125, 9.6298828125, 10.262451171875, 10.89501953125, 11.527587890625, 12.16015625, 12.792724609375, 13.42529296875, 14.057861328125, 14.6904296875, 15.322998046875, 15.95556640625, 16.588134765625, 17.220703125, 17.853271484375, 18.48583984375, 19.118408203125, 19.7509765625, 20.383544921875, 21.01611328125, 21.648681640625, 22.28125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 6.0, 10.0, 13.0, 26.0, 72.0, 172.0, 558.0, 81.0, 30.0, 14.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1120.3734130859375, -1093.8857421875, -1067.3980712890625, -1040.910400390625, -1014.4226684570312, -987.9349365234375, -961.447265625, -934.9595947265625, -908.4718627929688, -881.9841918945312, -855.4964599609375, -829.0087890625, -802.5211181640625, -776.0333862304688, -749.5457153320312, -723.0579833984375, -696.5703125, -670.0826416015625, -643.5949096679688, -617.1072387695312, -590.6195678710938, -564.1318359375, -537.6441650390625, -511.1564636230469, -484.6688232421875, -458.1811218261719, -431.6934509277344, -405.20574951171875, -378.7180480957031, -352.2303466796875, -325.74267578125, -299.2549743652344, -272.76727294921875, -246.2795867919922, -219.79188537597656, -193.30419921875, -166.81649780273438, -140.3288116455078, -113.84112548828125, -87.35342407226562, -60.86573791503906, -34.37804412841797, -7.890354156494141, 18.597335815429688, 45.08502960205078, 71.57272338867188, 98.06040954589844, 124.54811096191406, 151.03579711914062, 177.5234832763672, 204.0111846923828, 230.49887084960938, 256.986572265625, 283.4742431640625, 309.9619445800781, 336.44964599609375, 362.93731689453125, 389.4250183105469, 415.9126892089844, 442.400390625, 468.8880920410156, 495.37579345703125, 521.8634643554688, 548.3511962890625, 574.8388671875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 16.0, 13.0, 25.0, 21.0, 33.0, 29.0, 45.0, 119.0, 290.0, 155.0, 49.0, 39.0, 36.0, 25.0, 22.0, 17.0, 16.0, 7.0, 7.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-667.7740478515625, -649.9910278320312, -632.2080078125, -614.4249267578125, -596.6419067382812, -578.85888671875, -561.0758056640625, -543.2927856445312, -525.509765625, -507.72674560546875, -489.9436950683594, -472.16064453125, -454.37762451171875, -436.5946044921875, -418.8115539550781, -401.02850341796875, -383.2454833984375, -365.46246337890625, -347.6794128417969, -329.8963623046875, -312.11334228515625, -294.330322265625, -276.5472717285156, -258.76422119140625, -240.981201171875, -223.1981658935547, -205.41513061523438, -187.63209533691406, -169.84906005859375, -152.06602478027344, -134.28298950195312, -116.49995422363281, -98.71685791015625, -80.93382263183594, -63.150787353515625, -45.36775207519531, -27.584716796875, -9.801681518554688, 7.981353759765625, 25.764389038085938, 43.54742431640625, 61.33045959472656, 79.11349487304688, 96.89653015136719, 114.6795654296875, 132.4626007080078, 150.24563598632812, 168.02867126464844, 185.81170654296875, 203.59474182128906, 221.37777709960938, 239.1608123779297, 256.94384765625, 274.72686767578125, 292.5099182128906, 310.29296875, 328.07598876953125, 345.8590087890625, 363.6420593261719, 381.42510986328125, 399.2081298828125, 416.99114990234375, 434.7742004394531, 452.5572509765625, 470.34027099609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 12.0, 11.0, 13.0, 15.0, 18.0, 18.0, 24.0, 45.0, 22.0, 68.0, 105.0, 267.0, 87.0, 46.0, 40.0, 29.0, 24.0, 32.0, 19.0, 28.0, 14.0, 9.0, 12.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-48.09375, -46.904541015625, -45.71533203125, -44.526123046875, -43.3369140625, -42.147705078125, -40.95849609375, -39.769287109375, -38.580078125, -37.390869140625, -36.20166015625, -35.012451171875, -33.8232421875, -32.634033203125, -31.44482421875, -30.255615234375, -29.06640625, -27.877197265625, -26.68798828125, -25.498779296875, -24.3095703125, -23.120361328125, -21.93115234375, -20.741943359375, -19.552734375, -18.363525390625, -17.17431640625, -15.985107421875, -14.7958984375, -13.606689453125, -12.41748046875, -11.228271484375, -10.0390625, -8.849853515625, -7.66064453125, -6.471435546875, -5.2822265625, -4.093017578125, -2.90380859375, -1.714599609375, -0.525390625, 0.663818359375, 1.85302734375, 3.042236328125, 4.2314453125, 5.420654296875, 6.60986328125, 7.799072265625, 8.98828125, 10.177490234375, 11.36669921875, 12.555908203125, 13.7451171875, 14.934326171875, 16.12353515625, 17.312744140625, 18.501953125, 19.691162109375, 20.88037109375, 22.069580078125, 23.2587890625, 24.447998046875, 25.63720703125, 26.826416015625, 28.015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 7.0, 6.0, 10.0, 9.0, 21.0, 35.0, 33.0, 61.0, 204.0, 632.0, 10571.0, 8372808.0, 3418.0, 407.0, 149.0, 59.0, 29.0, 21.0, 13.0, 17.0, 14.0, 18.0, 19.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-661.8748168945312, -638.5213012695312, -615.167724609375, -591.814208984375, -568.4606323242188, -545.1071166992188, -521.7535400390625, -498.4000244140625, -475.0464782714844, -451.69293212890625, -428.3393859863281, -404.98583984375, -381.63232421875, -358.27874755859375, -334.92523193359375, -311.5716857910156, -288.2181396484375, -264.8645935058594, -241.51104736328125, -218.1575164794922, -194.80397033691406, -171.45042419433594, -148.09689331054688, -124.74334716796875, -101.38980102539062, -78.0362548828125, -54.682716369628906, -31.329177856445312, -7.9756317138671875, 15.377914428710938, 38.7314453125, 62.084991455078125, 85.4385986328125, 108.79214477539062, 132.14569091796875, 155.4992218017578, 178.85276794433594, 202.20631408691406, 225.55984497070312, 248.91339111328125, 272.2669372558594, 295.6204833984375, 318.9740295410156, 342.32757568359375, 365.68109130859375, 389.03466796875, 412.38818359375, 435.7417297363281, 459.09527587890625, 482.4488220214844, 505.8023681640625, 529.1558837890625, 552.5094604492188, 575.8629760742188, 599.216552734375, 622.570068359375, 645.923583984375, 669.277099609375, 692.6306762695312, 715.9841918945312, 739.3377685546875, 762.6912841796875, 786.0447998046875, 809.3983764648438, 832.751953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 6.0, 7.0, 11.0, 6.0, 5.0, 5.0, 6.0, 9.0, 7.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-950.4044799804688, -926.173583984375, -901.942626953125, -877.7117309570312, -853.4808349609375, -829.2498779296875, -805.0189819335938, -780.7880859375, -756.55712890625, -732.3262329101562, -708.0952758789062, -683.8643798828125, -659.6334228515625, -635.4025268554688, -611.171630859375, -586.940673828125, -562.7097778320312, -538.4788818359375, -514.2479248046875, -490.01702880859375, -465.7861022949219, -441.55517578125, -417.32427978515625, -393.0933532714844, -368.8624267578125, -344.6315002441406, -320.40057373046875, -296.169677734375, -271.9387512207031, -247.70782470703125, -223.47691345214844, -199.24600219726562, -175.0150146484375, -150.78408813476562, -126.55317687988281, -102.32225799560547, -78.09133911132812, -53.86042022705078, -29.629501342773438, -5.398590087890625, 18.83233642578125, 43.063255310058594, 67.29417419433594, 91.52509307861328, 115.75601196289062, 139.9869384765625, 164.2178497314453, 188.44876098632812, 212.6796875, 236.91061401367188, 261.14154052734375, 285.3724365234375, 309.6033630371094, 333.83428955078125, 358.065185546875, 382.2961120605469, 406.52703857421875, 430.7579650878906, 454.9888916015625, 479.21978759765625, 503.4507141113281, 527.681640625, 551.9125366210938, 576.1434326171875, 600.3743896484375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 12.0, 14.0, 17.0, 18.0, 35.0, 42.0, 58.0, 82.0, 93.0, 138.0, 195.0, 324.0, 579.0, 995.0, 2204.0, 5244.0, 14364.0, 41410.0, 128561.0, 204361.0, 83145.0, 26322.0, 9231.0, 3492.0, 1463.0, 721.0, 405.0, 200.0, 121.0, 109.0, 67.0, 51.0, 41.0, 30.0, 20.0, 14.0, 15.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-241.625, -234.37109375, -227.1171875, -219.86328125, -212.609375, -205.35546875, -198.1015625, -190.84765625, -183.59375, -176.33984375, -169.0859375, -161.83203125, -154.578125, -147.32421875, -140.0703125, -132.81640625, -125.5625, -118.30859375, -111.0546875, -103.80078125, -96.546875, -89.29296875, -82.0390625, -74.78515625, -67.53125, -60.27734375, -53.0234375, -45.76953125, -38.515625, -31.26171875, -24.0078125, -16.75390625, -9.5, -2.24609375, 5.0078125, 12.26171875, 19.515625, 26.76953125, 34.0234375, 41.27734375, 48.53125, 55.78515625, 63.0390625, 70.29296875, 77.546875, 84.80078125, 92.0546875, 99.30859375, 106.5625, 113.81640625, 121.0703125, 128.32421875, 135.578125, 142.83203125, 150.0859375, 157.33984375, 164.59375, 171.84765625, 179.1015625, 186.35546875, 193.609375, 200.86328125, 208.1171875, 215.37109375, 222.625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 14.0, 21.0, 17.0, 32.0, 43.0, 36.0, 49.0, 74.0, 96.0, 91.0, 91.0, 89.0, 96.0, 70.0, 32.0, 38.0, 25.0, 19.0, 12.0, 9.0, 8.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.875, -55.96484375, -54.0546875, -52.14453125, -50.234375, -48.32421875, -46.4140625, -44.50390625, -42.59375, -40.68359375, -38.7734375, -36.86328125, -34.953125, -33.04296875, -31.1328125, -29.22265625, -27.3125, -25.40234375, -23.4921875, -21.58203125, -19.671875, -17.76171875, -15.8515625, -13.94140625, -12.03125, -10.12109375, -8.2109375, -6.30078125, -4.390625, -2.48046875, -0.5703125, 1.33984375, 3.25, 5.16015625, 7.0703125, 8.98046875, 10.890625, 12.80078125, 14.7109375, 16.62109375, 18.53125, 20.44140625, 22.3515625, 24.26171875, 26.171875, 28.08203125, 29.9921875, 31.90234375, 33.8125, 35.72265625, 37.6328125, 39.54296875, 41.453125, 43.36328125, 45.2734375, 47.18359375, 49.09375, 51.00390625, 52.9140625, 54.82421875, 56.734375, 58.64453125, 60.5546875, 62.46484375, 64.375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 12.0, 18.0, 53.0, 128.0, 117.0, 79.0, 21.0, 19.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.38316345214844, -130.05235290527344, -116.7215576171875, -103.3907470703125, -90.05994415283203, -76.72914123535156, -63.39833068847656, -50.067527770996094, -36.736724853515625, -23.405920028686523, -10.075115203857422, 3.2556915283203125, 16.58649444580078, 29.91729736328125, 43.24810791015625, 56.57891082763672, 69.90971374511719, 83.24051666259766, 96.57131958007812, 109.90213012695312, 123.2329330444336, 136.56373596191406, 149.89454650878906, 163.225341796875, 176.55615234375, 189.886962890625, 203.21775817871094, 216.54856872558594, 229.87936401367188, 243.21017456054688, 256.5409851074219, 269.8717956542969, 283.20257568359375, 296.53338623046875, 309.86419677734375, 323.19500732421875, 336.5257873535156, 349.8565979003906, 363.1874084472656, 376.5182189941406, 389.8489990234375, 403.1798095703125, 416.5106201171875, 429.8414306640625, 443.1722106933594, 456.5030212402344, 469.8338317871094, 483.1646423339844, 496.4954528808594, 509.8262634277344, 523.1570434570312, 536.4878540039062, 549.8186645507812, 563.1494750976562, 576.4802856445312, 589.8110961914062, 603.1419067382812, 616.4727172851562, 629.8035278320312, 643.1343383789062, 656.4651489257812, 669.7958984375, 683.126708984375, 696.45751953125, 709.788330078125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 4.0, 11.0, 8.0, 13.0, 26.0, 93.0, 106.0, 118.0, 43.0, 11.0, 15.0, 7.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-477.7574157714844, -465.9818115234375, -454.2061767578125, -442.4305419921875, -430.6549377441406, -418.87933349609375, -407.10369873046875, -395.32806396484375, -383.5524597167969, -371.77685546875, -360.001220703125, -348.2255859375, -336.4499816894531, -324.67437744140625, -312.89874267578125, -301.12310791015625, -289.3475036621094, -277.5718994140625, -265.7962646484375, -254.02064514160156, -242.24502563476562, -230.4694061279297, -218.69378662109375, -206.9181671142578, -195.14254760742188, -183.36692810058594, -171.59130859375, -159.81568908691406, -148.04006958007812, -136.2644500732422, -124.48883056640625, -112.71321105957031, -100.93759155273438, -89.16197204589844, -77.3863525390625, -65.61073303222656, -53.835113525390625, -42.05949401855469, -30.28387451171875, -18.508255004882812, -6.732635498046875, 5.0429840087890625, 16.818603515625, 28.594223022460938, 40.369842529296875, 52.14546203613281, 63.92108154296875, 75.69670104980469, 87.47232055664062, 99.24794006347656, 111.0235595703125, 122.79917907714844, 134.57479858398438, 146.3504180908203, 158.12603759765625, 169.9016571044922, 181.67727661132812, 193.45289611816406, 205.228515625, 217.00413513183594, 228.77975463867188, 240.5553741455078, 252.33099365234375, 264.10662841796875, 275.8822326660156]}, "eval/loss": 6.7275872230529785, "eval/wer": 1.4950096235887056, "eval/runtime": 1512.5692, "eval/samples_per_second": 1.747, "eval/steps_per_second": 0.437}