diff --git "a/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" "b/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" --- "a/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" +++ "b/wandb/run-20220302_094439-2kys49al/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 6.8859, "train/learning_rate": 2.4118223703558477e-05, "train/epoch": 0.7, "train/global_step": 2500, "_runtime": 11399, "_timestamp": 1646225678, "_step": 2504, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30425.0, 46.0, 11.0, 3.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7628.0, -7456.46875, -7284.9375, -7113.40625, -6941.875, -6770.34375, -6598.8125, -6427.28125, -6255.75, -6084.21875, -5912.6875, -5741.15625, -5569.625, -5398.09375, -5226.5625, -5055.03125, -4883.5, -4711.96875, -4540.4375, -4368.90625, -4197.375, -4025.84375, -3854.3125, -3682.78125, -3511.25, -3339.71875, -3168.1875, -2996.65625, -2825.125, -2653.59375, -2482.0625, -2310.53125, -2139.0, -1967.46875, -1795.9375, -1624.40625, -1452.875, -1281.34375, -1109.8125, -938.28125, -766.75, -595.21875, -423.6875, -252.15625, -80.625, 90.90625, 262.4375, 433.96875, 605.5, 777.03125, 948.5625, 1120.09375, 1291.625, 1463.15625, 1634.6875, 1806.21875, 1977.75, 2149.28125, 2320.8125, 2492.34375, 2663.875, 2835.40625, 3006.9375, 3178.46875, 3350.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 7.0, 7.0, 13.0, 17.0, 23.0, 22.0, 37.0, 46.0, 50.0, 67.0, 80.0, 99.0, 95.0, 100.0, 81.0, 53.0, 53.0, 34.0, 22.0, 23.0, 15.0, 16.0, 4.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1077.32373046875, -1034.0784912109375, -990.8333740234375, -947.588134765625, -904.343017578125, -861.0977783203125, -817.8526000976562, -774.607421875, -731.3622436523438, -688.1170654296875, -644.8718872070312, -601.626708984375, -558.3814697265625, -515.1363525390625, -471.89111328125, -428.64593505859375, -385.4007568359375, -342.15557861328125, -298.910400390625, -255.66519165039062, -212.42001342773438, -169.17483520507812, -125.92962646484375, -82.6844482421875, -39.43927001953125, 3.8059158325195312, 47.05110168457031, 90.29629516601562, 133.54147338867188, 176.78665161132812, 220.0318603515625, 263.27703857421875, 306.5220947265625, 349.76727294921875, 393.012451171875, 436.2576599121094, 479.5028381347656, 522.748046875, 565.9932250976562, 609.2384033203125, 652.4835815429688, 695.728759765625, 738.9739379882812, 782.2191162109375, 825.46435546875, 868.70947265625, 911.9547119140625, 955.1998901367188, 998.445068359375, 1041.6903076171875, 1084.9354248046875, 1128.1806640625, 1171.42578125, 1214.6710205078125, 1257.916259765625, 1301.161376953125, 1344.406494140625, 1387.6517333984375, 1430.8968505859375, 1474.14208984375, 1517.38720703125, 1560.6324462890625, 1603.877685546875, 1647.122802734375, 1690.3680419921875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 5.0, 6.0, 11.0, 11.0, 19.0, 18.0, 19.0, 33.0, 27.0, 32.0, 30.0, 31.0, 31.0, 36.0, 49.0, 35.0, 46.0, 40.0, 34.0, 39.0, 35.0, 41.0, 29.0, 34.0, 29.0, 29.0, 25.0, 22.0, 31.0, 28.0, 16.0, 12.0, 15.0, 12.0, 7.0, 10.0, 12.0, 5.0, 3.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-855.9072265625, -829.31494140625, -802.72265625, -776.1304321289062, -749.5381469726562, -722.9458618164062, -696.3536376953125, -669.7613525390625, -643.1690673828125, -616.5767822265625, -589.9844970703125, -563.3922729492188, -536.7999877929688, -510.20770263671875, -483.6154479980469, -457.023193359375, -430.430908203125, -403.838623046875, -377.2463684082031, -350.65411376953125, -324.06182861328125, -297.46954345703125, -270.8772888183594, -244.28501892089844, -217.6927490234375, -191.10047912597656, -164.50820922851562, -137.9159393310547, -111.32366943359375, -84.73139953613281, -58.139129638671875, -31.546859741210938, -4.95458984375, 21.637680053710938, 48.229949951171875, 74.82221984863281, 101.41448974609375, 128.0067596435547, 154.59902954101562, 181.19129943847656, 207.7835693359375, 234.37583923339844, 260.9681091308594, 287.56036376953125, 314.15264892578125, 340.74493408203125, 367.3371887207031, 393.929443359375, 420.521728515625, 447.114013671875, 473.7062683105469, 500.29852294921875, 526.8908081054688, 553.4830932617188, 580.0753173828125, 606.6676025390625, 633.2598876953125, 659.8521728515625, 686.4444580078125, 713.0366821289062, 739.6289672851562, 766.2212524414062, 792.8134765625, 819.40576171875, 845.998046875]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 17.0, 35.0, 40.0, 57.0, 73.0, 113.0, 149.0, 225.0, 366.0, 515.0, 699.0, 1108.0, 1549.0, 2512.0, 3669.0, 5638.0, 9091.0, 14324.0, 23443.0, 38825.0, 69347.0, 149928.0, 390341.0, 158445.0, 72173.0, 40618.0, 23936.0, 14670.0, 9204.0, 5940.0, 3737.0, 2637.0, 1628.0, 1107.0, 749.0, 503.0, 372.0, 238.0, 168.0, 107.0, 78.0, 46.0, 38.0, 25.0, 28.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2280.0, -2207.6875, -2135.375, -2063.0625, -1990.75, -1918.4375, -1846.125, -1773.8125, -1701.5, -1629.1875, -1556.875, -1484.5625, -1412.25, -1339.9375, -1267.625, -1195.3125, -1123.0, -1050.6875, -978.375, -906.0625, -833.75, -761.4375, -689.125, -616.8125, -544.5, -472.1875, -399.875, -327.5625, -255.25, -182.9375, -110.625, -38.3125, 34.0, 106.3125, 178.625, 250.9375, 323.25, 395.5625, 467.875, 540.1875, 612.5, 684.8125, 757.125, 829.4375, 901.75, 974.0625, 1046.375, 1118.6875, 1191.0, 1263.3125, 1335.625, 1407.9375, 1480.25, 1552.5625, 1624.875, 1697.1875, 1769.5, 1841.8125, 1914.125, 1986.4375, 2058.75, 2131.0625, 2203.375, 2275.6875, 2348.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 8.0, 8.0, 13.0, 16.0, 15.0, 20.0, 17.0, 25.0, 18.0, 24.0, 51.0, 62.0, 80.0, 126.0, 114.0, 76.0, 49.0, 46.0, 36.0, 26.0, 14.0, 23.0, 22.0, 18.0, 18.0, 9.0, 8.0, 5.0, 5.0, 6.0, 4.0, 3.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-834.0, -808.6875, -783.375, -758.0625, -732.75, -707.4375, -682.125, -656.8125, -631.5, -606.1875, -580.875, -555.5625, -530.25, -504.9375, -479.625, -454.3125, -429.0, -403.6875, -378.375, -353.0625, -327.75, -302.4375, -277.125, -251.8125, -226.5, -201.1875, -175.875, -150.5625, -125.25, -99.9375, -74.625, -49.3125, -24.0, 1.3125, 26.625, 51.9375, 77.25, 102.5625, 127.875, 153.1875, 178.5, 203.8125, 229.125, 254.4375, 279.75, 305.0625, 330.375, 355.6875, 381.0, 406.3125, 431.625, 456.9375, 482.25, 507.5625, 532.875, 558.1875, 583.5, 608.8125, 634.125, 659.4375, 684.75, 710.0625, 735.375, 760.6875, 786.0]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 1.0, 12.0, 7.0, 8.0, 9.0, 12.0, 19.0, 17.0, 18.0, 21.0, 27.0, 41.0, 36.0, 28.0, 55.0, 53.0, 44.0, 60.0, 52.0, 62.0, 61.0, 37.0, 45.0, 49.0, 39.0, 27.0, 27.0, 16.0, 12.0, 22.0, 15.0, 10.0, 13.0, 8.0, 5.0, 9.0, 2.0, 4.0, 7.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-462.0770568847656, -449.7961730957031, -437.5152893066406, -425.2344055175781, -412.9535217285156, -400.6726379394531, -388.3917541503906, -376.1108703613281, -363.8299865722656, -351.5491027832031, -339.2682189941406, -326.9873352050781, -314.7064514160156, -302.4255676269531, -290.1446838378906, -277.8638000488281, -265.5828857421875, -253.302001953125, -241.0211181640625, -228.740234375, -216.4593505859375, -204.178466796875, -191.8975830078125, -179.61669921875, -167.3358154296875, -155.054931640625, -142.7740478515625, -130.4931640625, -118.2122802734375, -105.931396484375, -93.65050506591797, -81.36962127685547, -69.0887451171875, -56.807861328125, -44.5269775390625, -32.246089935302734, -19.965206146240234, -7.684322357177734, 4.596565246582031, 16.87744903564453, 29.15833282470703, 41.43921661376953, 53.72010040283203, 66.00099182128906, 78.28187561035156, 90.56275939941406, 102.84364318847656, 115.12452697753906, 127.40541076660156, 139.68629455566406, 151.96717834472656, 164.24806213378906, 176.52894592285156, 188.80982971191406, 201.09072875976562, 213.37161254882812, 225.65249633789062, 237.93338012695312, 250.21426391601562, 262.4951477050781, 274.7760314941406, 287.0569152832031, 299.3377990722656, 311.6186828613281, 323.8995666503906]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 3.0, 8.0, 8.0, 6.0, 11.0, 17.0, 18.0, 25.0, 25.0, 27.0, 22.0, 15.0, 27.0, 25.0, 36.0, 42.0, 40.0, 41.0, 44.0, 36.0, 37.0, 37.0, 33.0, 37.0, 34.0, 24.0, 41.0, 17.0, 30.0, 28.0, 28.0, 26.0, 20.0, 17.0, 19.0, 11.0, 19.0, 7.0, 7.0, 9.0, 7.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-326.74267578125, -316.16741943359375, -305.5921325683594, -295.016845703125, -284.44158935546875, -273.8663330078125, -263.2910461425781, -252.7157745361328, -242.1405029296875, -231.5652313232422, -220.98995971679688, -210.41468811035156, -199.83941650390625, -189.26414489746094, -178.68887329101562, -168.1136016845703, -157.538330078125, -146.9630584716797, -136.38778686523438, -125.81251525878906, -115.23724365234375, -104.66197204589844, -94.08670043945312, -83.51142883300781, -72.9361572265625, -62.36088562011719, -51.785614013671875, -41.21034240722656, -30.63507080078125, -20.059799194335938, -9.484527587890625, 1.0907440185546875, 11.666015625, 22.241287231445312, 32.816558837890625, 43.39183044433594, 53.96710205078125, 64.54237365722656, 75.11764526367188, 85.69291687011719, 96.2681884765625, 106.84346008300781, 117.41873168945312, 127.99400329589844, 138.56927490234375, 149.14454650878906, 159.71981811523438, 170.2950897216797, 180.870361328125, 191.4456329345703, 202.02090454101562, 212.59617614746094, 223.17144775390625, 233.74671936035156, 244.32199096679688, 254.8972625732422, 265.4725341796875, 276.04779052734375, 286.6230773925781, 297.1983642578125, 307.77362060546875, 318.348876953125, 328.9241638183594, 339.49945068359375, 350.07470703125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 5.0, 21.0, 32.0, 50.0, 79.0, 108.0, 180.0, 276.0, 443.0, 648.0, 981.0, 1517.0, 2304.0, 3474.0, 5198.0, 7983.0, 12463.0, 19890.0, 31730.0, 52218.0, 89601.0, 163395.0, 398160.0, 1282804.0, 1325359.0, 404223.0, 160786.0, 88835.0, 52363.0, 32248.0, 20245.0, 12891.0, 8396.0, 5321.0, 3482.0, 2296.0, 1549.0, 982.0, 635.0, 412.0, 256.0, 158.0, 102.0, 72.0, 34.0, 30.0, 14.0, 8.0, 10.0, 3.0, 3.0, 7.0, 0.0, 0.0, 1.0, 2.0], "bins": [-393.75, -381.44921875, -369.1484375, -356.84765625, -344.546875, -332.24609375, -319.9453125, -307.64453125, -295.34375, -283.04296875, -270.7421875, -258.44140625, -246.140625, -233.83984375, -221.5390625, -209.23828125, -196.9375, -184.63671875, -172.3359375, -160.03515625, -147.734375, -135.43359375, -123.1328125, -110.83203125, -98.53125, -86.23046875, -73.9296875, -61.62890625, -49.328125, -37.02734375, -24.7265625, -12.42578125, -0.125, 12.17578125, 24.4765625, 36.77734375, 49.078125, 61.37890625, 73.6796875, 85.98046875, 98.28125, 110.58203125, 122.8828125, 135.18359375, 147.484375, 159.78515625, 172.0859375, 184.38671875, 196.6875, 208.98828125, 221.2890625, 233.58984375, 245.890625, 258.19140625, 270.4921875, 282.79296875, 295.09375, 307.39453125, 319.6953125, 331.99609375, 344.296875, 356.59765625, 368.8984375, 381.19921875, 393.5]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 0.0, 6.0, 2.0, 9.0, 6.0, 9.0, 11.0, 15.0, 17.0, 25.0, 21.0, 24.0, 16.0, 21.0, 28.0, 29.0, 27.0, 40.0, 36.0, 35.0, 47.0, 46.0, 35.0, 30.0, 31.0, 45.0, 37.0, 34.0, 35.0, 32.0, 31.0, 28.0, 29.0, 20.0, 23.0, 23.0, 17.0, 13.0, 13.0, 16.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-160.25, -154.7734375, -149.296875, -143.8203125, -138.34375, -132.8671875, -127.390625, -121.9140625, -116.4375, -110.9609375, -105.484375, -100.0078125, -94.53125, -89.0546875, -83.578125, -78.1015625, -72.625, -67.1484375, -61.671875, -56.1953125, -50.71875, -45.2421875, -39.765625, -34.2890625, -28.8125, -23.3359375, -17.859375, -12.3828125, -6.90625, -1.4296875, 4.046875, 9.5234375, 15.0, 20.4765625, 25.953125, 31.4296875, 36.90625, 42.3828125, 47.859375, 53.3359375, 58.8125, 64.2890625, 69.765625, 75.2421875, 80.71875, 86.1953125, 91.671875, 97.1484375, 102.625, 108.1015625, 113.578125, 119.0546875, 124.53125, 130.0078125, 135.484375, 140.9609375, 146.4375, 151.9140625, 157.390625, 162.8671875, 168.34375, 173.8203125, 179.296875, 184.7734375, 190.25]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 6.0, 12.0, 18.0, 37.0, 42.0, 53.0, 93.0, 117.0, 224.0, 365.0, 498.0, 820.0, 1155.0, 1981.0, 3204.0, 5356.0, 8935.0, 15954.0, 28432.0, 53780.0, 104720.0, 213775.0, 476560.0, 1291220.0, 1150515.0, 430857.0, 195809.0, 96740.0, 49823.0, 26583.0, 14810.0, 8606.0, 5097.0, 2977.0, 1828.0, 1166.0, 732.0, 461.0, 315.0, 174.0, 144.0, 94.0, 56.0, 44.0, 17.0, 19.0, 17.0, 14.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-318.0, -307.72265625, -297.4453125, -287.16796875, -276.890625, -266.61328125, -256.3359375, -246.05859375, -235.78125, -225.50390625, -215.2265625, -204.94921875, -194.671875, -184.39453125, -174.1171875, -163.83984375, -153.5625, -143.28515625, -133.0078125, -122.73046875, -112.453125, -102.17578125, -91.8984375, -81.62109375, -71.34375, -61.06640625, -50.7890625, -40.51171875, -30.234375, -19.95703125, -9.6796875, 0.59765625, 10.875, 21.15234375, 31.4296875, 41.70703125, 51.984375, 62.26171875, 72.5390625, 82.81640625, 93.09375, 103.37109375, 113.6484375, 123.92578125, 134.203125, 144.48046875, 154.7578125, 165.03515625, 175.3125, 185.58984375, 195.8671875, 206.14453125, 216.421875, 226.69921875, 236.9765625, 247.25390625, 257.53125, 267.80859375, 278.0859375, 288.36328125, 298.640625, 308.91796875, 319.1953125, 329.47265625, 339.75]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 8.0, 9.0, 16.0, 18.0, 15.0, 31.0, 43.0, 53.0, 59.0, 62.0, 82.0, 94.0, 143.0, 151.0, 150.0, 265.0, 294.0, 339.0, 390.0, 366.0, 283.0, 227.0, 177.0, 137.0, 144.0, 96.0, 86.0, 67.0, 53.0, 42.0, 44.0, 23.0, 17.0, 16.0, 14.0, 8.0, 8.0, 10.0, 7.0, 5.0, 3.0, 7.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-99.4375, -96.2822265625, -93.126953125, -89.9716796875, -86.81640625, -83.6611328125, -80.505859375, -77.3505859375, -74.1953125, -71.0400390625, -67.884765625, -64.7294921875, -61.57421875, -58.4189453125, -55.263671875, -52.1083984375, -48.953125, -45.7978515625, -42.642578125, -39.4873046875, -36.33203125, -33.1767578125, -30.021484375, -26.8662109375, -23.7109375, -20.5556640625, -17.400390625, -14.2451171875, -11.08984375, -7.9345703125, -4.779296875, -1.6240234375, 1.53125, 4.6865234375, 7.841796875, 10.9970703125, 14.15234375, 17.3076171875, 20.462890625, 23.6181640625, 26.7734375, 29.9287109375, 33.083984375, 36.2392578125, 39.39453125, 42.5498046875, 45.705078125, 48.8603515625, 52.015625, 55.1708984375, 58.326171875, 61.4814453125, 64.63671875, 67.7919921875, 70.947265625, 74.1025390625, 77.2578125, 80.4130859375, 83.568359375, 86.7236328125, 89.87890625, 93.0341796875, 96.189453125, 99.3447265625, 102.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 5.0, 12.0, 11.0, 16.0, 27.0, 25.0, 23.0, 29.0, 39.0, 51.0, 57.0, 64.0, 78.0, 79.0, 63.0, 66.0, 52.0, 50.0, 44.0, 37.0, 26.0, 29.0, 18.0, 12.0, 17.0, 10.0, 13.0, 6.0, 3.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-261.63311767578125, -253.87571716308594, -246.1183319091797, -238.36093139648438, -230.60354614257812, -222.8461456298828, -215.0887451171875, -207.33135986328125, -199.57395935058594, -191.81655883789062, -184.05917358398438, -176.30177307128906, -168.54437255859375, -160.7869873046875, -153.0295867919922, -145.27218627929688, -137.51480102539062, -129.7574005126953, -122.00001525878906, -114.24261474609375, -106.48522186279297, -98.72782897949219, -90.97042846679688, -83.2130355834961, -75.45564270019531, -67.69824981689453, -59.940853118896484, -52.18345642089844, -44.426063537597656, -36.668670654296875, -28.911273956298828, -21.15387725830078, -13.396484375, -5.639089584350586, 2.118305206298828, 9.875699996948242, 17.633094787597656, 25.390487670898438, 33.147884368896484, 40.90528106689453, 48.66267395019531, 56.420066833496094, 64.17745971679688, 71.93486022949219, 79.69225311279297, 87.44964599609375, 95.20704650878906, 102.96443939208984, 110.72183227539062, 118.4792251586914, 126.23661804199219, 133.9940185546875, 141.75140380859375, 149.50880432128906, 157.26620483398438, 165.02359008789062, 172.78099060058594, 180.53839111328125, 188.2957763671875, 196.0531768798828, 203.81057739257812, 211.56796264648438, 219.3253631591797, 227.082763671875, 234.84014892578125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 11.0, 11.0, 14.0, 13.0, 16.0, 16.0, 27.0, 24.0, 32.0, 26.0, 34.0, 37.0, 27.0, 39.0, 57.0, 50.0, 43.0, 47.0, 46.0, 38.0, 47.0, 42.0, 39.0, 30.0, 28.0, 32.0, 22.0, 22.0, 18.0, 18.0, 23.0, 9.0, 8.0, 12.0, 9.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-188.866455078125, -182.6168670654297, -176.36727905273438, -170.11769104003906, -163.86810302734375, -157.61851501464844, -151.36892700195312, -145.1193389892578, -138.8697509765625, -132.6201629638672, -126.37057495117188, -120.12098693847656, -113.87139892578125, -107.62181091308594, -101.37222290039062, -95.12263488769531, -88.87303924560547, -82.62345123291016, -76.37386322021484, -70.12427520751953, -63.87468719482422, -57.625099182128906, -51.37550735473633, -45.125919342041016, -38.8763313293457, -32.62674331665039, -26.377155303955078, -20.127565383911133, -13.87797737121582, -7.628389358520508, -1.3787994384765625, 4.87078857421875, 11.120376586914062, 17.369964599609375, 23.619552612304688, 29.869142532348633, 36.11872863769531, 42.368316650390625, 48.6179084777832, 54.867496490478516, 61.11708450317383, 67.3666763305664, 73.61626434326172, 79.86585235595703, 86.11544036865234, 92.36502838134766, 98.61461639404297, 104.86420440673828, 111.1137924194336, 117.3633804321289, 123.61296844482422, 129.86256408691406, 136.11215209960938, 142.3617401123047, 148.611328125, 154.8609161376953, 161.11050415039062, 167.36009216308594, 173.60968017578125, 179.85926818847656, 186.10885620117188, 192.3584442138672, 198.6080322265625, 204.8576202392578, 211.10720825195312]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 7.0, 7.0, 9.0, 14.0, 24.0, 28.0, 34.0, 61.0, 80.0, 107.0, 139.0, 195.0, 277.0, 380.0, 563.0, 736.0, 1042.0, 1461.0, 2077.0, 3014.0, 4270.0, 6498.0, 9937.0, 14975.0, 23011.0, 35898.0, 56673.0, 93572.0, 161052.0, 232941.0, 153864.0, 89663.0, 54929.0, 34867.0, 21924.0, 14337.0, 9398.0, 6361.0, 4261.0, 2914.0, 2052.0, 1373.0, 1002.0, 685.0, 523.0, 343.0, 281.0, 173.0, 148.0, 117.0, 69.0, 47.0, 53.0, 34.0, 20.0, 17.0, 11.0, 10.0, 5.0, 1.0, 5.0, 2.0], "bins": [-167.25, -161.93359375, -156.6171875, -151.30078125, -145.984375, -140.66796875, -135.3515625, -130.03515625, -124.71875, -119.40234375, -114.0859375, -108.76953125, -103.453125, -98.13671875, -92.8203125, -87.50390625, -82.1875, -76.87109375, -71.5546875, -66.23828125, -60.921875, -55.60546875, -50.2890625, -44.97265625, -39.65625, -34.33984375, -29.0234375, -23.70703125, -18.390625, -13.07421875, -7.7578125, -2.44140625, 2.875, 8.19140625, 13.5078125, 18.82421875, 24.140625, 29.45703125, 34.7734375, 40.08984375, 45.40625, 50.72265625, 56.0390625, 61.35546875, 66.671875, 71.98828125, 77.3046875, 82.62109375, 87.9375, 93.25390625, 98.5703125, 103.88671875, 109.203125, 114.51953125, 119.8359375, 125.15234375, 130.46875, 135.78515625, 141.1015625, 146.41796875, 151.734375, 157.05078125, 162.3671875, 167.68359375, 173.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 3.0, 8.0, 15.0, 11.0, 19.0, 11.0, 15.0, 24.0, 33.0, 27.0, 36.0, 26.0, 35.0, 41.0, 35.0, 54.0, 51.0, 42.0, 39.0, 51.0, 48.0, 44.0, 31.0, 59.0, 24.0, 26.0, 23.0, 27.0, 23.0, 23.0, 15.0, 12.0, 9.0, 12.0, 11.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-153.875, -148.556640625, -143.23828125, -137.919921875, -132.6015625, -127.283203125, -121.96484375, -116.646484375, -111.328125, -106.009765625, -100.69140625, -95.373046875, -90.0546875, -84.736328125, -79.41796875, -74.099609375, -68.78125, -63.462890625, -58.14453125, -52.826171875, -47.5078125, -42.189453125, -36.87109375, -31.552734375, -26.234375, -20.916015625, -15.59765625, -10.279296875, -4.9609375, 0.357421875, 5.67578125, 10.994140625, 16.3125, 21.630859375, 26.94921875, 32.267578125, 37.5859375, 42.904296875, 48.22265625, 53.541015625, 58.859375, 64.177734375, 69.49609375, 74.814453125, 80.1328125, 85.451171875, 90.76953125, 96.087890625, 101.40625, 106.724609375, 112.04296875, 117.361328125, 122.6796875, 127.998046875, 133.31640625, 138.634765625, 143.953125, 149.271484375, 154.58984375, 159.908203125, 165.2265625, 170.544921875, 175.86328125, 181.181640625, 186.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 6.0, 13.0, 30.0, 38.0, 50.0, 81.0, 117.0, 191.0, 319.0, 526.0, 826.0, 1203.0, 2049.0, 3384.0, 5621.0, 9575.0, 16308.0, 29987.0, 62333.0, 175772.0, 450963.0, 162078.0, 59228.0, 29119.0, 15927.0, 8979.0, 5473.0, 3167.0, 1914.0, 1193.0, 752.0, 455.0, 305.0, 214.0, 140.0, 74.0, 52.0, 23.0, 20.0, 14.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-132.875, -128.65234375, -124.4296875, -120.20703125, -115.984375, -111.76171875, -107.5390625, -103.31640625, -99.09375, -94.87109375, -90.6484375, -86.42578125, -82.203125, -77.98046875, -73.7578125, -69.53515625, -65.3125, -61.08984375, -56.8671875, -52.64453125, -48.421875, -44.19921875, -39.9765625, -35.75390625, -31.53125, -27.30859375, -23.0859375, -18.86328125, -14.640625, -10.41796875, -6.1953125, -1.97265625, 2.25, 6.47265625, 10.6953125, 14.91796875, 19.140625, 23.36328125, 27.5859375, 31.80859375, 36.03125, 40.25390625, 44.4765625, 48.69921875, 52.921875, 57.14453125, 61.3671875, 65.58984375, 69.8125, 74.03515625, 78.2578125, 82.48046875, 86.703125, 90.92578125, 95.1484375, 99.37109375, 103.59375, 107.81640625, 112.0390625, 116.26171875, 120.484375, 124.70703125, 128.9296875, 133.15234375, 137.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 6.0, 8.0, 8.0, 13.0, 15.0, 15.0, 15.0, 22.0, 27.0, 22.0, 22.0, 30.0, 31.0, 39.0, 38.0, 44.0, 30.0, 41.0, 43.0, 36.0, 43.0, 27.0, 37.0, 42.0, 29.0, 35.0, 20.0, 40.0, 29.0, 38.0, 24.0, 18.0, 24.0, 11.0, 14.0, 10.0, 12.0, 12.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.8125, -93.6025390625, -90.392578125, -87.1826171875, -83.97265625, -80.7626953125, -77.552734375, -74.3427734375, -71.1328125, -67.9228515625, -64.712890625, -61.5029296875, -58.29296875, -55.0830078125, -51.873046875, -48.6630859375, -45.453125, -42.2431640625, -39.033203125, -35.8232421875, -32.61328125, -29.4033203125, -26.193359375, -22.9833984375, -19.7734375, -16.5634765625, -13.353515625, -10.1435546875, -6.93359375, -3.7236328125, -0.513671875, 2.6962890625, 5.90625, 9.1162109375, 12.326171875, 15.5361328125, 18.74609375, 21.9560546875, 25.166015625, 28.3759765625, 31.5859375, 34.7958984375, 38.005859375, 41.2158203125, 44.42578125, 47.6357421875, 50.845703125, 54.0556640625, 57.265625, 60.4755859375, 63.685546875, 66.8955078125, 70.10546875, 73.3154296875, 76.525390625, 79.7353515625, 82.9453125, 86.1552734375, 89.365234375, 92.5751953125, 95.78515625, 98.9951171875, 102.205078125, 105.4150390625, 108.625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 2.0, 8.0, 10.0, 16.0, 15.0, 22.0, 29.0, 40.0, 67.0, 75.0, 103.0, 142.0, 214.0, 279.0, 398.0, 572.0, 895.0, 1245.0, 2014.0, 3256.0, 5757.0, 10775.0, 23090.0, 61288.0, 315979.0, 488202.0, 77944.0, 27114.0, 12412.0, 6191.0, 3678.0, 2145.0, 1395.0, 966.0, 682.0, 468.0, 293.0, 198.0, 160.0, 102.0, 82.0, 66.0, 50.0, 30.0, 24.0, 18.0, 7.0, 9.0, 5.0, 7.0, 3.0, 3.0, 0.0, 5.0, 0.0, 2.0, 1.0, 3.0], "bins": [-30.625, -29.64013671875, -28.6552734375, -27.67041015625, -26.685546875, -25.70068359375, -24.7158203125, -23.73095703125, -22.74609375, -21.76123046875, -20.7763671875, -19.79150390625, -18.806640625, -17.82177734375, -16.8369140625, -15.85205078125, -14.8671875, -13.88232421875, -12.8974609375, -11.91259765625, -10.927734375, -9.94287109375, -8.9580078125, -7.97314453125, -6.98828125, -6.00341796875, -5.0185546875, -4.03369140625, -3.048828125, -2.06396484375, -1.0791015625, -0.09423828125, 0.890625, 1.87548828125, 2.8603515625, 3.84521484375, 4.830078125, 5.81494140625, 6.7998046875, 7.78466796875, 8.76953125, 9.75439453125, 10.7392578125, 11.72412109375, 12.708984375, 13.69384765625, 14.6787109375, 15.66357421875, 16.6484375, 17.63330078125, 18.6181640625, 19.60302734375, 20.587890625, 21.57275390625, 22.5576171875, 23.54248046875, 24.52734375, 25.51220703125, 26.4970703125, 27.48193359375, 28.466796875, 29.45166015625, 30.4365234375, 31.42138671875, 32.40625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 1.0, 5.0, 5.0, 10.0, 14.0, 15.0, 21.0, 20.0, 26.0, 35.0, 26.0, 26.0, 49.0, 53.0, 69.0, 62.0, 55.0, 43.0, 62.0, 54.0, 53.0, 47.0, 49.0, 40.0, 33.0, 30.0, 18.0, 8.0, 12.0, 9.0, 7.0, 8.0, 10.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003173828125, -0.00305938720703125, -0.0029449462890625, -0.00283050537109375, -0.002716064453125, -0.00260162353515625, -0.0024871826171875, -0.00237274169921875, -0.00225830078125, -0.00214385986328125, -0.0020294189453125, -0.00191497802734375, -0.001800537109375, -0.00168609619140625, -0.0015716552734375, -0.00145721435546875, -0.0013427734375, -0.00122833251953125, -0.0011138916015625, -0.00099945068359375, -0.000885009765625, -0.00077056884765625, -0.0006561279296875, -0.00054168701171875, -0.00042724609375, -0.00031280517578125, -0.0001983642578125, -8.392333984375e-05, 3.0517578125e-05, 0.00014495849609375, 0.0002593994140625, 0.00037384033203125, 0.00048828125, 0.00060272216796875, 0.0007171630859375, 0.00083160400390625, 0.000946044921875, 0.00106048583984375, 0.0011749267578125, 0.00128936767578125, 0.00140380859375, 0.00151824951171875, 0.0016326904296875, 0.00174713134765625, 0.001861572265625, 0.00197601318359375, 0.0020904541015625, 0.00220489501953125, 0.0023193359375, 0.00243377685546875, 0.0025482177734375, 0.00266265869140625, 0.002777099609375, 0.00289154052734375, 0.0030059814453125, 0.00312042236328125, 0.00323486328125, 0.00334930419921875, 0.0034637451171875, 0.00357818603515625, 0.003692626953125, 0.00380706787109375, 0.0039215087890625, 0.00403594970703125, 0.004150390625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 5.0, 10.0, 20.0, 41.0, 38.0, 54.0, 76.0, 132.0, 171.0, 255.0, 382.0, 611.0, 856.0, 1407.0, 2246.0, 4040.0, 7282.0, 15613.0, 40548.0, 146376.0, 567224.0, 178193.0, 46711.0, 17285.0, 7908.0, 4212.0, 2454.0, 1526.0, 966.0, 657.0, 395.0, 266.0, 186.0, 136.0, 83.0, 48.0, 41.0, 30.0, 22.0, 12.0, 11.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.75, -66.638671875, -64.52734375, -62.416015625, -60.3046875, -58.193359375, -56.08203125, -53.970703125, -51.859375, -49.748046875, -47.63671875, -45.525390625, -43.4140625, -41.302734375, -39.19140625, -37.080078125, -34.96875, -32.857421875, -30.74609375, -28.634765625, -26.5234375, -24.412109375, -22.30078125, -20.189453125, -18.078125, -15.966796875, -13.85546875, -11.744140625, -9.6328125, -7.521484375, -5.41015625, -3.298828125, -1.1875, 0.923828125, 3.03515625, 5.146484375, 7.2578125, 9.369140625, 11.48046875, 13.591796875, 15.703125, 17.814453125, 19.92578125, 22.037109375, 24.1484375, 26.259765625, 28.37109375, 30.482421875, 32.59375, 34.705078125, 36.81640625, 38.927734375, 41.0390625, 43.150390625, 45.26171875, 47.373046875, 49.484375, 51.595703125, 53.70703125, 55.818359375, 57.9296875, 60.041015625, 62.15234375, 64.263671875, 66.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 5.0, 9.0, 3.0, 4.0, 8.0, 12.0, 15.0, 13.0, 32.0, 37.0, 65.0, 75.0, 99.0, 182.0, 117.0, 86.0, 59.0, 40.0, 30.0, 29.0, 23.0, 11.0, 9.0, 7.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.125, -16.59814453125, -16.0712890625, -15.54443359375, -15.017578125, -14.49072265625, -13.9638671875, -13.43701171875, -12.91015625, -12.38330078125, -11.8564453125, -11.32958984375, -10.802734375, -10.27587890625, -9.7490234375, -9.22216796875, -8.6953125, -8.16845703125, -7.6416015625, -7.11474609375, -6.587890625, -6.06103515625, -5.5341796875, -5.00732421875, -4.48046875, -3.95361328125, -3.4267578125, -2.89990234375, -2.373046875, -1.84619140625, -1.3193359375, -0.79248046875, -0.265625, 0.26123046875, 0.7880859375, 1.31494140625, 1.841796875, 2.36865234375, 2.8955078125, 3.42236328125, 3.94921875, 4.47607421875, 5.0029296875, 5.52978515625, 6.056640625, 6.58349609375, 7.1103515625, 7.63720703125, 8.1640625, 8.69091796875, 9.2177734375, 9.74462890625, 10.271484375, 10.79833984375, 11.3251953125, 11.85205078125, 12.37890625, 12.90576171875, 13.4326171875, 13.95947265625, 14.486328125, 15.01318359375, 15.5400390625, 16.06689453125, 16.59375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 7.0, 20.0, 18.0, 15.0, 23.0, 36.0, 42.0, 39.0, 52.0, 75.0, 73.0, 78.0, 73.0, 67.0, 64.0, 65.0, 51.0, 37.0, 34.0, 26.0, 18.0, 9.0, 14.0, 11.0, 13.0, 5.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-190.5220947265625, -183.56692504882812, -176.6117401123047, -169.65655517578125, -162.70138549804688, -155.7462158203125, -148.79103088378906, -141.83584594726562, -134.88067626953125, -127.92549896240234, -120.97032165527344, -114.01514434814453, -107.05996704101562, -100.10478973388672, -93.14961242675781, -86.1944351196289, -79.2392578125, -72.2840805053711, -65.32890319824219, -58.37372589111328, -51.418548583984375, -44.46337127685547, -37.50819396972656, -30.553016662597656, -23.59783935546875, -16.642662048339844, -9.687484741210938, -2.7323074340820312, 4.222869873046875, 11.178047180175781, 18.133224487304688, 25.088401794433594, 32.0435791015625, 38.998756408691406, 45.95393371582031, 52.90911102294922, 59.864288330078125, 66.81946563720703, 73.77464294433594, 80.72982025146484, 87.68499755859375, 94.64017486572266, 101.59535217285156, 108.55052947998047, 115.50570678710938, 122.46088409423828, 129.4160614013672, 136.37124633789062, 143.326416015625, 150.28158569335938, 157.2367706298828, 164.19195556640625, 171.14712524414062, 178.102294921875, 185.05747985839844, 192.01266479492188, 198.96783447265625, 205.92300415039062, 212.87818908691406, 219.8333740234375, 226.78854370117188, 233.74371337890625, 240.6988983154297, 247.65408325195312, 254.6092529296875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 10.0, 11.0, 2.0, 13.0, 14.0, 9.0, 17.0, 18.0, 19.0, 36.0, 28.0, 34.0, 26.0, 32.0, 37.0, 39.0, 52.0, 34.0, 58.0, 53.0, 42.0, 37.0, 49.0, 38.0, 41.0, 35.0, 18.0, 33.0, 20.0, 19.0, 23.0, 23.0, 16.0, 15.0, 9.0, 10.0, 8.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-146.6458740234375, -141.6204833984375, -136.59507751464844, -131.56968688964844, -126.5442886352539, -121.51889038085938, -116.49349975585938, -111.46810150146484, -106.44270324707031, -101.41730499267578, -96.39190673828125, -91.36651611328125, -86.34111785888672, -81.31571960449219, -76.29032897949219, -71.26493072509766, -66.23953247070312, -61.214134216308594, -56.18873977661133, -51.16334533691406, -46.13794708251953, -41.112548828125, -36.087154388427734, -31.06175994873047, -26.036361694335938, -21.01096534729004, -15.98556900024414, -10.960172653198242, -5.934776306152344, -0.9093799591064453, 4.116016387939453, 9.141410827636719, 14.16680908203125, 19.19220542907715, 24.217601776123047, 29.242998123168945, 34.268394470214844, 39.293792724609375, 44.31918716430664, 49.344581604003906, 54.36997985839844, 59.39537811279297, 64.4207763671875, 69.4461669921875, 74.47156524658203, 79.49696350097656, 84.52235412597656, 89.5477523803711, 94.57315063476562, 99.59854888916016, 104.62394714355469, 109.64933776855469, 114.67473602294922, 119.70013427734375, 124.72552490234375, 129.75091552734375, 134.7763214111328, 139.8017120361328, 144.82711791992188, 149.85250854492188, 154.87789916992188, 159.90330505371094, 164.92869567871094, 169.9541015625, 174.9794921875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 9.0, 10.0, 28.0, 30.0, 53.0, 67.0, 87.0, 154.0, 218.0, 369.0, 571.0, 889.0, 1573.0, 2673.0, 4712.0, 8687.0, 15938.0, 30526.0, 61301.0, 126800.0, 241025.0, 260893.0, 145912.0, 70423.0, 35236.0, 18067.0, 9415.0, 5382.0, 2912.0, 1802.0, 1037.0, 611.0, 390.0, 266.0, 159.0, 92.0, 79.0, 44.0, 31.0, 28.0, 16.0, 8.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-327.0, -315.76171875, -304.5234375, -293.28515625, -282.046875, -270.80859375, -259.5703125, -248.33203125, -237.09375, -225.85546875, -214.6171875, -203.37890625, -192.140625, -180.90234375, -169.6640625, -158.42578125, -147.1875, -135.94921875, -124.7109375, -113.47265625, -102.234375, -90.99609375, -79.7578125, -68.51953125, -57.28125, -46.04296875, -34.8046875, -23.56640625, -12.328125, -1.08984375, 10.1484375, 21.38671875, 32.625, 43.86328125, 55.1015625, 66.33984375, 77.578125, 88.81640625, 100.0546875, 111.29296875, 122.53125, 133.76953125, 145.0078125, 156.24609375, 167.484375, 178.72265625, 189.9609375, 201.19921875, 212.4375, 223.67578125, 234.9140625, 246.15234375, 257.390625, 268.62890625, 279.8671875, 291.10546875, 302.34375, 313.58203125, 324.8203125, 336.05859375, 347.296875, 358.53515625, 369.7734375, 381.01171875, 392.25]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 8.0, 7.0, 6.0, 11.0, 17.0, 10.0, 19.0, 20.0, 23.0, 19.0, 27.0, 23.0, 45.0, 37.0, 36.0, 41.0, 33.0, 53.0, 45.0, 46.0, 43.0, 50.0, 47.0, 36.0, 36.0, 33.0, 26.0, 22.0, 26.0, 24.0, 31.0, 17.0, 13.0, 17.0, 8.0, 8.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-103.625, -100.0556640625, -96.486328125, -92.9169921875, -89.34765625, -85.7783203125, -82.208984375, -78.6396484375, -75.0703125, -71.5009765625, -67.931640625, -64.3623046875, -60.79296875, -57.2236328125, -53.654296875, -50.0849609375, -46.515625, -42.9462890625, -39.376953125, -35.8076171875, -32.23828125, -28.6689453125, -25.099609375, -21.5302734375, -17.9609375, -14.3916015625, -10.822265625, -7.2529296875, -3.68359375, -0.1142578125, 3.455078125, 7.0244140625, 10.59375, 14.1630859375, 17.732421875, 21.3017578125, 24.87109375, 28.4404296875, 32.009765625, 35.5791015625, 39.1484375, 42.7177734375, 46.287109375, 49.8564453125, 53.42578125, 56.9951171875, 60.564453125, 64.1337890625, 67.703125, 71.2724609375, 74.841796875, 78.4111328125, 81.98046875, 85.5498046875, 89.119140625, 92.6884765625, 96.2578125, 99.8271484375, 103.396484375, 106.9658203125, 110.53515625, 114.1044921875, 117.673828125, 121.2431640625, 124.8125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 5.0, 7.0, 8.0, 6.0, 8.0, 24.0, 31.0, 33.0, 54.0, 108.0, 157.0, 210.0, 347.0, 509.0, 811.0, 1302.0, 2147.0, 3554.0, 5772.0, 9571.0, 16015.0, 27479.0, 46471.0, 77917.0, 128343.0, 188350.0, 194849.0, 136844.0, 84166.0, 50176.0, 29397.0, 17248.0, 10414.0, 6148.0, 3808.0, 2195.0, 1429.0, 929.0, 593.0, 349.0, 271.0, 155.0, 111.0, 83.0, 54.0, 25.0, 28.0, 21.0, 11.0, 6.0, 6.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-201.75, -194.810546875, -187.87109375, -180.931640625, -173.9921875, -167.052734375, -160.11328125, -153.173828125, -146.234375, -139.294921875, -132.35546875, -125.416015625, -118.4765625, -111.537109375, -104.59765625, -97.658203125, -90.71875, -83.779296875, -76.83984375, -69.900390625, -62.9609375, -56.021484375, -49.08203125, -42.142578125, -35.203125, -28.263671875, -21.32421875, -14.384765625, -7.4453125, -0.505859375, 6.43359375, 13.373046875, 20.3125, 27.251953125, 34.19140625, 41.130859375, 48.0703125, 55.009765625, 61.94921875, 68.888671875, 75.828125, 82.767578125, 89.70703125, 96.646484375, 103.5859375, 110.525390625, 117.46484375, 124.404296875, 131.34375, 138.283203125, 145.22265625, 152.162109375, 159.1015625, 166.041015625, 172.98046875, 179.919921875, 186.859375, 193.798828125, 200.73828125, 207.677734375, 214.6171875, 221.556640625, 228.49609375, 235.435546875, 242.375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 8.0, 5.0, 6.0, 9.0, 10.0, 11.0, 13.0, 17.0, 14.0, 17.0, 25.0, 27.0, 36.0, 32.0, 37.0, 35.0, 37.0, 29.0, 39.0, 39.0, 50.0, 40.0, 43.0, 27.0, 32.0, 37.0, 21.0, 28.0, 29.0, 27.0, 24.0, 31.0, 27.0, 18.0, 19.0, 16.0, 15.0, 11.0, 17.0, 7.0, 9.0, 7.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.6875, -71.3642578125, -69.041015625, -66.7177734375, -64.39453125, -62.0712890625, -59.748046875, -57.4248046875, -55.1015625, -52.7783203125, -50.455078125, -48.1318359375, -45.80859375, -43.4853515625, -41.162109375, -38.8388671875, -36.515625, -34.1923828125, -31.869140625, -29.5458984375, -27.22265625, -24.8994140625, -22.576171875, -20.2529296875, -17.9296875, -15.6064453125, -13.283203125, -10.9599609375, -8.63671875, -6.3134765625, -3.990234375, -1.6669921875, 0.65625, 2.9794921875, 5.302734375, 7.6259765625, 9.94921875, 12.2724609375, 14.595703125, 16.9189453125, 19.2421875, 21.5654296875, 23.888671875, 26.2119140625, 28.53515625, 30.8583984375, 33.181640625, 35.5048828125, 37.828125, 40.1513671875, 42.474609375, 44.7978515625, 47.12109375, 49.4443359375, 51.767578125, 54.0908203125, 56.4140625, 58.7373046875, 61.060546875, 63.3837890625, 65.70703125, 68.0302734375, 70.353515625, 72.6767578125, 75.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 8.0, 18.0, 17.0, 24.0, 55.0, 70.0, 80.0, 109.0, 149.0, 197.0, 233.0, 348.0, 510.0, 631.0, 889.0, 1359.0, 1850.0, 2810.0, 4466.0, 7420.0, 14245.0, 36086.0, 147451.0, 634781.0, 127615.0, 33133.0, 13473.0, 7156.0, 4256.0, 2692.0, 1773.0, 1211.0, 942.0, 670.0, 453.0, 354.0, 264.0, 204.0, 149.0, 110.0, 74.0, 52.0, 36.0, 25.0, 25.0, 17.0, 16.0, 6.0, 10.0, 6.0, 6.0, 3.0, 1.0, 1.0], "bins": [-375.25, -364.03515625, -352.8203125, -341.60546875, -330.390625, -319.17578125, -307.9609375, -296.74609375, -285.53125, -274.31640625, -263.1015625, -251.88671875, -240.671875, -229.45703125, -218.2421875, -207.02734375, -195.8125, -184.59765625, -173.3828125, -162.16796875, -150.953125, -139.73828125, -128.5234375, -117.30859375, -106.09375, -94.87890625, -83.6640625, -72.44921875, -61.234375, -50.01953125, -38.8046875, -27.58984375, -16.375, -5.16015625, 6.0546875, 17.26953125, 28.484375, 39.69921875, 50.9140625, 62.12890625, 73.34375, 84.55859375, 95.7734375, 106.98828125, 118.203125, 129.41796875, 140.6328125, 151.84765625, 163.0625, 174.27734375, 185.4921875, 196.70703125, 207.921875, 219.13671875, 230.3515625, 241.56640625, 252.78125, 263.99609375, 275.2109375, 286.42578125, 297.640625, 308.85546875, 320.0703125, 331.28515625, 342.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 9.0, 18.0, 9.0, 24.0, 35.0, 40.0, 75.0, 116.0, 150.0, 145.0, 96.0, 88.0, 59.0, 39.0, 22.0, 21.0, 13.0, 14.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01947021484375, -0.01894664764404297, -0.018423080444335938, -0.017899513244628906, -0.017375946044921875, -0.016852378845214844, -0.016328811645507812, -0.01580524444580078, -0.01528167724609375, -0.014758110046386719, -0.014234542846679688, -0.013710975646972656, -0.013187408447265625, -0.012663841247558594, -0.012140274047851562, -0.011616706848144531, -0.0110931396484375, -0.010569572448730469, -0.010046005249023438, -0.009522438049316406, -0.008998870849609375, -0.008475303649902344, -0.007951736450195312, -0.007428169250488281, -0.00690460205078125, -0.006381034851074219, -0.0058574676513671875, -0.005333900451660156, -0.004810333251953125, -0.004286766052246094, -0.0037631988525390625, -0.0032396316528320312, -0.002716064453125, -0.0021924972534179688, -0.0016689300537109375, -0.0011453628540039062, -0.000621795654296875, -9.822845458984375e-05, 0.0004253387451171875, 0.0009489059448242188, 0.00147247314453125, 0.0019960403442382812, 0.0025196075439453125, 0.0030431747436523438, 0.003566741943359375, 0.004090309143066406, 0.0046138763427734375, 0.005137443542480469, 0.0056610107421875, 0.006184577941894531, 0.0067081451416015625, 0.007231712341308594, 0.007755279541015625, 0.008278846740722656, 0.008802413940429688, 0.009325981140136719, 0.00984954833984375, 0.010373115539550781, 0.010896682739257812, 0.011420249938964844, 0.011943817138671875, 0.012467384338378906, 0.012990951538085938, 0.013514518737792969, 0.0140380859375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 4.0, 8.0, 9.0, 15.0, 15.0, 29.0, 24.0, 23.0, 50.0, 53.0, 92.0, 100.0, 114.0, 176.0, 222.0, 325.0, 485.0, 651.0, 1013.0, 1591.0, 2538.0, 4386.0, 9152.0, 26454.0, 181782.0, 716208.0, 70301.0, 16199.0, 6665.0, 3520.0, 2078.0, 1298.0, 893.0, 571.0, 384.0, 308.0, 206.0, 153.0, 112.0, 87.0, 55.0, 40.0, 42.0, 44.0, 20.0, 19.0, 13.0, 12.0, 5.0, 2.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-390.75, -376.94140625, -363.1328125, -349.32421875, -335.515625, -321.70703125, -307.8984375, -294.08984375, -280.28125, -266.47265625, -252.6640625, -238.85546875, -225.046875, -211.23828125, -197.4296875, -183.62109375, -169.8125, -156.00390625, -142.1953125, -128.38671875, -114.578125, -100.76953125, -86.9609375, -73.15234375, -59.34375, -45.53515625, -31.7265625, -17.91796875, -4.109375, 9.69921875, 23.5078125, 37.31640625, 51.125, 64.93359375, 78.7421875, 92.55078125, 106.359375, 120.16796875, 133.9765625, 147.78515625, 161.59375, 175.40234375, 189.2109375, 203.01953125, 216.828125, 230.63671875, 244.4453125, 258.25390625, 272.0625, 285.87109375, 299.6796875, 313.48828125, 327.296875, 341.10546875, 354.9140625, 368.72265625, 382.53125, 396.33984375, 410.1484375, 423.95703125, 437.765625, 451.57421875, 465.3828125, 479.19140625, 493.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 10.0, 13.0, 26.0, 41.0, 99.0, 194.0, 221.0, 159.0, 86.0, 45.0, 27.0, 11.0, 4.0, 9.0, 8.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.0, -116.892578125, -112.78515625, -108.677734375, -104.5703125, -100.462890625, -96.35546875, -92.248046875, -88.140625, -84.033203125, -79.92578125, -75.818359375, -71.7109375, -67.603515625, -63.49609375, -59.388671875, -55.28125, -51.173828125, -47.06640625, -42.958984375, -38.8515625, -34.744140625, -30.63671875, -26.529296875, -22.421875, -18.314453125, -14.20703125, -10.099609375, -5.9921875, -1.884765625, 2.22265625, 6.330078125, 10.4375, 14.544921875, 18.65234375, 22.759765625, 26.8671875, 30.974609375, 35.08203125, 39.189453125, 43.296875, 47.404296875, 51.51171875, 55.619140625, 59.7265625, 63.833984375, 67.94140625, 72.048828125, 76.15625, 80.263671875, 84.37109375, 88.478515625, 92.5859375, 96.693359375, 100.80078125, 104.908203125, 109.015625, 113.123046875, 117.23046875, 121.337890625, 125.4453125, 129.552734375, 133.66015625, 137.767578125, 141.875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 9.0, 16.0, 15.0, 25.0, 29.0, 36.0, 44.0, 56.0, 61.0, 69.0, 86.0, 97.0, 59.0, 51.0, 53.0, 52.0, 49.0, 24.0, 28.0, 25.0, 22.0, 15.0, 19.0, 8.0, 7.0, 7.0, 9.0, 3.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-181.39321899414062, -175.23069763183594, -169.06817626953125, -162.90565490722656, -156.74313354492188, -150.5806121826172, -144.4180908203125, -138.25555419921875, -132.09304809570312, -125.93052673339844, -119.76800537109375, -113.60548400878906, -107.44296264648438, -101.28044128417969, -95.11791229248047, -88.95539093017578, -82.79286193847656, -76.63034057617188, -70.46781921386719, -64.3052978515625, -58.14277267456055, -51.98025131225586, -45.817726135253906, -39.65520477294922, -33.49268341064453, -27.330162048339844, -21.167638778686523, -15.005115509033203, -8.842594146728516, -2.680072784423828, 3.482452392578125, 9.644973754882812, 15.8074951171875, 21.970016479492188, 28.132539749145508, 34.29506301879883, 40.457584381103516, 46.6201057434082, 52.782630920410156, 58.945152282714844, 65.10767364501953, 71.27019500732422, 77.4327163696289, 83.59524536132812, 89.75776672363281, 95.9202880859375, 102.08280944824219, 108.24533081054688, 114.40785217285156, 120.57037353515625, 126.73289489746094, 132.89541625976562, 139.0579376220703, 145.220458984375, 151.38299560546875, 157.54550170898438, 163.70803833007812, 169.8705596923828, 176.0330810546875, 182.1956024169922, 188.35812377929688, 194.52064514160156, 200.68316650390625, 206.845703125, 213.00820922851562]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 6.0, 8.0, 16.0, 9.0, 24.0, 26.0, 23.0, 26.0, 30.0, 34.0, 23.0, 33.0, 33.0, 51.0, 40.0, 38.0, 38.0, 54.0, 37.0, 38.0, 41.0, 39.0, 45.0, 49.0, 36.0, 25.0, 21.0, 19.0, 25.0, 21.0, 12.0, 13.0, 5.0, 9.0, 7.0, 7.0, 4.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-131.53257751464844, -127.18876647949219, -122.84495544433594, -118.50114440917969, -114.15733337402344, -109.81352233886719, -105.46971130371094, -101.12590026855469, -96.78208923339844, -92.43827819824219, -88.09446716308594, -83.75065612792969, -79.40684509277344, -75.06303405761719, -70.71922302246094, -66.37541198730469, -62.031593322753906, -57.687782287597656, -53.343971252441406, -49.000160217285156, -44.656349182128906, -40.312538146972656, -35.96872329711914, -31.62491226196289, -27.28110122680664, -22.93729019165039, -18.59347915649414, -14.249666213989258, -9.905855178833008, -5.562044143676758, -1.218231201171875, 3.125579833984375, 7.469390869140625, 11.813201904296875, 16.157012939453125, 20.500825881958008, 24.844636917114258, 29.188447952270508, 33.53226089477539, 37.87607192993164, 42.21988296508789, 46.56369400024414, 50.90750503540039, 55.251319885253906, 59.595130920410156, 63.938941955566406, 68.28275299072266, 72.6265640258789, 76.97037506103516, 81.3141860961914, 85.65799713134766, 90.0018081665039, 94.34561920166016, 98.6894302368164, 103.03324890136719, 107.37705993652344, 111.72087097167969, 116.06468200683594, 120.40849304199219, 124.75230407714844, 129.0961151123047, 133.43992614746094, 137.7837371826172, 142.12754821777344, 146.4713592529297]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 17.0, 17.0, 19.0, 44.0, 58.0, 86.0, 134.0, 203.0, 250.0, 471.0, 767.0, 1190.0, 1911.0, 3071.0, 4995.0, 8386.0, 14256.0, 24448.0, 42944.0, 79990.0, 158742.0, 367002.0, 1206544.0, 1435054.0, 449101.0, 182633.0, 90580.0, 49375.0, 28376.0, 16910.0, 10159.0, 6058.0, 3929.0, 2370.0, 1490.0, 953.0, 668.0, 388.0, 243.0, 159.0, 102.0, 50.0, 46.0, 21.0, 22.0, 16.0, 11.0, 8.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-169.25, -163.626953125, -158.00390625, -152.380859375, -146.7578125, -141.134765625, -135.51171875, -129.888671875, -124.265625, -118.642578125, -113.01953125, -107.396484375, -101.7734375, -96.150390625, -90.52734375, -84.904296875, -79.28125, -73.658203125, -68.03515625, -62.412109375, -56.7890625, -51.166015625, -45.54296875, -39.919921875, -34.296875, -28.673828125, -23.05078125, -17.427734375, -11.8046875, -6.181640625, -0.55859375, 5.064453125, 10.6875, 16.310546875, 21.93359375, 27.556640625, 33.1796875, 38.802734375, 44.42578125, 50.048828125, 55.671875, 61.294921875, 66.91796875, 72.541015625, 78.1640625, 83.787109375, 89.41015625, 95.033203125, 100.65625, 106.279296875, 111.90234375, 117.525390625, 123.1484375, 128.771484375, 134.39453125, 140.017578125, 145.640625, 151.263671875, 156.88671875, 162.509765625, 168.1328125, 173.755859375, 179.37890625, 185.001953125, 190.625]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 8.0, 10.0, 17.0, 12.0, 23.0, 22.0, 31.0, 18.0, 35.0, 30.0, 33.0, 29.0, 37.0, 48.0, 32.0, 38.0, 48.0, 38.0, 54.0, 47.0, 38.0, 50.0, 39.0, 31.0, 30.0, 24.0, 22.0, 21.0, 21.0, 15.0, 15.0, 7.0, 16.0, 6.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.46875, -59.31103515625, -57.1533203125, -54.99560546875, -52.837890625, -50.68017578125, -48.5224609375, -46.36474609375, -44.20703125, -42.04931640625, -39.8916015625, -37.73388671875, -35.576171875, -33.41845703125, -31.2607421875, -29.10302734375, -26.9453125, -24.78759765625, -22.6298828125, -20.47216796875, -18.314453125, -16.15673828125, -13.9990234375, -11.84130859375, -9.68359375, -7.52587890625, -5.3681640625, -3.21044921875, -1.052734375, 1.10498046875, 3.2626953125, 5.42041015625, 7.578125, 9.73583984375, 11.8935546875, 14.05126953125, 16.208984375, 18.36669921875, 20.5244140625, 22.68212890625, 24.83984375, 26.99755859375, 29.1552734375, 31.31298828125, 33.470703125, 35.62841796875, 37.7861328125, 39.94384765625, 42.1015625, 44.25927734375, 46.4169921875, 48.57470703125, 50.732421875, 52.89013671875, 55.0478515625, 57.20556640625, 59.36328125, 61.52099609375, 63.6787109375, 65.83642578125, 67.994140625, 70.15185546875, 72.3095703125, 74.46728515625, 76.625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 10.0, 10.0, 19.0, 31.0, 56.0, 80.0, 122.0, 179.0, 298.0, 482.0, 835.0, 1360.0, 2155.0, 3702.0, 6449.0, 11525.0, 20777.0, 38762.0, 75061.0, 153790.0, 341563.0, 858665.0, 1512003.0, 640100.0, 267476.0, 124939.0, 61247.0, 32215.0, 17247.0, 9650.0, 5529.0, 3130.0, 1814.0, 1137.0, 667.0, 465.0, 254.0, 182.0, 111.0, 89.0, 34.0, 25.0, 17.0, 2.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-161.875, -157.021484375, -152.16796875, -147.314453125, -142.4609375, -137.607421875, -132.75390625, -127.900390625, -123.046875, -118.193359375, -113.33984375, -108.486328125, -103.6328125, -98.779296875, -93.92578125, -89.072265625, -84.21875, -79.365234375, -74.51171875, -69.658203125, -64.8046875, -59.951171875, -55.09765625, -50.244140625, -45.390625, -40.537109375, -35.68359375, -30.830078125, -25.9765625, -21.123046875, -16.26953125, -11.416015625, -6.5625, -1.708984375, 3.14453125, 7.998046875, 12.8515625, 17.705078125, 22.55859375, 27.412109375, 32.265625, 37.119140625, 41.97265625, 46.826171875, 51.6796875, 56.533203125, 61.38671875, 66.240234375, 71.09375, 75.947265625, 80.80078125, 85.654296875, 90.5078125, 95.361328125, 100.21484375, 105.068359375, 109.921875, 114.775390625, 119.62890625, 124.482421875, 129.3359375, 134.189453125, 139.04296875, 143.896484375, 148.75]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 11.0, 10.0, 10.0, 18.0, 41.0, 39.0, 52.0, 55.0, 57.0, 90.0, 86.0, 97.0, 118.0, 141.0, 178.0, 206.0, 276.0, 317.0, 336.0, 324.0, 292.0, 225.0, 209.0, 173.0, 135.0, 114.0, 98.0, 68.0, 61.0, 53.0, 39.0, 30.0, 22.0, 17.0, 13.0, 8.0, 11.0, 9.0, 6.0, 6.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.5625, -38.26953125, -36.9765625, -35.68359375, -34.390625, -33.09765625, -31.8046875, -30.51171875, -29.21875, -27.92578125, -26.6328125, -25.33984375, -24.046875, -22.75390625, -21.4609375, -20.16796875, -18.875, -17.58203125, -16.2890625, -14.99609375, -13.703125, -12.41015625, -11.1171875, -9.82421875, -8.53125, -7.23828125, -5.9453125, -4.65234375, -3.359375, -2.06640625, -0.7734375, 0.51953125, 1.8125, 3.10546875, 4.3984375, 5.69140625, 6.984375, 8.27734375, 9.5703125, 10.86328125, 12.15625, 13.44921875, 14.7421875, 16.03515625, 17.328125, 18.62109375, 19.9140625, 21.20703125, 22.5, 23.79296875, 25.0859375, 26.37890625, 27.671875, 28.96484375, 30.2578125, 31.55078125, 32.84375, 34.13671875, 35.4296875, 36.72265625, 38.015625, 39.30859375, 40.6015625, 41.89453125, 43.1875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 7.0, 9.0, 11.0, 7.0, 15.0, 20.0, 14.0, 40.0, 32.0, 53.0, 46.0, 62.0, 60.0, 78.0, 82.0, 83.0, 70.0, 48.0, 47.0, 33.0, 28.0, 33.0, 26.0, 19.0, 20.0, 8.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-108.0521011352539, -104.62984466552734, -101.20758819580078, -97.78532409667969, -94.36306762695312, -90.94081115722656, -87.5185546875, -84.09629821777344, -80.67404174804688, -77.25178527832031, -73.82952880859375, -70.40727233886719, -66.9850082397461, -63.56275177001953, -60.14049530029297, -56.718238830566406, -53.29597473144531, -49.87371826171875, -46.45145797729492, -43.02920150756836, -39.60694122314453, -36.18468475341797, -32.762428283691406, -29.34016990661621, -25.917911529541016, -22.49565315246582, -19.073394775390625, -15.651138305664062, -12.228879928588867, -8.806621551513672, -5.384365081787109, -1.962106704711914, 1.46014404296875, 4.882401943206787, 8.304659843444824, 11.726917266845703, 15.149175643920898, 18.571434020996094, 21.993690490722656, 25.41594886779785, 28.838207244873047, 32.26046371459961, 35.68272399902344, 39.10498046875, 42.52723693847656, 45.94949722290039, 49.37175369262695, 52.79401397705078, 56.216270446777344, 59.638526916503906, 63.060787200927734, 66.48304748535156, 69.90530395507812, 73.32756042480469, 76.74981689453125, 80.17207336425781, 83.59432983398438, 87.01658630371094, 90.4388427734375, 93.86109924316406, 97.28336334228516, 100.70561981201172, 104.12787628173828, 107.55013275146484, 110.97239685058594]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 11.0, 13.0, 12.0, 11.0, 14.0, 20.0, 23.0, 22.0, 29.0, 28.0, 22.0, 31.0, 35.0, 47.0, 38.0, 38.0, 51.0, 41.0, 48.0, 51.0, 41.0, 46.0, 29.0, 49.0, 33.0, 22.0, 25.0, 20.0, 28.0, 19.0, 20.0, 11.0, 11.0, 10.0, 9.0, 8.0, 4.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-87.44540405273438, -84.80017852783203, -82.15494537353516, -79.50971984863281, -76.86448669433594, -74.2192611694336, -71.57402801513672, -68.92880249023438, -66.2835693359375, -63.63833999633789, -60.99311065673828, -58.34788131713867, -55.70265197753906, -53.05742645263672, -50.41219711303711, -47.7669677734375, -45.121742248535156, -42.47651290893555, -39.83128356933594, -37.18605422973633, -34.54082489013672, -31.895597457885742, -29.250370025634766, -26.605140686035156, -23.959911346435547, -21.314682006835938, -18.669452667236328, -16.02422523498535, -13.378995895385742, -10.733766555786133, -8.08853816986084, -5.443309783935547, -2.7980880737304688, -0.15285921096801758, 2.4923696517944336, 5.137598514556885, 7.782827377319336, 10.428056716918945, 13.073285102844238, 15.718513488769531, 18.36374282836914, 21.00897216796875, 23.65420150756836, 26.299428939819336, 28.944658279418945, 31.589887619018555, 34.23511505126953, 36.88034439086914, 39.52557373046875, 42.17080307006836, 44.81603240966797, 47.46126174926758, 50.10649108886719, 52.75171661376953, 55.39694595336914, 58.04217529296875, 60.68740463256836, 63.33263397216797, 65.97785949707031, 68.62309265136719, 71.26831817626953, 73.9135513305664, 76.55877685546875, 79.20401000976562, 81.84923553466797]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 7.0, 11.0, 13.0, 30.0, 55.0, 55.0, 87.0, 86.0, 158.0, 237.0, 299.0, 479.0, 751.0, 1038.0, 1586.0, 2519.0, 3823.0, 6133.0, 10108.0, 16709.0, 28727.0, 49279.0, 89735.0, 179222.0, 300607.0, 161093.0, 82194.0, 45656.0, 26418.0, 15706.0, 9464.0, 5628.0, 3646.0, 2409.0, 1471.0, 964.0, 670.0, 476.0, 300.0, 185.0, 150.0, 100.0, 90.0, 61.0, 38.0, 21.0, 21.0, 8.0, 6.0, 5.0, 7.0, 6.0, 4.0, 0.0, 2.0, 1.0], "bins": [-85.125, -82.5, -79.875, -77.25, -74.625, -72.0, -69.375, -66.75, -64.125, -61.5, -58.875, -56.25, -53.625, -51.0, -48.375, -45.75, -43.125, -40.5, -37.875, -35.25, -32.625, -30.0, -27.375, -24.75, -22.125, -19.5, -16.875, -14.25, -11.625, -9.0, -6.375, -3.75, -1.125, 1.5, 4.125, 6.75, 9.375, 12.0, 14.625, 17.25, 19.875, 22.5, 25.125, 27.75, 30.375, 33.0, 35.625, 38.25, 40.875, 43.5, 46.125, 48.75, 51.375, 54.0, 56.625, 59.25, 61.875, 64.5, 67.125, 69.75, 72.375, 75.0, 77.625, 80.25, 82.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 2.0, 13.0, 4.0, 14.0, 20.0, 19.0, 19.0, 18.0, 25.0, 28.0, 22.0, 33.0, 34.0, 49.0, 36.0, 32.0, 44.0, 42.0, 48.0, 44.0, 42.0, 40.0, 47.0, 31.0, 35.0, 34.0, 34.0, 26.0, 18.0, 25.0, 22.0, 19.0, 11.0, 14.0, 8.0, 9.0, 10.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.8125, -70.4326171875, -68.052734375, -65.6728515625, -63.29296875, -60.9130859375, -58.533203125, -56.1533203125, -53.7734375, -51.3935546875, -49.013671875, -46.6337890625, -44.25390625, -41.8740234375, -39.494140625, -37.1142578125, -34.734375, -32.3544921875, -29.974609375, -27.5947265625, -25.21484375, -22.8349609375, -20.455078125, -18.0751953125, -15.6953125, -13.3154296875, -10.935546875, -8.5556640625, -6.17578125, -3.7958984375, -1.416015625, 0.9638671875, 3.34375, 5.7236328125, 8.103515625, 10.4833984375, 12.86328125, 15.2431640625, 17.623046875, 20.0029296875, 22.3828125, 24.7626953125, 27.142578125, 29.5224609375, 31.90234375, 34.2822265625, 36.662109375, 39.0419921875, 41.421875, 43.8017578125, 46.181640625, 48.5615234375, 50.94140625, 53.3212890625, 55.701171875, 58.0810546875, 60.4609375, 62.8408203125, 65.220703125, 67.6005859375, 69.98046875, 72.3603515625, 74.740234375, 77.1201171875, 79.5]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 11.0, 23.0, 30.0, 46.0, 57.0, 99.0, 132.0, 203.0, 310.0, 529.0, 906.0, 1370.0, 2191.0, 3795.0, 6259.0, 10634.0, 19055.0, 38001.0, 87618.0, 293781.0, 382217.0, 106030.0, 44004.0, 21655.0, 11827.0, 7103.0, 4079.0, 2586.0, 1531.0, 911.0, 585.0, 361.0, 206.0, 122.0, 94.0, 58.0, 41.0, 33.0, 23.0, 12.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.6875, -63.5751953125, -61.462890625, -59.3505859375, -57.23828125, -55.1259765625, -53.013671875, -50.9013671875, -48.7890625, -46.6767578125, -44.564453125, -42.4521484375, -40.33984375, -38.2275390625, -36.115234375, -34.0029296875, -31.890625, -29.7783203125, -27.666015625, -25.5537109375, -23.44140625, -21.3291015625, -19.216796875, -17.1044921875, -14.9921875, -12.8798828125, -10.767578125, -8.6552734375, -6.54296875, -4.4306640625, -2.318359375, -0.2060546875, 1.90625, 4.0185546875, 6.130859375, 8.2431640625, 10.35546875, 12.4677734375, 14.580078125, 16.6923828125, 18.8046875, 20.9169921875, 23.029296875, 25.1416015625, 27.25390625, 29.3662109375, 31.478515625, 33.5908203125, 35.703125, 37.8154296875, 39.927734375, 42.0400390625, 44.15234375, 46.2646484375, 48.376953125, 50.4892578125, 52.6015625, 54.7138671875, 56.826171875, 58.9384765625, 61.05078125, 63.1630859375, 65.275390625, 67.3876953125, 69.5]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 8.0, 8.0, 19.0, 18.0, 19.0, 29.0, 22.0, 24.0, 31.0, 34.0, 37.0, 22.0, 31.0, 51.0, 35.0, 34.0, 37.0, 35.0, 50.0, 35.0, 36.0, 43.0, 39.0, 31.0, 37.0, 34.0, 28.0, 21.0, 25.0, 18.0, 15.0, 18.0, 11.0, 8.0, 9.0, 4.0, 9.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-56.84375, -55.267578125, -53.69140625, -52.115234375, -50.5390625, -48.962890625, -47.38671875, -45.810546875, -44.234375, -42.658203125, -41.08203125, -39.505859375, -37.9296875, -36.353515625, -34.77734375, -33.201171875, -31.625, -30.048828125, -28.47265625, -26.896484375, -25.3203125, -23.744140625, -22.16796875, -20.591796875, -19.015625, -17.439453125, -15.86328125, -14.287109375, -12.7109375, -11.134765625, -9.55859375, -7.982421875, -6.40625, -4.830078125, -3.25390625, -1.677734375, -0.1015625, 1.474609375, 3.05078125, 4.626953125, 6.203125, 7.779296875, 9.35546875, 10.931640625, 12.5078125, 14.083984375, 15.66015625, 17.236328125, 18.8125, 20.388671875, 21.96484375, 23.541015625, 25.1171875, 26.693359375, 28.26953125, 29.845703125, 31.421875, 32.998046875, 34.57421875, 36.150390625, 37.7265625, 39.302734375, 40.87890625, 42.455078125, 44.03125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 7.0, 10.0, 9.0, 21.0, 26.0, 37.0, 68.0, 75.0, 103.0, 175.0, 209.0, 294.0, 409.0, 643.0, 945.0, 1408.0, 2273.0, 3724.0, 6401.0, 11852.0, 24430.0, 60147.0, 216357.0, 518266.0, 119076.0, 40846.0, 17945.0, 8999.0, 5134.0, 3003.0, 1804.0, 1177.0, 808.0, 540.0, 381.0, 241.0, 198.0, 131.0, 109.0, 73.0, 56.0, 35.0, 20.0, 21.0, 25.0, 8.0, 3.0, 3.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-17.265625, -16.7470703125, -16.228515625, -15.7099609375, -15.19140625, -14.6728515625, -14.154296875, -13.6357421875, -13.1171875, -12.5986328125, -12.080078125, -11.5615234375, -11.04296875, -10.5244140625, -10.005859375, -9.4873046875, -8.96875, -8.4501953125, -7.931640625, -7.4130859375, -6.89453125, -6.3759765625, -5.857421875, -5.3388671875, -4.8203125, -4.3017578125, -3.783203125, -3.2646484375, -2.74609375, -2.2275390625, -1.708984375, -1.1904296875, -0.671875, -0.1533203125, 0.365234375, 0.8837890625, 1.40234375, 1.9208984375, 2.439453125, 2.9580078125, 3.4765625, 3.9951171875, 4.513671875, 5.0322265625, 5.55078125, 6.0693359375, 6.587890625, 7.1064453125, 7.625, 8.1435546875, 8.662109375, 9.1806640625, 9.69921875, 10.2177734375, 10.736328125, 11.2548828125, 11.7734375, 12.2919921875, 12.810546875, 13.3291015625, 13.84765625, 14.3662109375, 14.884765625, 15.4033203125, 15.921875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 15.0, 13.0, 18.0, 22.0, 28.0, 22.0, 43.0, 53.0, 66.0, 92.0, 95.0, 91.0, 74.0, 94.0, 77.0, 31.0, 41.0, 34.0, 22.0, 9.0, 15.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003124237060546875, -0.0030086636543273926, -0.00289309024810791, -0.0027775168418884277, -0.0026619434356689453, -0.002546370029449463, -0.0024307966232299805, -0.002315223217010498, -0.0021996498107910156, -0.002084076404571533, -0.0019685029983520508, -0.0018529295921325684, -0.001737356185913086, -0.0016217827796936035, -0.001506209373474121, -0.0013906359672546387, -0.0012750625610351562, -0.0011594891548156738, -0.0010439157485961914, -0.000928342342376709, -0.0008127689361572266, -0.0006971955299377441, -0.0005816221237182617, -0.0004660487174987793, -0.0003504753112792969, -0.00023490190505981445, -0.00011932849884033203, -3.7550926208496094e-06, 0.00011181831359863281, 0.00022739171981811523, 0.00034296512603759766, 0.0004585385322570801, 0.0005741119384765625, 0.0006896853446960449, 0.0008052587509155273, 0.0009208321571350098, 0.0010364055633544922, 0.0011519789695739746, 0.001267552375793457, 0.0013831257820129395, 0.0014986991882324219, 0.0016142725944519043, 0.0017298460006713867, 0.0018454194068908691, 0.0019609928131103516, 0.002076566219329834, 0.0021921396255493164, 0.002307713031768799, 0.0024232864379882812, 0.0025388598442077637, 0.002654433250427246, 0.0027700066566467285, 0.002885580062866211, 0.0030011534690856934, 0.0031167268753051758, 0.003232300281524658, 0.0033478736877441406, 0.003463447093963623, 0.0035790205001831055, 0.003694593906402588, 0.0038101673126220703, 0.003925740718841553, 0.004041314125061035, 0.004156887531280518, 0.0042724609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 6.0, 14.0, 12.0, 30.0, 36.0, 45.0, 56.0, 115.0, 152.0, 218.0, 380.0, 556.0, 874.0, 1368.0, 2133.0, 3300.0, 5308.0, 8652.0, 15024.0, 26300.0, 48754.0, 97835.0, 225377.0, 324696.0, 139073.0, 65837.0, 34348.0, 19102.0, 11048.0, 6620.0, 4133.0, 2557.0, 1570.0, 967.0, 686.0, 440.0, 282.0, 219.0, 132.0, 98.0, 70.0, 39.0, 18.0, 20.0, 8.0, 10.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.8125, -20.18603515625, -19.5595703125, -18.93310546875, -18.306640625, -17.68017578125, -17.0537109375, -16.42724609375, -15.80078125, -15.17431640625, -14.5478515625, -13.92138671875, -13.294921875, -12.66845703125, -12.0419921875, -11.41552734375, -10.7890625, -10.16259765625, -9.5361328125, -8.90966796875, -8.283203125, -7.65673828125, -7.0302734375, -6.40380859375, -5.77734375, -5.15087890625, -4.5244140625, -3.89794921875, -3.271484375, -2.64501953125, -2.0185546875, -1.39208984375, -0.765625, -0.13916015625, 0.4873046875, 1.11376953125, 1.740234375, 2.36669921875, 2.9931640625, 3.61962890625, 4.24609375, 4.87255859375, 5.4990234375, 6.12548828125, 6.751953125, 7.37841796875, 8.0048828125, 8.63134765625, 9.2578125, 9.88427734375, 10.5107421875, 11.13720703125, 11.763671875, 12.39013671875, 13.0166015625, 13.64306640625, 14.26953125, 14.89599609375, 15.5224609375, 16.14892578125, 16.775390625, 17.40185546875, 18.0283203125, 18.65478515625, 19.28125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 4.0, 4.0, 5.0, 5.0, 11.0, 11.0, 13.0, 19.0, 18.0, 19.0, 20.0, 20.0, 28.0, 30.0, 32.0, 45.0, 32.0, 47.0, 48.0, 41.0, 52.0, 53.0, 34.0, 52.0, 49.0, 33.0, 23.0, 30.0, 25.0, 20.0, 31.0, 13.0, 16.0, 15.0, 18.0, 12.0, 7.0, 7.0, 10.0, 8.0, 5.0, 7.0, 3.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-3.986328125, -3.87152099609375, -3.7567138671875, -3.64190673828125, -3.527099609375, -3.41229248046875, -3.2974853515625, -3.18267822265625, -3.06787109375, -2.95306396484375, -2.8382568359375, -2.72344970703125, -2.608642578125, -2.49383544921875, -2.3790283203125, -2.26422119140625, -2.1494140625, -2.03460693359375, -1.9197998046875, -1.80499267578125, -1.690185546875, -1.57537841796875, -1.4605712890625, -1.34576416015625, -1.23095703125, -1.11614990234375, -1.0013427734375, -0.88653564453125, -0.771728515625, -0.65692138671875, -0.5421142578125, -0.42730712890625, -0.3125, -0.19769287109375, -0.0828857421875, 0.03192138671875, 0.146728515625, 0.26153564453125, 0.3763427734375, 0.49114990234375, 0.60595703125, 0.72076416015625, 0.8355712890625, 0.95037841796875, 1.065185546875, 1.17999267578125, 1.2947998046875, 1.40960693359375, 1.5244140625, 1.63922119140625, 1.7540283203125, 1.86883544921875, 1.983642578125, 2.09844970703125, 2.2132568359375, 2.32806396484375, 2.44287109375, 2.55767822265625, 2.6724853515625, 2.78729248046875, 2.902099609375, 3.01690673828125, 3.1317138671875, 3.24652099609375, 3.361328125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 16.0, 22.0, 11.0, 31.0, 29.0, 37.0, 46.0, 58.0, 76.0, 84.0, 95.0, 88.0, 83.0, 55.0, 49.0, 40.0, 22.0, 28.0, 23.0, 11.0, 11.0, 14.0, 5.0, 9.0, 5.0, 5.0, 7.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-114.72274017333984, -111.24276733398438, -107.76278686523438, -104.2828140258789, -100.8028335571289, -97.32286071777344, -93.84288024902344, -90.36290740966797, -86.8829345703125, -83.40296173095703, -79.92298126220703, -76.44300842285156, -72.96302795410156, -69.4830551147461, -66.00308227539062, -62.523101806640625, -59.043121337890625, -55.56314468383789, -52.083168029785156, -48.60319519042969, -45.12321472167969, -41.64324188232422, -38.163265228271484, -34.68328857421875, -31.203311920166016, -27.72333526611328, -24.243358612060547, -20.763383865356445, -17.28340721130371, -13.803430557250977, -10.323455810546875, -6.843479156494141, -3.3635101318359375, 0.11646604537963867, 3.596442222595215, 7.076417922973633, 10.556394577026367, 14.036371231079102, 17.516345977783203, 20.996322631835938, 24.476299285888672, 27.956275939941406, 31.43625259399414, 34.916229248046875, 38.396202087402344, 41.876182556152344, 45.35615539550781, 48.83613204956055, 52.31610870361328, 55.796085357666016, 59.27606201171875, 62.75603485107422, 66.23601531982422, 69.71598815917969, 73.19596862792969, 76.67594146728516, 80.15591430664062, 83.6358871459961, 87.1158676147461, 90.59584045410156, 94.07582092285156, 97.55579376220703, 101.0357666015625, 104.5157470703125, 107.9957275390625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 4.0, 10.0, 5.0, 13.0, 11.0, 16.0, 18.0, 17.0, 24.0, 23.0, 27.0, 31.0, 28.0, 31.0, 37.0, 41.0, 31.0, 64.0, 38.0, 39.0, 36.0, 57.0, 52.0, 34.0, 38.0, 28.0, 40.0, 24.0, 26.0, 23.0, 27.0, 23.0, 12.0, 11.0, 16.0, 3.0, 12.0, 6.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.50582122802734, -68.2693099975586, -66.03279113769531, -63.79627990722656, -61.55976867675781, -59.3232536315918, -57.08673858642578, -54.85022735595703, -52.613712310791016, -50.377197265625, -48.14068603515625, -45.904170989990234, -43.66765594482422, -41.43114471435547, -39.19462966918945, -36.95811462402344, -34.72160339355469, -32.48508834838867, -30.248577117919922, -28.012062072753906, -25.775548934936523, -23.53903579711914, -21.302520751953125, -19.066007614135742, -16.82949447631836, -14.592981338500977, -12.356467247009277, -10.119953155517578, -7.883440017700195, -5.6469268798828125, -3.4104127883911133, -1.173898696899414, 1.0626144409179688, 3.2991280555725098, 5.535641670227051, 7.772155284881592, 10.008668899536133, 12.245182037353516, 14.481696128845215, 16.718210220336914, 18.954723358154297, 21.19123649597168, 23.427749633789062, 25.664264678955078, 27.90077781677246, 30.137290954589844, 32.37380599975586, 34.610321044921875, 36.846832275390625, 39.08334732055664, 41.31985855102539, 43.556373596191406, 45.792884826660156, 48.02939987182617, 50.26591491699219, 52.50242614746094, 54.73894119262695, 56.97545623779297, 59.21196746826172, 61.448482513427734, 63.68499755859375, 65.9215087890625, 68.15802001953125, 70.39453887939453, 72.63105010986328]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 34.0, 31.0, 64.0, 79.0, 103.0, 211.0, 332.0, 487.0, 814.0, 1373.0, 2328.0, 3639.0, 5738.0, 9310.0, 15156.0, 24442.0, 39114.0, 63513.0, 101232.0, 161741.0, 203802.0, 156061.0, 98170.0, 60862.0, 38169.0, 23597.0, 14452.0, 9036.0, 5475.0, 3504.0, 2172.0, 1288.0, 872.0, 512.0, 318.0, 176.0, 117.0, 74.0, 66.0, 28.0, 24.0, 12.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.125, -123.208984375, -119.29296875, -115.376953125, -111.4609375, -107.544921875, -103.62890625, -99.712890625, -95.796875, -91.880859375, -87.96484375, -84.048828125, -80.1328125, -76.216796875, -72.30078125, -68.384765625, -64.46875, -60.552734375, -56.63671875, -52.720703125, -48.8046875, -44.888671875, -40.97265625, -37.056640625, -33.140625, -29.224609375, -25.30859375, -21.392578125, -17.4765625, -13.560546875, -9.64453125, -5.728515625, -1.8125, 2.103515625, 6.01953125, 9.935546875, 13.8515625, 17.767578125, 21.68359375, 25.599609375, 29.515625, 33.431640625, 37.34765625, 41.263671875, 45.1796875, 49.095703125, 53.01171875, 56.927734375, 60.84375, 64.759765625, 68.67578125, 72.591796875, 76.5078125, 80.423828125, 84.33984375, 88.255859375, 92.171875, 96.087890625, 100.00390625, 103.919921875, 107.8359375, 111.751953125, 115.66796875, 119.583984375, 123.5]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 9.0, 13.0, 7.0, 7.0, 11.0, 9.0, 14.0, 24.0, 15.0, 19.0, 25.0, 22.0, 29.0, 25.0, 40.0, 42.0, 29.0, 44.0, 33.0, 47.0, 36.0, 45.0, 37.0, 38.0, 39.0, 28.0, 25.0, 31.0, 37.0, 29.0, 26.0, 23.0, 15.0, 28.0, 13.0, 14.0, 10.0, 13.0, 9.0, 5.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-53.8125, -52.0517578125, -50.291015625, -48.5302734375, -46.76953125, -45.0087890625, -43.248046875, -41.4873046875, -39.7265625, -37.9658203125, -36.205078125, -34.4443359375, -32.68359375, -30.9228515625, -29.162109375, -27.4013671875, -25.640625, -23.8798828125, -22.119140625, -20.3583984375, -18.59765625, -16.8369140625, -15.076171875, -13.3154296875, -11.5546875, -9.7939453125, -8.033203125, -6.2724609375, -4.51171875, -2.7509765625, -0.990234375, 0.7705078125, 2.53125, 4.2919921875, 6.052734375, 7.8134765625, 9.57421875, 11.3349609375, 13.095703125, 14.8564453125, 16.6171875, 18.3779296875, 20.138671875, 21.8994140625, 23.66015625, 25.4208984375, 27.181640625, 28.9423828125, 30.703125, 32.4638671875, 34.224609375, 35.9853515625, 37.74609375, 39.5068359375, 41.267578125, 43.0283203125, 44.7890625, 46.5498046875, 48.310546875, 50.0712890625, 51.83203125, 53.5927734375, 55.353515625, 57.1142578125, 58.875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 9.0, 16.0, 25.0, 28.0, 52.0, 80.0, 92.0, 143.0, 210.0, 301.0, 394.0, 579.0, 825.0, 1242.0, 1772.0, 2469.0, 3749.0, 5462.0, 7989.0, 11963.0, 18415.0, 28259.0, 43735.0, 68871.0, 109160.0, 166439.0, 190598.0, 138007.0, 87523.0, 55629.0, 35485.0, 22643.0, 15230.0, 9875.0, 6746.0, 4524.0, 3090.0, 2002.0, 1456.0, 986.0, 740.0, 529.0, 334.0, 276.0, 185.0, 141.0, 85.0, 54.0, 45.0, 28.0, 21.0, 13.0, 11.0, 6.0, 5.0, 2.0, 0.0, 1.0], "bins": [-103.75, -100.5341796875, -97.318359375, -94.1025390625, -90.88671875, -87.6708984375, -84.455078125, -81.2392578125, -78.0234375, -74.8076171875, -71.591796875, -68.3759765625, -65.16015625, -61.9443359375, -58.728515625, -55.5126953125, -52.296875, -49.0810546875, -45.865234375, -42.6494140625, -39.43359375, -36.2177734375, -33.001953125, -29.7861328125, -26.5703125, -23.3544921875, -20.138671875, -16.9228515625, -13.70703125, -10.4912109375, -7.275390625, -4.0595703125, -0.84375, 2.3720703125, 5.587890625, 8.8037109375, 12.01953125, 15.2353515625, 18.451171875, 21.6669921875, 24.8828125, 28.0986328125, 31.314453125, 34.5302734375, 37.74609375, 40.9619140625, 44.177734375, 47.3935546875, 50.609375, 53.8251953125, 57.041015625, 60.2568359375, 63.47265625, 66.6884765625, 69.904296875, 73.1201171875, 76.3359375, 79.5517578125, 82.767578125, 85.9833984375, 89.19921875, 92.4150390625, 95.630859375, 98.8466796875, 102.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 7.0, 9.0, 17.0, 18.0, 11.0, 24.0, 16.0, 30.0, 24.0, 37.0, 38.0, 23.0, 36.0, 51.0, 44.0, 41.0, 56.0, 46.0, 50.0, 42.0, 37.0, 32.0, 31.0, 33.0, 29.0, 30.0, 29.0, 26.0, 22.0, 21.0, 15.0, 18.0, 9.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-58.71875, -57.0380859375, -55.357421875, -53.6767578125, -51.99609375, -50.3154296875, -48.634765625, -46.9541015625, -45.2734375, -43.5927734375, -41.912109375, -40.2314453125, -38.55078125, -36.8701171875, -35.189453125, -33.5087890625, -31.828125, -30.1474609375, -28.466796875, -26.7861328125, -25.10546875, -23.4248046875, -21.744140625, -20.0634765625, -18.3828125, -16.7021484375, -15.021484375, -13.3408203125, -11.66015625, -9.9794921875, -8.298828125, -6.6181640625, -4.9375, -3.2568359375, -1.576171875, 0.1044921875, 1.78515625, 3.4658203125, 5.146484375, 6.8271484375, 8.5078125, 10.1884765625, 11.869140625, 13.5498046875, 15.23046875, 16.9111328125, 18.591796875, 20.2724609375, 21.953125, 23.6337890625, 25.314453125, 26.9951171875, 28.67578125, 30.3564453125, 32.037109375, 33.7177734375, 35.3984375, 37.0791015625, 38.759765625, 40.4404296875, 42.12109375, 43.8017578125, 45.482421875, 47.1630859375, 48.84375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 14.0, 31.0, 30.0, 41.0, 62.0, 67.0, 122.0, 152.0, 227.0, 343.0, 491.0, 629.0, 886.0, 1317.0, 1931.0, 3384.0, 6924.0, 19637.0, 102805.0, 777979.0, 96128.0, 18922.0, 6772.0, 3344.0, 1958.0, 1244.0, 912.0, 616.0, 509.0, 306.0, 232.0, 139.0, 105.0, 79.0, 59.0, 32.0, 31.0, 23.0, 19.0, 9.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-586.5, -568.4453125, -550.390625, -532.3359375, -514.28125, -496.2265625, -478.171875, -460.1171875, -442.0625, -424.0078125, -405.953125, -387.8984375, -369.84375, -351.7890625, -333.734375, -315.6796875, -297.625, -279.5703125, -261.515625, -243.4609375, -225.40625, -207.3515625, -189.296875, -171.2421875, -153.1875, -135.1328125, -117.078125, -99.0234375, -80.96875, -62.9140625, -44.859375, -26.8046875, -8.75, 9.3046875, 27.359375, 45.4140625, 63.46875, 81.5234375, 99.578125, 117.6328125, 135.6875, 153.7421875, 171.796875, 189.8515625, 207.90625, 225.9609375, 244.015625, 262.0703125, 280.125, 298.1796875, 316.234375, 334.2890625, 352.34375, 370.3984375, 388.453125, 406.5078125, 424.5625, 442.6171875, 460.671875, 478.7265625, 496.78125, 514.8359375, 532.890625, 550.9453125, 569.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 19.0, 40.0, 112.0, 216.0, 326.0, 156.0, 68.0, 27.0, 9.0, 13.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.01954364776611328, -0.018579483032226562, -0.017615318298339844, -0.016651153564453125, -0.015686988830566406, -0.014722824096679688, -0.013758659362792969, -0.01279449462890625, -0.011830329895019531, -0.010866165161132812, -0.009902000427246094, -0.008937835693359375, -0.007973670959472656, -0.0070095062255859375, -0.006045341491699219, -0.0050811767578125, -0.004117012023925781, -0.0031528472900390625, -0.0021886825561523438, -0.001224517822265625, -0.00026035308837890625, 0.0007038116455078125, 0.0016679763793945312, 0.00263214111328125, 0.0035963058471679688, 0.0045604705810546875, 0.005524635314941406, 0.006488800048828125, 0.007452964782714844, 0.008417129516601562, 0.009381294250488281, 0.010345458984375, 0.011309623718261719, 0.012273788452148438, 0.013237953186035156, 0.014202117919921875, 0.015166282653808594, 0.016130447387695312, 0.01709461212158203, 0.01805877685546875, 0.01902294158935547, 0.019987106323242188, 0.020951271057128906, 0.021915435791015625, 0.022879600524902344, 0.023843765258789062, 0.02480792999267578, 0.0257720947265625, 0.02673625946044922, 0.027700424194335938, 0.028664588928222656, 0.029628753662109375, 0.030592918395996094, 0.03155708312988281, 0.03252124786376953, 0.03348541259765625, 0.03444957733154297, 0.03541374206542969, 0.036377906799316406, 0.037342071533203125, 0.038306236267089844, 0.03927040100097656, 0.04023456573486328, 0.04119873046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 10.0, 7.0, 21.0, 22.0, 18.0, 46.0, 61.0, 79.0, 100.0, 145.0, 186.0, 262.0, 391.0, 510.0, 756.0, 1118.0, 1654.0, 2712.0, 5235.0, 13731.0, 65221.0, 749710.0, 166618.0, 23019.0, 7135.0, 3421.0, 1988.0, 1272.0, 898.0, 618.0, 417.0, 319.0, 213.0, 155.0, 120.0, 102.0, 74.0, 46.0, 24.0, 31.0, 19.0, 20.0, 11.0, 6.0, 7.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-526.0, -508.2890625, -490.578125, -472.8671875, -455.15625, -437.4453125, -419.734375, -402.0234375, -384.3125, -366.6015625, -348.890625, -331.1796875, -313.46875, -295.7578125, -278.046875, -260.3359375, -242.625, -224.9140625, -207.203125, -189.4921875, -171.78125, -154.0703125, -136.359375, -118.6484375, -100.9375, -83.2265625, -65.515625, -47.8046875, -30.09375, -12.3828125, 5.328125, 23.0390625, 40.75, 58.4609375, 76.171875, 93.8828125, 111.59375, 129.3046875, 147.015625, 164.7265625, 182.4375, 200.1484375, 217.859375, 235.5703125, 253.28125, 270.9921875, 288.703125, 306.4140625, 324.125, 341.8359375, 359.546875, 377.2578125, 394.96875, 412.6796875, 430.390625, 448.1015625, 465.8125, 483.5234375, 501.234375, 518.9453125, 536.65625, 554.3671875, 572.078125, 589.7890625, 607.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 6.0, 11.0, 16.0, 51.0, 80.0, 124.0, 177.0, 170.0, 128.0, 98.0, 52.0, 30.0, 14.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-175.375, -170.7666015625, -166.158203125, -161.5498046875, -156.94140625, -152.3330078125, -147.724609375, -143.1162109375, -138.5078125, -133.8994140625, -129.291015625, -124.6826171875, -120.07421875, -115.4658203125, -110.857421875, -106.2490234375, -101.640625, -97.0322265625, -92.423828125, -87.8154296875, -83.20703125, -78.5986328125, -73.990234375, -69.3818359375, -64.7734375, -60.1650390625, -55.556640625, -50.9482421875, -46.33984375, -41.7314453125, -37.123046875, -32.5146484375, -27.90625, -23.2978515625, -18.689453125, -14.0810546875, -9.47265625, -4.8642578125, -0.255859375, 4.3525390625, 8.9609375, 13.5693359375, 18.177734375, 22.7861328125, 27.39453125, 32.0029296875, 36.611328125, 41.2197265625, 45.828125, 50.4365234375, 55.044921875, 59.6533203125, 64.26171875, 68.8701171875, 73.478515625, 78.0869140625, 82.6953125, 87.3037109375, 91.912109375, 96.5205078125, 101.12890625, 105.7373046875, 110.345703125, 114.9541015625, 119.5625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 10.0, 19.0, 22.0, 41.0, 75.0, 95.0, 121.0, 124.0, 99.0, 77.0, 61.0, 44.0, 38.0, 23.0, 26.0, 26.0, 20.0, 8.0, 6.0, 8.0, 8.0, 4.0, 7.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-110.30298614501953, -105.17820739746094, -100.05343627929688, -94.92865753173828, -89.80387878417969, -84.6791000366211, -79.5543212890625, -74.42955017089844, -69.30477142333984, -64.17999267578125, -59.05521774291992, -53.930442810058594, -48.8056640625, -43.680885314941406, -38.55611038208008, -33.43133544921875, -28.306556701660156, -23.181779861450195, -18.057003021240234, -12.932226181030273, -7.8074493408203125, -2.6826725006103516, 2.4421043395996094, 7.5668792724609375, 12.691658020019531, 17.816434860229492, 22.941211700439453, 28.065988540649414, 33.190765380859375, 38.31554412841797, 43.4403190612793, 48.565093994140625, 53.68986511230469, 58.81464385986328, 63.93941879272461, 69.06419372558594, 74.18897247314453, 79.31375122070312, 84.43852233886719, 89.56330108642578, 94.68807983398438, 99.81285858154297, 104.93763732910156, 110.06240844726562, 115.18718719482422, 120.31196594238281, 125.43673706054688, 130.5615234375, 135.68629455566406, 140.81106567382812, 145.93585205078125, 151.0606231689453, 156.18539428710938, 161.3101806640625, 166.43495178222656, 171.55972290039062, 176.68450927734375, 181.8092803955078, 186.93406677246094, 192.058837890625, 197.18362426757812, 202.3083953857422, 207.43316650390625, 212.55795288085938, 217.68272399902344]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 13.0, 11.0, 7.0, 15.0, 19.0, 11.0, 18.0, 22.0, 26.0, 21.0, 28.0, 27.0, 48.0, 41.0, 28.0, 41.0, 40.0, 52.0, 38.0, 49.0, 44.0, 39.0, 37.0, 32.0, 35.0, 36.0, 28.0, 29.0, 29.0, 18.0, 13.0, 16.0, 14.0, 15.0, 11.0, 14.0, 9.0, 6.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.78646850585938, -81.228515625, -78.6705551147461, -76.11260223388672, -73.55464172363281, -70.99668884277344, -68.43873596191406, -65.88078308105469, -63.32282257080078, -60.76486587524414, -58.2069091796875, -55.648956298828125, -53.090999603271484, -50.533042907714844, -47.97509002685547, -45.41713333129883, -42.85917663574219, -40.30121994018555, -37.743263244628906, -35.18531036376953, -32.62735366821289, -30.06939697265625, -27.511442184448242, -24.953487396240234, -22.395530700683594, -19.837574005126953, -17.279619216918945, -14.721663475036621, -12.163707733154297, -9.605751991271973, -7.047796249389648, -4.489841461181641, -1.9318923950195312, 0.626063346862793, 3.184019088745117, 5.741974830627441, 8.299930572509766, 10.85788631439209, 13.415842056274414, 15.973796844482422, 18.531753540039062, 21.089710235595703, 23.64766502380371, 26.20561981201172, 28.76357650756836, 31.321533203125, 33.879486083984375, 36.437442779541016, 38.995399475097656, 41.5533561706543, 44.11131286621094, 46.66926574707031, 49.22722244262695, 51.785179138183594, 54.34313201904297, 56.90108871459961, 59.45904541015625, 62.01700210571289, 64.57495880126953, 67.1329116821289, 69.69087219238281, 72.24882507324219, 74.80677795410156, 77.36473083496094, 79.92269134521484]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 8.0, 4.0, 5.0, 5.0, 9.0, 11.0, 13.0, 19.0, 33.0, 35.0, 50.0, 74.0, 89.0, 129.0, 215.0, 296.0, 424.0, 587.0, 910.0, 1431.0, 2125.0, 3229.0, 5122.0, 8346.0, 13552.0, 22159.0, 37449.0, 66278.0, 125725.0, 287751.0, 1018814.0, 1677503.0, 517911.0, 188982.0, 92262.0, 49847.0, 28202.0, 16802.0, 10426.0, 6316.0, 4019.0, 2417.0, 1638.0, 1041.0, 691.0, 443.0, 300.0, 183.0, 139.0, 83.0, 62.0, 47.0, 26.0, 21.0, 15.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0], "bins": [-121.1875, -117.6494140625, -114.111328125, -110.5732421875, -107.03515625, -103.4970703125, -99.958984375, -96.4208984375, -92.8828125, -89.3447265625, -85.806640625, -82.2685546875, -78.73046875, -75.1923828125, -71.654296875, -68.1162109375, -64.578125, -61.0400390625, -57.501953125, -53.9638671875, -50.42578125, -46.8876953125, -43.349609375, -39.8115234375, -36.2734375, -32.7353515625, -29.197265625, -25.6591796875, -22.12109375, -18.5830078125, -15.044921875, -11.5068359375, -7.96875, -4.4306640625, -0.892578125, 2.6455078125, 6.18359375, 9.7216796875, 13.259765625, 16.7978515625, 20.3359375, 23.8740234375, 27.412109375, 30.9501953125, 34.48828125, 38.0263671875, 41.564453125, 45.1025390625, 48.640625, 52.1787109375, 55.716796875, 59.2548828125, 62.79296875, 66.3310546875, 69.869140625, 73.4072265625, 76.9453125, 80.4833984375, 84.021484375, 87.5595703125, 91.09765625, 94.6357421875, 98.173828125, 101.7119140625, 105.25]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 13.0, 14.0, 11.0, 17.0, 21.0, 30.0, 17.0, 18.0, 32.0, 40.0, 31.0, 35.0, 38.0, 49.0, 32.0, 49.0, 37.0, 43.0, 55.0, 51.0, 42.0, 33.0, 32.0, 30.0, 19.0, 29.0, 25.0, 28.0, 24.0, 18.0, 15.0, 9.0, 11.0, 5.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-48.3125, -46.98974609375, -45.6669921875, -44.34423828125, -43.021484375, -41.69873046875, -40.3759765625, -39.05322265625, -37.73046875, -36.40771484375, -35.0849609375, -33.76220703125, -32.439453125, -31.11669921875, -29.7939453125, -28.47119140625, -27.1484375, -25.82568359375, -24.5029296875, -23.18017578125, -21.857421875, -20.53466796875, -19.2119140625, -17.88916015625, -16.56640625, -15.24365234375, -13.9208984375, -12.59814453125, -11.275390625, -9.95263671875, -8.6298828125, -7.30712890625, -5.984375, -4.66162109375, -3.3388671875, -2.01611328125, -0.693359375, 0.62939453125, 1.9521484375, 3.27490234375, 4.59765625, 5.92041015625, 7.2431640625, 8.56591796875, 9.888671875, 11.21142578125, 12.5341796875, 13.85693359375, 15.1796875, 16.50244140625, 17.8251953125, 19.14794921875, 20.470703125, 21.79345703125, 23.1162109375, 24.43896484375, 25.76171875, 27.08447265625, 28.4072265625, 29.72998046875, 31.052734375, 32.37548828125, 33.6982421875, 35.02099609375, 36.34375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 10.0, 16.0, 22.0, 37.0, 54.0, 93.0, 101.0, 196.0, 286.0, 458.0, 719.0, 1202.0, 1860.0, 3145.0, 5237.0, 9778.0, 18347.0, 39255.0, 91721.0, 262780.0, 1027142.0, 1992400.0, 476863.0, 147575.0, 57872.0, 26305.0, 13293.0, 7095.0, 4128.0, 2410.0, 1445.0, 908.0, 551.0, 356.0, 190.0, 155.0, 101.0, 58.0, 37.0, 30.0, 12.0, 13.0, 4.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-145.75, -141.4931640625, -137.236328125, -132.9794921875, -128.72265625, -124.4658203125, -120.208984375, -115.9521484375, -111.6953125, -107.4384765625, -103.181640625, -98.9248046875, -94.66796875, -90.4111328125, -86.154296875, -81.8974609375, -77.640625, -73.3837890625, -69.126953125, -64.8701171875, -60.61328125, -56.3564453125, -52.099609375, -47.8427734375, -43.5859375, -39.3291015625, -35.072265625, -30.8154296875, -26.55859375, -22.3017578125, -18.044921875, -13.7880859375, -9.53125, -5.2744140625, -1.017578125, 3.2392578125, 7.49609375, 11.7529296875, 16.009765625, 20.2666015625, 24.5234375, 28.7802734375, 33.037109375, 37.2939453125, 41.55078125, 45.8076171875, 50.064453125, 54.3212890625, 58.578125, 62.8349609375, 67.091796875, 71.3486328125, 75.60546875, 79.8623046875, 84.119140625, 88.3759765625, 92.6328125, 96.8896484375, 101.146484375, 105.4033203125, 109.66015625, 113.9169921875, 118.173828125, 122.4306640625, 126.6875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 5.0, 3.0, 8.0, 9.0, 18.0, 6.0, 14.0, 18.0, 15.0, 28.0, 40.0, 46.0, 46.0, 55.0, 88.0, 107.0, 142.0, 154.0, 184.0, 241.0, 287.0, 320.0, 378.0, 329.0, 307.0, 266.0, 196.0, 157.0, 133.0, 91.0, 69.0, 73.0, 53.0, 43.0, 37.0, 26.0, 21.0, 15.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.234375, -26.4013671875, -25.568359375, -24.7353515625, -23.90234375, -23.0693359375, -22.236328125, -21.4033203125, -20.5703125, -19.7373046875, -18.904296875, -18.0712890625, -17.23828125, -16.4052734375, -15.572265625, -14.7392578125, -13.90625, -13.0732421875, -12.240234375, -11.4072265625, -10.57421875, -9.7412109375, -8.908203125, -8.0751953125, -7.2421875, -6.4091796875, -5.576171875, -4.7431640625, -3.91015625, -3.0771484375, -2.244140625, -1.4111328125, -0.578125, 0.2548828125, 1.087890625, 1.9208984375, 2.75390625, 3.5869140625, 4.419921875, 5.2529296875, 6.0859375, 6.9189453125, 7.751953125, 8.5849609375, 9.41796875, 10.2509765625, 11.083984375, 11.9169921875, 12.75, 13.5830078125, 14.416015625, 15.2490234375, 16.08203125, 16.9150390625, 17.748046875, 18.5810546875, 19.4140625, 20.2470703125, 21.080078125, 21.9130859375, 22.74609375, 23.5791015625, 24.412109375, 25.2451171875, 26.078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 10.0, 5.0, 7.0, 3.0, 17.0, 23.0, 16.0, 48.0, 69.0, 98.0, 130.0, 150.0, 126.0, 103.0, 58.0, 41.0, 25.0, 19.0, 15.0, 11.0, 12.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.96485137939453, -95.12291717529297, -91.28097534179688, -87.43904113769531, -83.59710693359375, -79.75517272949219, -75.9132308959961, -72.07129669189453, -68.22935485839844, -64.38742065429688, -60.54548263549805, -56.70354461669922, -52.861610412597656, -49.01967239379883, -45.177734375, -41.33580017089844, -37.493865966796875, -33.65192794799805, -29.809993743896484, -25.968055725097656, -22.12611961364746, -18.284183502197266, -14.442245483398438, -10.600309371948242, -6.758373260498047, -2.9164366722106934, 0.9254999160766602, 4.767436981201172, 8.609373092651367, 12.451309204101562, 16.29324722290039, 20.135183334350586, 23.977127075195312, 27.819063186645508, 31.660999298095703, 35.50293731689453, 39.344871520996094, 43.18680953979492, 47.02874755859375, 50.87068176269531, 54.71261978149414, 58.55455780029297, 62.39649200439453, 66.23843383789062, 70.08036804199219, 73.92230224609375, 77.76423645019531, 81.6061782836914, 85.44811248779297, 89.29004669189453, 93.13198852539062, 96.97392272949219, 100.81585693359375, 104.65779113769531, 108.4997329711914, 112.34166717529297, 116.18360900878906, 120.02554321289062, 123.86748504638672, 127.70941925048828, 131.55136108398438, 135.39329528808594, 139.2352294921875, 143.07716369628906, 146.91909790039062]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 7.0, 4.0, 12.0, 13.0, 15.0, 9.0, 25.0, 24.0, 26.0, 17.0, 31.0, 39.0, 28.0, 30.0, 42.0, 37.0, 43.0, 41.0, 43.0, 40.0, 46.0, 50.0, 36.0, 30.0, 31.0, 41.0, 32.0, 26.0, 23.0, 21.0, 23.0, 26.0, 17.0, 13.0, 13.0, 9.0, 16.0, 4.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.307769775390625, -56.57895278930664, -54.850135803222656, -53.121315002441406, -51.39249801635742, -49.66368103027344, -47.93486404418945, -46.20604705810547, -44.47722625732422, -42.748409271240234, -41.01959228515625, -39.290771484375, -37.561954498291016, -35.83313751220703, -34.10432052612305, -32.37550354003906, -30.646684646606445, -28.91786766052246, -27.189048767089844, -25.46023178100586, -23.731412887573242, -22.002595901489258, -20.27377700805664, -18.544960021972656, -16.816143035888672, -15.087325096130371, -13.35850715637207, -11.629690170288086, -9.900871276855469, -8.172054290771484, -6.443236351013184, -4.714418411254883, -2.9855995178222656, -1.2567816972732544, 0.47203612327575684, 2.2008538246154785, 3.9296717643737793, 5.658489227294922, 7.387307167053223, 9.116125106811523, 10.844943046569824, 12.573760986328125, 14.302578926086426, 16.031396865844727, 17.76021385192871, 19.489032745361328, 21.217849731445312, 22.946666717529297, 24.675485610961914, 26.4043025970459, 28.133121490478516, 29.8619384765625, 31.590757369995117, 33.31957244873047, 35.04839324951172, 36.7772102355957, 38.50602722167969, 40.23484420776367, 41.963661193847656, 43.692481994628906, 45.42129898071289, 47.150115966796875, 48.87893295288086, 50.607749938964844, 52.336570739746094]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 10.0, 29.0, 29.0, 40.0, 59.0, 106.0, 118.0, 181.0, 245.0, 368.0, 512.0, 823.0, 1244.0, 1782.0, 2614.0, 4058.0, 6353.0, 9820.0, 15545.0, 25957.0, 44878.0, 80109.0, 155745.0, 274878.0, 191650.0, 97209.0, 53249.0, 30543.0, 18166.0, 11250.0, 7230.0, 4637.0, 2876.0, 1945.0, 1398.0, 908.0, 626.0, 411.0, 274.0, 196.0, 135.0, 101.0, 74.0, 69.0, 18.0, 29.0, 21.0, 10.0, 2.0, 6.0, 4.0, 3.0, 0.0, 4.0], "bins": [-37.28125, -36.17333984375, -35.0654296875, -33.95751953125, -32.849609375, -31.74169921875, -30.6337890625, -29.52587890625, -28.41796875, -27.31005859375, -26.2021484375, -25.09423828125, -23.986328125, -22.87841796875, -21.7705078125, -20.66259765625, -19.5546875, -18.44677734375, -17.3388671875, -16.23095703125, -15.123046875, -14.01513671875, -12.9072265625, -11.79931640625, -10.69140625, -9.58349609375, -8.4755859375, -7.36767578125, -6.259765625, -5.15185546875, -4.0439453125, -2.93603515625, -1.828125, -0.72021484375, 0.3876953125, 1.49560546875, 2.603515625, 3.71142578125, 4.8193359375, 5.92724609375, 7.03515625, 8.14306640625, 9.2509765625, 10.35888671875, 11.466796875, 12.57470703125, 13.6826171875, 14.79052734375, 15.8984375, 17.00634765625, 18.1142578125, 19.22216796875, 20.330078125, 21.43798828125, 22.5458984375, 23.65380859375, 24.76171875, 25.86962890625, 26.9775390625, 28.08544921875, 29.193359375, 30.30126953125, 31.4091796875, 32.51708984375, 33.625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 3.0, 8.0, 3.0, 6.0, 4.0, 9.0, 15.0, 20.0, 12.0, 22.0, 24.0, 23.0, 24.0, 23.0, 32.0, 27.0, 41.0, 45.0, 42.0, 37.0, 37.0, 38.0, 31.0, 48.0, 44.0, 56.0, 25.0, 29.0, 33.0, 27.0, 35.0, 22.0, 20.0, 26.0, 14.0, 23.0, 12.0, 18.0, 13.0, 9.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.15625, -51.58251953125, -50.0087890625, -48.43505859375, -46.861328125, -45.28759765625, -43.7138671875, -42.14013671875, -40.56640625, -38.99267578125, -37.4189453125, -35.84521484375, -34.271484375, -32.69775390625, -31.1240234375, -29.55029296875, -27.9765625, -26.40283203125, -24.8291015625, -23.25537109375, -21.681640625, -20.10791015625, -18.5341796875, -16.96044921875, -15.38671875, -13.81298828125, -12.2392578125, -10.66552734375, -9.091796875, -7.51806640625, -5.9443359375, -4.37060546875, -2.796875, -1.22314453125, 0.3505859375, 1.92431640625, 3.498046875, 5.07177734375, 6.6455078125, 8.21923828125, 9.79296875, 11.36669921875, 12.9404296875, 14.51416015625, 16.087890625, 17.66162109375, 19.2353515625, 20.80908203125, 22.3828125, 23.95654296875, 25.5302734375, 27.10400390625, 28.677734375, 30.25146484375, 31.8251953125, 33.39892578125, 34.97265625, 36.54638671875, 38.1201171875, 39.69384765625, 41.267578125, 42.84130859375, 44.4150390625, 45.98876953125, 47.5625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 10.0, 7.0, 11.0, 23.0, 23.0, 42.0, 49.0, 105.0, 134.0, 210.0, 263.0, 446.0, 688.0, 1215.0, 2076.0, 3774.0, 6840.0, 13363.0, 28585.0, 72631.0, 275305.0, 462187.0, 106306.0, 38180.0, 16738.0, 8430.0, 4455.0, 2532.0, 1401.0, 919.0, 554.0, 379.0, 243.0, 145.0, 108.0, 60.0, 31.0, 31.0, 15.0, 11.0, 10.0, 8.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.75, -44.2333984375, -42.716796875, -41.2001953125, -39.68359375, -38.1669921875, -36.650390625, -35.1337890625, -33.6171875, -32.1005859375, -30.583984375, -29.0673828125, -27.55078125, -26.0341796875, -24.517578125, -23.0009765625, -21.484375, -19.9677734375, -18.451171875, -16.9345703125, -15.41796875, -13.9013671875, -12.384765625, -10.8681640625, -9.3515625, -7.8349609375, -6.318359375, -4.8017578125, -3.28515625, -1.7685546875, -0.251953125, 1.2646484375, 2.78125, 4.2978515625, 5.814453125, 7.3310546875, 8.84765625, 10.3642578125, 11.880859375, 13.3974609375, 14.9140625, 16.4306640625, 17.947265625, 19.4638671875, 20.98046875, 22.4970703125, 24.013671875, 25.5302734375, 27.046875, 28.5634765625, 30.080078125, 31.5966796875, 33.11328125, 34.6298828125, 36.146484375, 37.6630859375, 39.1796875, 40.6962890625, 42.212890625, 43.7294921875, 45.24609375, 46.7626953125, 48.279296875, 49.7958984375, 51.3125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 10.0, 11.0, 13.0, 10.0, 12.0, 18.0, 17.0, 20.0, 29.0, 26.0, 20.0, 32.0, 37.0, 40.0, 39.0, 51.0, 44.0, 41.0, 51.0, 42.0, 44.0, 40.0, 33.0, 37.0, 33.0, 29.0, 31.0, 23.0, 26.0, 27.0, 19.0, 15.0, 14.0, 8.0, 14.0, 13.0, 6.0, 4.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -34.2568359375, -33.138671875, -32.0205078125, -30.90234375, -29.7841796875, -28.666015625, -27.5478515625, -26.4296875, -25.3115234375, -24.193359375, -23.0751953125, -21.95703125, -20.8388671875, -19.720703125, -18.6025390625, -17.484375, -16.3662109375, -15.248046875, -14.1298828125, -13.01171875, -11.8935546875, -10.775390625, -9.6572265625, -8.5390625, -7.4208984375, -6.302734375, -5.1845703125, -4.06640625, -2.9482421875, -1.830078125, -0.7119140625, 0.40625, 1.5244140625, 2.642578125, 3.7607421875, 4.87890625, 5.9970703125, 7.115234375, 8.2333984375, 9.3515625, 10.4697265625, 11.587890625, 12.7060546875, 13.82421875, 14.9423828125, 16.060546875, 17.1787109375, 18.296875, 19.4150390625, 20.533203125, 21.6513671875, 22.76953125, 23.8876953125, 25.005859375, 26.1240234375, 27.2421875, 28.3603515625, 29.478515625, 30.5966796875, 31.71484375, 32.8330078125, 33.951171875, 35.0693359375, 36.1875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 8.0, 5.0, 8.0, 7.0, 9.0, 20.0, 20.0, 31.0, 29.0, 35.0, 67.0, 76.0, 111.0, 162.0, 193.0, 276.0, 384.0, 495.0, 747.0, 1138.0, 1668.0, 2511.0, 4226.0, 7592.0, 15009.0, 35243.0, 112124.0, 584143.0, 189744.0, 49529.0, 19570.0, 9419.0, 4890.0, 2962.0, 1864.0, 1263.0, 820.0, 567.0, 409.0, 292.0, 249.0, 192.0, 117.0, 93.0, 61.0, 41.0, 42.0, 16.0, 23.0, 19.0, 14.0, 12.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-12.3828125, -11.97900390625, -11.5751953125, -11.17138671875, -10.767578125, -10.36376953125, -9.9599609375, -9.55615234375, -9.15234375, -8.74853515625, -8.3447265625, -7.94091796875, -7.537109375, -7.13330078125, -6.7294921875, -6.32568359375, -5.921875, -5.51806640625, -5.1142578125, -4.71044921875, -4.306640625, -3.90283203125, -3.4990234375, -3.09521484375, -2.69140625, -2.28759765625, -1.8837890625, -1.47998046875, -1.076171875, -0.67236328125, -0.2685546875, 0.13525390625, 0.5390625, 0.94287109375, 1.3466796875, 1.75048828125, 2.154296875, 2.55810546875, 2.9619140625, 3.36572265625, 3.76953125, 4.17333984375, 4.5771484375, 4.98095703125, 5.384765625, 5.78857421875, 6.1923828125, 6.59619140625, 7.0, 7.40380859375, 7.8076171875, 8.21142578125, 8.615234375, 9.01904296875, 9.4228515625, 9.82666015625, 10.23046875, 10.63427734375, 11.0380859375, 11.44189453125, 11.845703125, 12.24951171875, 12.6533203125, 13.05712890625, 13.4609375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 12.0, 14.0, 19.0, 20.0, 12.0, 17.0, 23.0, 46.0, 41.0, 40.0, 33.0, 47.0, 58.0, 63.0, 47.0, 53.0, 42.0, 46.0, 45.0, 32.0, 37.0, 40.0, 30.0, 38.0, 29.0, 20.0, 15.0, 19.0, 12.0, 7.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00146484375, -0.0014178454875946045, -0.001370847225189209, -0.0013238489627838135, -0.001276850700378418, -0.0012298524379730225, -0.001182854175567627, -0.0011358559131622314, -0.001088857650756836, -0.0010418593883514404, -0.000994861125946045, -0.0009478628635406494, -0.0009008646011352539, -0.0008538663387298584, -0.0008068680763244629, -0.0007598698139190674, -0.0007128715515136719, -0.0006658732891082764, -0.0006188750267028809, -0.0005718767642974854, -0.0005248785018920898, -0.00047788023948669434, -0.00043088197708129883, -0.0003838837146759033, -0.0003368854522705078, -0.0002898871898651123, -0.0002428889274597168, -0.0001958906650543213, -0.00014889240264892578, -0.00010189414024353027, -5.4895877838134766e-05, -7.897615432739258e-06, 3.910064697265625e-05, 8.609890937805176e-05, 0.00013309717178344727, 0.00018009543418884277, 0.00022709369659423828, 0.0002740919589996338, 0.0003210902214050293, 0.0003680884838104248, 0.0004150867462158203, 0.0004620850086212158, 0.0005090832710266113, 0.0005560815334320068, 0.0006030797958374023, 0.0006500780582427979, 0.0006970763206481934, 0.0007440745830535889, 0.0007910728454589844, 0.0008380711078643799, 0.0008850693702697754, 0.0009320676326751709, 0.0009790658950805664, 0.001026064157485962, 0.0010730624198913574, 0.001120060682296753, 0.0011670589447021484, 0.001214057207107544, 0.0012610554695129395, 0.001308053731918335, 0.0013550519943237305, 0.001402050256729126, 0.0014490485191345215, 0.001496046781539917, 0.0015430450439453125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 7.0, 3.0, 7.0, 12.0, 11.0, 16.0, 32.0, 11.0, 35.0, 39.0, 93.0, 88.0, 162.0, 232.0, 357.0, 544.0, 831.0, 1443.0, 2625.0, 4655.0, 9021.0, 17972.0, 40120.0, 101386.0, 348072.0, 342833.0, 99933.0, 39862.0, 18128.0, 8786.0, 4708.0, 2572.0, 1467.0, 885.0, 527.0, 344.0, 218.0, 166.0, 84.0, 75.0, 51.0, 43.0, 30.0, 19.0, 13.0, 15.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-18.3125, -17.7216796875, -17.130859375, -16.5400390625, -15.94921875, -15.3583984375, -14.767578125, -14.1767578125, -13.5859375, -12.9951171875, -12.404296875, -11.8134765625, -11.22265625, -10.6318359375, -10.041015625, -9.4501953125, -8.859375, -8.2685546875, -7.677734375, -7.0869140625, -6.49609375, -5.9052734375, -5.314453125, -4.7236328125, -4.1328125, -3.5419921875, -2.951171875, -2.3603515625, -1.76953125, -1.1787109375, -0.587890625, 0.0029296875, 0.59375, 1.1845703125, 1.775390625, 2.3662109375, 2.95703125, 3.5478515625, 4.138671875, 4.7294921875, 5.3203125, 5.9111328125, 6.501953125, 7.0927734375, 7.68359375, 8.2744140625, 8.865234375, 9.4560546875, 10.046875, 10.6376953125, 11.228515625, 11.8193359375, 12.41015625, 13.0009765625, 13.591796875, 14.1826171875, 14.7734375, 15.3642578125, 15.955078125, 16.5458984375, 17.13671875, 17.7275390625, 18.318359375, 18.9091796875, 19.5]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 17.0, 21.0, 16.0, 38.0, 40.0, 57.0, 54.0, 73.0, 84.0, 96.0, 88.0, 78.0, 72.0, 53.0, 48.0, 45.0, 27.0, 25.0, 13.0, 10.0, 9.0, 7.0, 4.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3671875, -5.21319580078125, -5.0592041015625, -4.90521240234375, -4.751220703125, -4.59722900390625, -4.4432373046875, -4.28924560546875, -4.13525390625, -3.98126220703125, -3.8272705078125, -3.67327880859375, -3.519287109375, -3.36529541015625, -3.2113037109375, -3.05731201171875, -2.9033203125, -2.74932861328125, -2.5953369140625, -2.44134521484375, -2.287353515625, -2.13336181640625, -1.9793701171875, -1.82537841796875, -1.67138671875, -1.51739501953125, -1.3634033203125, -1.20941162109375, -1.055419921875, -0.90142822265625, -0.7474365234375, -0.59344482421875, -0.439453125, -0.28546142578125, -0.1314697265625, 0.02252197265625, 0.176513671875, 0.33050537109375, 0.4844970703125, 0.63848876953125, 0.79248046875, 0.94647216796875, 1.1004638671875, 1.25445556640625, 1.408447265625, 1.56243896484375, 1.7164306640625, 1.87042236328125, 2.0244140625, 2.17840576171875, 2.3323974609375, 2.48638916015625, 2.640380859375, 2.79437255859375, 2.9483642578125, 3.10235595703125, 3.25634765625, 3.41033935546875, 3.5643310546875, 3.71832275390625, 3.872314453125, 4.02630615234375, 4.1802978515625, 4.33428955078125, 4.48828125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 8.0, 9.0, 9.0, 13.0, 24.0, 35.0, 56.0, 89.0, 113.0, 158.0, 143.0, 110.0, 66.0, 48.0, 38.0, 16.0, 20.0, 10.0, 4.0, 10.0, 3.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.15624237060547, -89.26184844970703, -85.36744689941406, -81.47305297851562, -77.57865905761719, -73.68425750732422, -69.78986358642578, -65.89546203613281, -62.001068115234375, -58.10667037963867, -54.21227264404297, -50.31787872314453, -46.42348098754883, -42.529083251953125, -38.63468933105469, -34.740291595458984, -30.84589385986328, -26.951496124267578, -23.057100296020508, -19.162704467773438, -15.268306732177734, -11.373908996582031, -7.479513168334961, -3.5851173400878906, 0.3092803955078125, 4.203677177429199, 8.098073959350586, 11.992470741271973, 15.88686752319336, 19.781265258789062, 23.675661087036133, 27.570056915283203, 31.464462280273438, 35.35886001586914, 39.253257751464844, 43.14765167236328, 47.042049407958984, 50.93644714355469, 54.830841064453125, 58.72523880004883, 62.61963653564453, 66.51403045654297, 70.40843200683594, 74.30282592773438, 78.19721984863281, 82.09162139892578, 85.98601531982422, 89.88041687011719, 93.77481079101562, 97.66920471191406, 101.56360626220703, 105.45800018310547, 109.35240173339844, 113.24679565429688, 117.14118957519531, 121.03558349609375, 124.92998504638672, 128.8243865966797, 132.71878051757812, 136.61317443847656, 140.507568359375, 144.4019775390625, 148.29637145996094, 152.19076538085938, 156.0851593017578]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 11.0, 9.0, 14.0, 12.0, 20.0, 26.0, 22.0, 22.0, 22.0, 35.0, 30.0, 42.0, 31.0, 42.0, 38.0, 45.0, 39.0, 45.0, 42.0, 43.0, 41.0, 32.0, 30.0, 43.0, 42.0, 22.0, 17.0, 23.0, 27.0, 17.0, 31.0, 11.0, 14.0, 9.0, 14.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.68360900878906, -53.0902099609375, -51.49680709838867, -49.90340805053711, -48.31000518798828, -46.71660614013672, -45.123207092285156, -43.52980422973633, -41.9364013671875, -40.34300231933594, -38.74959945678711, -37.15620040893555, -35.56279754638672, -33.969398498535156, -32.375999450683594, -30.782596588134766, -29.189197540283203, -27.595796585083008, -26.002395629882812, -24.40899658203125, -22.815593719482422, -21.22219467163086, -19.628793716430664, -18.03539276123047, -16.441991806030273, -14.848590850830078, -13.255189895629883, -11.661789894104004, -10.068388938903809, -8.474987983703613, -6.881587982177734, -5.288187026977539, -3.6947860717773438, -2.1013853549957275, -0.5079846382141113, 1.0854158401489258, 2.678816795349121, 4.272217750549316, 5.865617752075195, 7.459018707275391, 9.052419662475586, 10.645820617675781, 12.239221572875977, 13.832621574401855, 15.42602252960205, 17.019424438476562, 18.612823486328125, 20.20622444152832, 21.799625396728516, 23.39302635192871, 24.986427307128906, 26.57982635498047, 28.173229217529297, 29.76662826538086, 31.360029220581055, 32.95343017578125, 34.54682922363281, 36.140228271484375, 37.7336311340332, 39.327030181884766, 40.920433044433594, 42.513832092285156, 44.10723114013672, 45.70063400268555, 47.294036865234375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 18.0, 21.0, 36.0, 56.0, 71.0, 116.0, 145.0, 224.0, 361.0, 556.0, 860.0, 1285.0, 1973.0, 3249.0, 4976.0, 8012.0, 12903.0, 21042.0, 34609.0, 56254.0, 91227.0, 146678.0, 209229.0, 172307.0, 108305.0, 67098.0, 40697.0, 24845.0, 15374.0, 9528.0, 5834.0, 3781.0, 2380.0, 1528.0, 1034.0, 625.0, 424.0, 296.0, 210.0, 115.0, 78.0, 60.0, 31.0, 31.0, 21.0, 15.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.3125, -86.4931640625, -83.673828125, -80.8544921875, -78.03515625, -75.2158203125, -72.396484375, -69.5771484375, -66.7578125, -63.9384765625, -61.119140625, -58.2998046875, -55.48046875, -52.6611328125, -49.841796875, -47.0224609375, -44.203125, -41.3837890625, -38.564453125, -35.7451171875, -32.92578125, -30.1064453125, -27.287109375, -24.4677734375, -21.6484375, -18.8291015625, -16.009765625, -13.1904296875, -10.37109375, -7.5517578125, -4.732421875, -1.9130859375, 0.90625, 3.7255859375, 6.544921875, 9.3642578125, 12.18359375, 15.0029296875, 17.822265625, 20.6416015625, 23.4609375, 26.2802734375, 29.099609375, 31.9189453125, 34.73828125, 37.5576171875, 40.376953125, 43.1962890625, 46.015625, 48.8349609375, 51.654296875, 54.4736328125, 57.29296875, 60.1123046875, 62.931640625, 65.7509765625, 68.5703125, 71.3896484375, 74.208984375, 77.0283203125, 79.84765625, 82.6669921875, 85.486328125, 88.3056640625, 91.125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 5.0, 4.0, 7.0, 14.0, 6.0, 14.0, 15.0, 13.0, 22.0, 21.0, 24.0, 24.0, 26.0, 27.0, 32.0, 35.0, 41.0, 40.0, 44.0, 41.0, 31.0, 68.0, 43.0, 33.0, 33.0, 41.0, 37.0, 23.0, 35.0, 26.0, 24.0, 30.0, 32.0, 19.0, 20.0, 13.0, 6.0, 9.0, 5.0, 9.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-52.78125, -51.3427734375, -49.904296875, -48.4658203125, -47.02734375, -45.5888671875, -44.150390625, -42.7119140625, -41.2734375, -39.8349609375, -38.396484375, -36.9580078125, -35.51953125, -34.0810546875, -32.642578125, -31.2041015625, -29.765625, -28.3271484375, -26.888671875, -25.4501953125, -24.01171875, -22.5732421875, -21.134765625, -19.6962890625, -18.2578125, -16.8193359375, -15.380859375, -13.9423828125, -12.50390625, -11.0654296875, -9.626953125, -8.1884765625, -6.75, -5.3115234375, -3.873046875, -2.4345703125, -0.99609375, 0.4423828125, 1.880859375, 3.3193359375, 4.7578125, 6.1962890625, 7.634765625, 9.0732421875, 10.51171875, 11.9501953125, 13.388671875, 14.8271484375, 16.265625, 17.7041015625, 19.142578125, 20.5810546875, 22.01953125, 23.4580078125, 24.896484375, 26.3349609375, 27.7734375, 29.2119140625, 30.650390625, 32.0888671875, 33.52734375, 34.9658203125, 36.404296875, 37.8427734375, 39.28125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 20.0, 25.0, 49.0, 64.0, 94.0, 154.0, 237.0, 352.0, 516.0, 849.0, 1227.0, 1940.0, 2960.0, 4765.0, 7691.0, 12909.0, 22064.0, 38195.0, 69957.0, 135071.0, 257248.0, 230298.0, 116518.0, 61501.0, 33557.0, 19580.0, 11502.0, 7026.0, 4296.0, 2794.0, 1695.0, 1111.0, 762.0, 490.0, 351.0, 211.0, 143.0, 98.0, 68.0, 52.0, 36.0, 16.0, 9.0, 12.0, 4.0, 2.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-102.9375, -99.7099609375, -96.482421875, -93.2548828125, -90.02734375, -86.7998046875, -83.572265625, -80.3447265625, -77.1171875, -73.8896484375, -70.662109375, -67.4345703125, -64.20703125, -60.9794921875, -57.751953125, -54.5244140625, -51.296875, -48.0693359375, -44.841796875, -41.6142578125, -38.38671875, -35.1591796875, -31.931640625, -28.7041015625, -25.4765625, -22.2490234375, -19.021484375, -15.7939453125, -12.56640625, -9.3388671875, -6.111328125, -2.8837890625, 0.34375, 3.5712890625, 6.798828125, 10.0263671875, 13.25390625, 16.4814453125, 19.708984375, 22.9365234375, 26.1640625, 29.3916015625, 32.619140625, 35.8466796875, 39.07421875, 42.3017578125, 45.529296875, 48.7568359375, 51.984375, 55.2119140625, 58.439453125, 61.6669921875, 64.89453125, 68.1220703125, 71.349609375, 74.5771484375, 77.8046875, 81.0322265625, 84.259765625, 87.4873046875, 90.71484375, 93.9423828125, 97.169921875, 100.3974609375, 103.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 9.0, 4.0, 13.0, 11.0, 15.0, 21.0, 20.0, 23.0, 34.0, 38.0, 34.0, 46.0, 34.0, 40.0, 43.0, 48.0, 40.0, 53.0, 50.0, 54.0, 45.0, 44.0, 41.0, 31.0, 30.0, 25.0, 36.0, 17.0, 22.0, 18.0, 9.0, 8.0, 11.0, 12.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.34375, -46.9228515625, -45.501953125, -44.0810546875, -42.66015625, -41.2392578125, -39.818359375, -38.3974609375, -36.9765625, -35.5556640625, -34.134765625, -32.7138671875, -31.29296875, -29.8720703125, -28.451171875, -27.0302734375, -25.609375, -24.1884765625, -22.767578125, -21.3466796875, -19.92578125, -18.5048828125, -17.083984375, -15.6630859375, -14.2421875, -12.8212890625, -11.400390625, -9.9794921875, -8.55859375, -7.1376953125, -5.716796875, -4.2958984375, -2.875, -1.4541015625, -0.033203125, 1.3876953125, 2.80859375, 4.2294921875, 5.650390625, 7.0712890625, 8.4921875, 9.9130859375, 11.333984375, 12.7548828125, 14.17578125, 15.5966796875, 17.017578125, 18.4384765625, 19.859375, 21.2802734375, 22.701171875, 24.1220703125, 25.54296875, 26.9638671875, 28.384765625, 29.8056640625, 31.2265625, 32.6474609375, 34.068359375, 35.4892578125, 36.91015625, 38.3310546875, 39.751953125, 41.1728515625, 42.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 9.0, 20.0, 20.0, 33.0, 30.0, 47.0, 54.0, 79.0, 112.0, 173.0, 206.0, 275.0, 386.0, 612.0, 889.0, 1358.0, 2438.0, 4931.0, 12400.0, 45705.0, 674496.0, 252614.0, 31850.0, 9652.0, 4108.0, 2050.0, 1253.0, 834.0, 507.0, 372.0, 286.0, 198.0, 119.0, 98.0, 78.0, 60.0, 48.0, 33.0, 29.0, 16.0, 18.0, 15.0, 6.0, 4.0, 2.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-598.0, -579.2421875, -560.484375, -541.7265625, -522.96875, -504.2109375, -485.453125, -466.6953125, -447.9375, -429.1796875, -410.421875, -391.6640625, -372.90625, -354.1484375, -335.390625, -316.6328125, -297.875, -279.1171875, -260.359375, -241.6015625, -222.84375, -204.0859375, -185.328125, -166.5703125, -147.8125, -129.0546875, -110.296875, -91.5390625, -72.78125, -54.0234375, -35.265625, -16.5078125, 2.25, 21.0078125, 39.765625, 58.5234375, 77.28125, 96.0390625, 114.796875, 133.5546875, 152.3125, 171.0703125, 189.828125, 208.5859375, 227.34375, 246.1015625, 264.859375, 283.6171875, 302.375, 321.1328125, 339.890625, 358.6484375, 377.40625, 396.1640625, 414.921875, 433.6796875, 452.4375, 471.1953125, 489.953125, 508.7109375, 527.46875, 546.2265625, 564.984375, 583.7421875, 602.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 11.0, 21.0, 24.0, 57.0, 116.0, 300.0, 252.0, 105.0, 54.0, 23.0, 15.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0234375, -0.0226287841796875, -0.021820068359375, -0.0210113525390625, -0.02020263671875, -0.0193939208984375, -0.018585205078125, -0.0177764892578125, -0.0169677734375, -0.0161590576171875, -0.015350341796875, -0.0145416259765625, -0.01373291015625, -0.0129241943359375, -0.012115478515625, -0.0113067626953125, -0.010498046875, -0.0096893310546875, -0.008880615234375, -0.0080718994140625, -0.00726318359375, -0.0064544677734375, -0.005645751953125, -0.0048370361328125, -0.0040283203125, -0.0032196044921875, -0.002410888671875, -0.0016021728515625, -0.00079345703125, 1.52587890625e-05, 0.000823974609375, 0.0016326904296875, 0.00244140625, 0.0032501220703125, 0.004058837890625, 0.0048675537109375, 0.00567626953125, 0.0064849853515625, 0.007293701171875, 0.0081024169921875, 0.0089111328125, 0.0097198486328125, 0.010528564453125, 0.0113372802734375, 0.01214599609375, 0.0129547119140625, 0.013763427734375, 0.0145721435546875, 0.015380859375, 0.0161895751953125, 0.016998291015625, 0.0178070068359375, 0.01861572265625, 0.0194244384765625, 0.020233154296875, 0.0210418701171875, 0.0218505859375, 0.0226593017578125, 0.023468017578125, 0.0242767333984375, 0.02508544921875, 0.0258941650390625, 0.026702880859375, 0.0275115966796875, 0.0283203125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 5.0, 11.0, 18.0, 10.0, 22.0, 33.0, 29.0, 34.0, 47.0, 87.0, 101.0, 172.0, 201.0, 305.0, 381.0, 622.0, 1032.0, 1636.0, 3190.0, 7315.0, 27186.0, 388911.0, 570879.0, 30138.0, 7916.0, 3316.0, 1723.0, 1039.0, 648.0, 480.0, 285.0, 206.0, 136.0, 107.0, 73.0, 82.0, 34.0, 43.0, 28.0, 18.0, 7.0, 13.0, 9.0, 5.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-553.0, -533.953125, -514.90625, -495.859375, -476.8125, -457.765625, -438.71875, -419.671875, -400.625, -381.578125, -362.53125, -343.484375, -324.4375, -305.390625, -286.34375, -267.296875, -248.25, -229.203125, -210.15625, -191.109375, -172.0625, -153.015625, -133.96875, -114.921875, -95.875, -76.828125, -57.78125, -38.734375, -19.6875, -0.640625, 18.40625, 37.453125, 56.5, 75.546875, 94.59375, 113.640625, 132.6875, 151.734375, 170.78125, 189.828125, 208.875, 227.921875, 246.96875, 266.015625, 285.0625, 304.109375, 323.15625, 342.203125, 361.25, 380.296875, 399.34375, 418.390625, 437.4375, 456.484375, 475.53125, 494.578125, 513.625, 532.671875, 551.71875, 570.765625, 589.8125, 608.859375, 627.90625, 646.953125, 666.0]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 7.0, 4.0, 7.0, 11.0, 24.0, 44.0, 67.0, 124.0, 245.0, 188.0, 112.0, 81.0, 31.0, 16.0, 10.0, 1.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-173.375, -168.7900390625, -164.205078125, -159.6201171875, -155.03515625, -150.4501953125, -145.865234375, -141.2802734375, -136.6953125, -132.1103515625, -127.525390625, -122.9404296875, -118.35546875, -113.7705078125, -109.185546875, -104.6005859375, -100.015625, -95.4306640625, -90.845703125, -86.2607421875, -81.67578125, -77.0908203125, -72.505859375, -67.9208984375, -63.3359375, -58.7509765625, -54.166015625, -49.5810546875, -44.99609375, -40.4111328125, -35.826171875, -31.2412109375, -26.65625, -22.0712890625, -17.486328125, -12.9013671875, -8.31640625, -3.7314453125, 0.853515625, 5.4384765625, 10.0234375, 14.6083984375, 19.193359375, 23.7783203125, 28.36328125, 32.9482421875, 37.533203125, 42.1181640625, 46.703125, 51.2880859375, 55.873046875, 60.4580078125, 65.04296875, 69.6279296875, 74.212890625, 78.7978515625, 83.3828125, 87.9677734375, 92.552734375, 97.1376953125, 101.72265625, 106.3076171875, 110.892578125, 115.4775390625, 120.0625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 7.0, 13.0, 46.0, 108.0, 266.0, 235.0, 101.0, 66.0, 58.0, 33.0, 18.0, 14.0, 10.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.9625473022461, -63.84415054321289, -55.72575378417969, -47.60736083984375, -39.48896408081055, -31.370567321777344, -23.252174377441406, -15.133777618408203, -7.015380859375, 1.1030149459838867, 9.221410751342773, 17.339805603027344, 25.458202362060547, 33.57659912109375, 41.69499206542969, 49.81338882446289, 57.931785583496094, 66.05017852783203, 74.1685791015625, 82.28697204589844, 90.40536499023438, 98.52376556396484, 106.64215850830078, 114.76055908203125, 122.87895202636719, 130.99734497070312, 139.11573791503906, 147.234130859375, 155.3525390625, 163.47093200683594, 171.58932495117188, 179.7077178955078, 187.82614135742188, 195.9445343017578, 204.06292724609375, 212.18133544921875, 220.2997283935547, 228.41812133789062, 236.53651428222656, 244.6549072265625, 252.7733154296875, 260.8917236328125, 269.0101013183594, 277.1285095214844, 285.24688720703125, 293.36529541015625, 301.48370361328125, 309.6020812988281, 317.720458984375, 325.8388671875, 333.9572448730469, 342.0756530761719, 350.19403076171875, 358.31243896484375, 366.43084716796875, 374.5492248535156, 382.6676330566406, 390.7860412597656, 398.9044189453125, 407.0228271484375, 415.1412048339844, 423.2596130371094, 431.37799072265625, 439.49639892578125, 447.61480712890625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 7.0, 10.0, 18.0, 20.0, 20.0, 23.0, 23.0, 23.0, 24.0, 30.0, 40.0, 40.0, 41.0, 42.0, 35.0, 42.0, 39.0, 53.0, 49.0, 42.0, 51.0, 31.0, 40.0, 32.0, 28.0, 24.0, 23.0, 23.0, 20.0, 15.0, 5.0, 12.0, 13.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-61.047054290771484, -59.028282165527344, -57.0095100402832, -54.99073791503906, -52.97196578979492, -50.95319366455078, -48.934417724609375, -46.9156494140625, -44.896873474121094, -42.87810134887695, -40.85932922363281, -38.84055709838867, -36.82178497314453, -34.80301284790039, -32.78424072265625, -30.765466690063477, -28.74669647216797, -26.727924346923828, -24.709152221679688, -22.690380096435547, -20.671607971191406, -18.652835845947266, -16.634061813354492, -14.615289688110352, -12.596517562866211, -10.57774543762207, -8.55897331237793, -6.540200233459473, -4.521428108215332, -2.5026559829711914, -0.4838829040527344, 1.5348892211914062, 3.5536575317382812, 5.572429656982422, 7.591202259063721, 9.60997486114502, 11.62874698638916, 13.6475191116333, 15.666292190551758, 17.6850643157959, 19.70383644104004, 21.72260856628418, 23.74138069152832, 25.760154724121094, 27.778926849365234, 29.797698974609375, 31.816471099853516, 33.835243225097656, 35.8540153503418, 37.87278747558594, 39.89155960083008, 41.91033172607422, 43.92910385131836, 45.9478759765625, 47.966651916503906, 49.98542022705078, 52.00419616699219, 54.02296829223633, 56.04174041748047, 58.06051254272461, 60.07928466796875, 62.09805679321289, 64.11682891845703, 66.13560485839844, 68.15437316894531]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 7.0, 10.0, 13.0, 18.0, 31.0, 46.0, 66.0, 115.0, 191.0, 251.0, 407.0, 637.0, 917.0, 1432.0, 2134.0, 3240.0, 4912.0, 7250.0, 11324.0, 17886.0, 28903.0, 49726.0, 90534.0, 188390.0, 552932.0, 1868390.0, 862815.0, 247044.0, 109563.0, 58173.0, 33536.0, 19812.0, 12045.0, 7540.0, 4796.0, 3160.0, 1966.0, 1341.0, 906.0, 602.0, 411.0, 258.0, 192.0, 126.0, 81.0, 55.0, 42.0, 23.0, 13.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-86.1875, -83.4638671875, -80.740234375, -78.0166015625, -75.29296875, -72.5693359375, -69.845703125, -67.1220703125, -64.3984375, -61.6748046875, -58.951171875, -56.2275390625, -53.50390625, -50.7802734375, -48.056640625, -45.3330078125, -42.609375, -39.8857421875, -37.162109375, -34.4384765625, -31.71484375, -28.9912109375, -26.267578125, -23.5439453125, -20.8203125, -18.0966796875, -15.373046875, -12.6494140625, -9.92578125, -7.2021484375, -4.478515625, -1.7548828125, 0.96875, 3.6923828125, 6.416015625, 9.1396484375, 11.86328125, 14.5869140625, 17.310546875, 20.0341796875, 22.7578125, 25.4814453125, 28.205078125, 30.9287109375, 33.65234375, 36.3759765625, 39.099609375, 41.8232421875, 44.546875, 47.2705078125, 49.994140625, 52.7177734375, 55.44140625, 58.1650390625, 60.888671875, 63.6123046875, 66.3359375, 69.0595703125, 71.783203125, 74.5068359375, 77.23046875, 79.9541015625, 82.677734375, 85.4013671875, 88.125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 8.0, 8.0, 15.0, 11.0, 9.0, 21.0, 24.0, 19.0, 25.0, 27.0, 31.0, 35.0, 41.0, 31.0, 40.0, 42.0, 54.0, 37.0, 48.0, 40.0, 38.0, 35.0, 42.0, 49.0, 46.0, 40.0, 35.0, 23.0, 19.0, 11.0, 22.0, 10.0, 13.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.25, -32.177734375, -31.10546875, -30.033203125, -28.9609375, -27.888671875, -26.81640625, -25.744140625, -24.671875, -23.599609375, -22.52734375, -21.455078125, -20.3828125, -19.310546875, -18.23828125, -17.166015625, -16.09375, -15.021484375, -13.94921875, -12.876953125, -11.8046875, -10.732421875, -9.66015625, -8.587890625, -7.515625, -6.443359375, -5.37109375, -4.298828125, -3.2265625, -2.154296875, -1.08203125, -0.009765625, 1.0625, 2.134765625, 3.20703125, 4.279296875, 5.3515625, 6.423828125, 7.49609375, 8.568359375, 9.640625, 10.712890625, 11.78515625, 12.857421875, 13.9296875, 15.001953125, 16.07421875, 17.146484375, 18.21875, 19.291015625, 20.36328125, 21.435546875, 22.5078125, 23.580078125, 24.65234375, 25.724609375, 26.796875, 27.869140625, 28.94140625, 30.013671875, 31.0859375, 32.158203125, 33.23046875, 34.302734375, 35.375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 10.0, 10.0, 15.0, 19.0, 32.0, 57.0, 67.0, 96.0, 148.0, 232.0, 355.0, 543.0, 808.0, 1312.0, 2174.0, 3536.0, 6106.0, 10842.0, 20945.0, 43432.0, 101337.0, 293579.0, 1319212.0, 1800565.0, 366098.0, 119695.0, 49848.0, 23752.0, 12366.0, 6829.0, 3928.0, 2318.0, 1447.0, 970.0, 510.0, 350.0, 239.0, 163.0, 118.0, 73.0, 51.0, 39.0, 16.0, 10.0, 14.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-112.1875, -108.990234375, -105.79296875, -102.595703125, -99.3984375, -96.201171875, -93.00390625, -89.806640625, -86.609375, -83.412109375, -80.21484375, -77.017578125, -73.8203125, -70.623046875, -67.42578125, -64.228515625, -61.03125, -57.833984375, -54.63671875, -51.439453125, -48.2421875, -45.044921875, -41.84765625, -38.650390625, -35.453125, -32.255859375, -29.05859375, -25.861328125, -22.6640625, -19.466796875, -16.26953125, -13.072265625, -9.875, -6.677734375, -3.48046875, -0.283203125, 2.9140625, 6.111328125, 9.30859375, 12.505859375, 15.703125, 18.900390625, 22.09765625, 25.294921875, 28.4921875, 31.689453125, 34.88671875, 38.083984375, 41.28125, 44.478515625, 47.67578125, 50.873046875, 54.0703125, 57.267578125, 60.46484375, 63.662109375, 66.859375, 70.056640625, 73.25390625, 76.451171875, 79.6484375, 82.845703125, 86.04296875, 89.240234375, 92.4375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 14.0, 11.0, 17.0, 18.0, 25.0, 34.0, 53.0, 60.0, 82.0, 100.0, 129.0, 205.0, 221.0, 323.0, 395.0, 476.0, 415.0, 352.0, 267.0, 197.0, 148.0, 132.0, 90.0, 62.0, 52.0, 35.0, 39.0, 24.0, 18.0, 15.0, 13.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.59375, -22.80419921875, -22.0146484375, -21.22509765625, -20.435546875, -19.64599609375, -18.8564453125, -18.06689453125, -17.27734375, -16.48779296875, -15.6982421875, -14.90869140625, -14.119140625, -13.32958984375, -12.5400390625, -11.75048828125, -10.9609375, -10.17138671875, -9.3818359375, -8.59228515625, -7.802734375, -7.01318359375, -6.2236328125, -5.43408203125, -4.64453125, -3.85498046875, -3.0654296875, -2.27587890625, -1.486328125, -0.69677734375, 0.0927734375, 0.88232421875, 1.671875, 2.46142578125, 3.2509765625, 4.04052734375, 4.830078125, 5.61962890625, 6.4091796875, 7.19873046875, 7.98828125, 8.77783203125, 9.5673828125, 10.35693359375, 11.146484375, 11.93603515625, 12.7255859375, 13.51513671875, 14.3046875, 15.09423828125, 15.8837890625, 16.67333984375, 17.462890625, 18.25244140625, 19.0419921875, 19.83154296875, 20.62109375, 21.41064453125, 22.2001953125, 22.98974609375, 23.779296875, 24.56884765625, 25.3583984375, 26.14794921875, 26.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 6.0, 10.0, 7.0, 21.0, 22.0, 39.0, 43.0, 80.0, 130.0, 149.0, 176.0, 102.0, 59.0, 35.0, 27.0, 25.0, 14.0, 11.0, 17.0, 8.0, 3.0, 4.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.67001342773438, -91.53361511230469, -88.39722442626953, -85.26083374023438, -82.12443542480469, -78.988037109375, -75.85164642333984, -72.71525573730469, -69.578857421875, -66.44245910644531, -63.306068420410156, -60.169673919677734, -57.03327941894531, -53.89688491821289, -50.76049041748047, -47.62409591674805, -44.487701416015625, -41.3513069152832, -38.21491241455078, -35.07851791381836, -31.942123413085938, -28.805728912353516, -25.669334411621094, -22.532939910888672, -19.39654541015625, -16.260150909423828, -13.123756408691406, -9.987361907958984, -6.8509674072265625, -3.7145729064941406, -0.5781784057617188, 2.558216094970703, 5.694602966308594, 8.830997467041016, 11.967391967773438, 15.10378646850586, 18.24018096923828, 21.376575469970703, 24.512969970703125, 27.649364471435547, 30.78575897216797, 33.92215347290039, 37.05854797363281, 40.194942474365234, 43.331336975097656, 46.46773147583008, 49.6041259765625, 52.74052047729492, 55.876914978027344, 59.013309478759766, 62.14970397949219, 65.28610229492188, 68.42249298095703, 71.55888366699219, 74.69528198242188, 77.83168029785156, 80.96807098388672, 84.10446166992188, 87.24085998535156, 90.37725830078125, 93.5136489868164, 96.65003967285156, 99.78643798828125, 102.92283630371094, 106.0592269897461]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 8.0, 11.0, 5.0, 11.0, 24.0, 17.0, 29.0, 14.0, 20.0, 27.0, 30.0, 31.0, 41.0, 45.0, 44.0, 44.0, 39.0, 51.0, 55.0, 42.0, 54.0, 38.0, 39.0, 34.0, 37.0, 29.0, 29.0, 34.0, 20.0, 18.0, 16.0, 18.0, 9.0, 10.0, 10.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.01542282104492, -48.450958251953125, -46.88648986816406, -45.322025299072266, -43.7575569152832, -42.193092346191406, -40.628623962402344, -39.06415939331055, -37.49969482421875, -35.93523025512695, -34.37076187133789, -32.806297302246094, -31.24182891845703, -29.677364349365234, -28.112897872924805, -26.548431396484375, -24.983963012695312, -23.419496536254883, -21.855030059814453, -20.290565490722656, -18.726097106933594, -17.161632537841797, -15.597166061401367, -14.032699584960938, -12.468233108520508, -10.903766632080078, -9.339300155639648, -7.774834632873535, -6.2103681564331055, -4.645901679992676, -3.0814361572265625, -1.5169696807861328, 0.04749298095703125, 1.6119592189788818, 3.1764254570007324, 4.740891456604004, 6.305357933044434, 7.869824409484863, 9.434289932250977, 10.998756408691406, 12.563222885131836, 14.127689361572266, 15.692155838012695, 17.256622314453125, 18.821086883544922, 20.385555267333984, 21.95001983642578, 23.51448631286621, 25.07895278930664, 26.64341926574707, 28.2078857421875, 29.772350311279297, 31.33681869506836, 32.901283264160156, 34.46575164794922, 36.030216217041016, 37.59468078613281, 39.15914535522461, 40.72361373901367, 42.28807830810547, 43.85254669189453, 45.41701126098633, 46.981475830078125, 48.54594421386719, 50.11041259765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 11.0, 8.0, 17.0, 12.0, 16.0, 26.0, 35.0, 58.0, 84.0, 115.0, 152.0, 214.0, 339.0, 465.0, 677.0, 1017.0, 1463.0, 2119.0, 3342.0, 5153.0, 8350.0, 13634.0, 22986.0, 41725.0, 79005.0, 165973.0, 314235.0, 187983.0, 87943.0, 45735.0, 25434.0, 14607.0, 8903.0, 5762.0, 3655.0, 2331.0, 1513.0, 1092.0, 718.0, 484.0, 365.0, 240.0, 138.0, 129.0, 87.0, 70.0, 41.0, 26.0, 18.0, 14.0, 11.0, 8.0, 11.0, 5.0, 4.0, 1.0, 1.0, 2.0], "bins": [-29.5625, -28.655029296875, -27.74755859375, -26.840087890625, -25.9326171875, -25.025146484375, -24.11767578125, -23.210205078125, -22.302734375, -21.395263671875, -20.48779296875, -19.580322265625, -18.6728515625, -17.765380859375, -16.85791015625, -15.950439453125, -15.04296875, -14.135498046875, -13.22802734375, -12.320556640625, -11.4130859375, -10.505615234375, -9.59814453125, -8.690673828125, -7.783203125, -6.875732421875, -5.96826171875, -5.060791015625, -4.1533203125, -3.245849609375, -2.33837890625, -1.430908203125, -0.5234375, 0.384033203125, 1.29150390625, 2.198974609375, 3.1064453125, 4.013916015625, 4.92138671875, 5.828857421875, 6.736328125, 7.643798828125, 8.55126953125, 9.458740234375, 10.3662109375, 11.273681640625, 12.18115234375, 13.088623046875, 13.99609375, 14.903564453125, 15.81103515625, 16.718505859375, 17.6259765625, 18.533447265625, 19.44091796875, 20.348388671875, 21.255859375, 22.163330078125, 23.07080078125, 23.978271484375, 24.8857421875, 25.793212890625, 26.70068359375, 27.608154296875, 28.515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 9.0, 2.0, 9.0, 8.0, 12.0, 16.0, 19.0, 16.0, 28.0, 17.0, 20.0, 33.0, 33.0, 33.0, 41.0, 37.0, 36.0, 41.0, 45.0, 58.0, 43.0, 46.0, 56.0, 36.0, 33.0, 33.0, 28.0, 25.0, 37.0, 24.0, 25.0, 13.0, 22.0, 19.0, 15.0, 5.0, 5.0, 5.0, 6.0, 6.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-47.59375, -46.1396484375, -44.685546875, -43.2314453125, -41.77734375, -40.3232421875, -38.869140625, -37.4150390625, -35.9609375, -34.5068359375, -33.052734375, -31.5986328125, -30.14453125, -28.6904296875, -27.236328125, -25.7822265625, -24.328125, -22.8740234375, -21.419921875, -19.9658203125, -18.51171875, -17.0576171875, -15.603515625, -14.1494140625, -12.6953125, -11.2412109375, -9.787109375, -8.3330078125, -6.87890625, -5.4248046875, -3.970703125, -2.5166015625, -1.0625, 0.3916015625, 1.845703125, 3.2998046875, 4.75390625, 6.2080078125, 7.662109375, 9.1162109375, 10.5703125, 12.0244140625, 13.478515625, 14.9326171875, 16.38671875, 17.8408203125, 19.294921875, 20.7490234375, 22.203125, 23.6572265625, 25.111328125, 26.5654296875, 28.01953125, 29.4736328125, 30.927734375, 32.3818359375, 33.8359375, 35.2900390625, 36.744140625, 38.1982421875, 39.65234375, 41.1064453125, 42.560546875, 44.0146484375, 45.46875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 6.0, 5.0, 12.0, 13.0, 13.0, 31.0, 30.0, 44.0, 61.0, 85.0, 109.0, 156.0, 209.0, 306.0, 347.0, 531.0, 671.0, 1019.0, 1567.0, 2445.0, 3973.0, 6883.0, 14125.0, 33664.0, 110224.0, 551425.0, 223279.0, 53927.0, 20034.0, 9164.0, 4994.0, 2984.0, 1938.0, 1264.0, 890.0, 567.0, 423.0, 312.0, 233.0, 164.0, 109.0, 89.0, 72.0, 34.0, 36.0, 31.0, 19.0, 14.0, 8.0, 4.0, 9.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.53125, -41.10009765625, -39.6689453125, -38.23779296875, -36.806640625, -35.37548828125, -33.9443359375, -32.51318359375, -31.08203125, -29.65087890625, -28.2197265625, -26.78857421875, -25.357421875, -23.92626953125, -22.4951171875, -21.06396484375, -19.6328125, -18.20166015625, -16.7705078125, -15.33935546875, -13.908203125, -12.47705078125, -11.0458984375, -9.61474609375, -8.18359375, -6.75244140625, -5.3212890625, -3.89013671875, -2.458984375, -1.02783203125, 0.4033203125, 1.83447265625, 3.265625, 4.69677734375, 6.1279296875, 7.55908203125, 8.990234375, 10.42138671875, 11.8525390625, 13.28369140625, 14.71484375, 16.14599609375, 17.5771484375, 19.00830078125, 20.439453125, 21.87060546875, 23.3017578125, 24.73291015625, 26.1640625, 27.59521484375, 29.0263671875, 30.45751953125, 31.888671875, 33.31982421875, 34.7509765625, 36.18212890625, 37.61328125, 39.04443359375, 40.4755859375, 41.90673828125, 43.337890625, 44.76904296875, 46.2001953125, 47.63134765625, 49.0625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 7.0, 10.0, 12.0, 19.0, 26.0, 21.0, 28.0, 28.0, 25.0, 32.0, 39.0, 45.0, 49.0, 36.0, 54.0, 53.0, 45.0, 44.0, 43.0, 47.0, 33.0, 37.0, 35.0, 28.0, 21.0, 25.0, 20.0, 22.0, 19.0, 10.0, 14.0, 12.0, 14.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-31.125, -30.191650390625, -29.25830078125, -28.324951171875, -27.3916015625, -26.458251953125, -25.52490234375, -24.591552734375, -23.658203125, -22.724853515625, -21.79150390625, -20.858154296875, -19.9248046875, -18.991455078125, -18.05810546875, -17.124755859375, -16.19140625, -15.258056640625, -14.32470703125, -13.391357421875, -12.4580078125, -11.524658203125, -10.59130859375, -9.657958984375, -8.724609375, -7.791259765625, -6.85791015625, -5.924560546875, -4.9912109375, -4.057861328125, -3.12451171875, -2.191162109375, -1.2578125, -0.324462890625, 0.60888671875, 1.542236328125, 2.4755859375, 3.408935546875, 4.34228515625, 5.275634765625, 6.208984375, 7.142333984375, 8.07568359375, 9.009033203125, 9.9423828125, 10.875732421875, 11.80908203125, 12.742431640625, 13.67578125, 14.609130859375, 15.54248046875, 16.475830078125, 17.4091796875, 18.342529296875, 19.27587890625, 20.209228515625, 21.142578125, 22.075927734375, 23.00927734375, 23.942626953125, 24.8759765625, 25.809326171875, 26.74267578125, 27.676025390625, 28.609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 4.0, 8.0, 10.0, 17.0, 21.0, 31.0, 33.0, 51.0, 69.0, 122.0, 125.0, 197.0, 248.0, 327.0, 457.0, 686.0, 955.0, 1305.0, 1993.0, 2945.0, 4826.0, 7976.0, 15325.0, 36151.0, 166087.0, 664054.0, 86993.0, 26328.0, 12102.0, 6716.0, 3974.0, 2477.0, 1649.0, 1207.0, 865.0, 612.0, 453.0, 289.0, 220.0, 167.0, 129.0, 92.0, 78.0, 52.0, 32.0, 26.0, 16.0, 12.0, 8.0, 10.0, 10.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.1640625, -10.8077392578125, -10.451416015625, -10.0950927734375, -9.73876953125, -9.3824462890625, -9.026123046875, -8.6697998046875, -8.3134765625, -7.9571533203125, -7.600830078125, -7.2445068359375, -6.88818359375, -6.5318603515625, -6.175537109375, -5.8192138671875, -5.462890625, -5.1065673828125, -4.750244140625, -4.3939208984375, -4.03759765625, -3.6812744140625, -3.324951171875, -2.9686279296875, -2.6123046875, -2.2559814453125, -1.899658203125, -1.5433349609375, -1.18701171875, -0.8306884765625, -0.474365234375, -0.1180419921875, 0.23828125, 0.5946044921875, 0.950927734375, 1.3072509765625, 1.66357421875, 2.0198974609375, 2.376220703125, 2.7325439453125, 3.0888671875, 3.4451904296875, 3.801513671875, 4.1578369140625, 4.51416015625, 4.8704833984375, 5.226806640625, 5.5831298828125, 5.939453125, 6.2957763671875, 6.652099609375, 7.0084228515625, 7.36474609375, 7.7210693359375, 8.077392578125, 8.4337158203125, 8.7900390625, 9.1463623046875, 9.502685546875, 9.8590087890625, 10.21533203125, 10.5716552734375, 10.927978515625, 11.2843017578125, 11.640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 9.0, 2.0, 14.0, 13.0, 16.0, 16.0, 27.0, 30.0, 31.0, 49.0, 52.0, 58.0, 84.0, 81.0, 83.0, 83.0, 67.0, 63.0, 37.0, 39.0, 37.0, 22.0, 18.0, 15.0, 13.0, 5.0, 8.0, 7.0, 6.0, 3.0, 1.0, 7.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007672309875488281, -0.0007407888770103455, -0.0007143467664718628, -0.0006879046559333801, -0.0006614625453948975, -0.0006350204348564148, -0.0006085783243179321, -0.0005821362137794495, -0.0005556941032409668, -0.0005292519927024841, -0.0005028098821640015, -0.0004763677716255188, -0.00044992566108703613, -0.00042348355054855347, -0.0003970414400100708, -0.00037059932947158813, -0.00034415721893310547, -0.0003177151083946228, -0.00029127299785614014, -0.00026483088731765747, -0.0002383887767791748, -0.00021194666624069214, -0.00018550455570220947, -0.0001590624451637268, -0.00013262033462524414, -0.00010617822408676147, -7.973611354827881e-05, -5.329400300979614e-05, -2.6851892471313477e-05, -4.0978193283081055e-07, 2.6032328605651855e-05, 5.247443914413452e-05, 7.891654968261719e-05, 0.00010535866022109985, 0.00013180077075958252, 0.00015824288129806519, 0.00018468499183654785, 0.00021112710237503052, 0.00023756921291351318, 0.00026401132345199585, 0.0002904534339904785, 0.0003168955445289612, 0.00034333765506744385, 0.0003697797656059265, 0.0003962218761444092, 0.00042266398668289185, 0.0004491060972213745, 0.0004755482077598572, 0.0005019903182983398, 0.0005284324288368225, 0.0005548745393753052, 0.0005813166499137878, 0.0006077587604522705, 0.0006342008709907532, 0.0006606429815292358, 0.0006870850920677185, 0.0007135272026062012, 0.0007399693131446838, 0.0007664114236831665, 0.0007928535342216492, 0.0008192956447601318, 0.0008457377552986145, 0.0008721798658370972, 0.0008986219763755798, 0.0009250640869140625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 3.0, 10.0, 17.0, 12.0, 26.0, 26.0, 25.0, 51.0, 55.0, 93.0, 124.0, 186.0, 253.0, 363.0, 525.0, 741.0, 1022.0, 1561.0, 2327.0, 3571.0, 5583.0, 9238.0, 16045.0, 29734.0, 62203.0, 168081.0, 469601.0, 151104.0, 57871.0, 28023.0, 15318.0, 8756.0, 5350.0, 3390.0, 2310.0, 1526.0, 1049.0, 700.0, 492.0, 310.0, 254.0, 180.0, 142.0, 79.0, 73.0, 43.0, 27.0, 28.0, 21.0, 12.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5703125, -12.1435546875, -11.716796875, -11.2900390625, -10.86328125, -10.4365234375, -10.009765625, -9.5830078125, -9.15625, -8.7294921875, -8.302734375, -7.8759765625, -7.44921875, -7.0224609375, -6.595703125, -6.1689453125, -5.7421875, -5.3154296875, -4.888671875, -4.4619140625, -4.03515625, -3.6083984375, -3.181640625, -2.7548828125, -2.328125, -1.9013671875, -1.474609375, -1.0478515625, -0.62109375, -0.1943359375, 0.232421875, 0.6591796875, 1.0859375, 1.5126953125, 1.939453125, 2.3662109375, 2.79296875, 3.2197265625, 3.646484375, 4.0732421875, 4.5, 4.9267578125, 5.353515625, 5.7802734375, 6.20703125, 6.6337890625, 7.060546875, 7.4873046875, 7.9140625, 8.3408203125, 8.767578125, 9.1943359375, 9.62109375, 10.0478515625, 10.474609375, 10.9013671875, 11.328125, 11.7548828125, 12.181640625, 12.6083984375, 13.03515625, 13.4619140625, 13.888671875, 14.3154296875, 14.7421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 7.0, 8.0, 11.0, 8.0, 3.0, 9.0, 18.0, 17.0, 19.0, 22.0, 28.0, 22.0, 34.0, 43.0, 34.0, 52.0, 67.0, 86.0, 67.0, 50.0, 61.0, 55.0, 50.0, 35.0, 30.0, 22.0, 20.0, 13.0, 16.0, 20.0, 13.0, 9.0, 7.0, 15.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.810546875, -3.699493408203125, -3.58843994140625, -3.477386474609375, -3.3663330078125, -3.255279541015625, -3.14422607421875, -3.033172607421875, -2.922119140625, -2.811065673828125, -2.70001220703125, -2.588958740234375, -2.4779052734375, -2.366851806640625, -2.25579833984375, -2.144744873046875, -2.03369140625, -1.922637939453125, -1.81158447265625, -1.700531005859375, -1.5894775390625, -1.478424072265625, -1.36737060546875, -1.256317138671875, -1.145263671875, -1.034210205078125, -0.92315673828125, -0.812103271484375, -0.7010498046875, -0.589996337890625, -0.47894287109375, -0.367889404296875, -0.2568359375, -0.145782470703125, -0.03472900390625, 0.076324462890625, 0.1873779296875, 0.298431396484375, 0.40948486328125, 0.520538330078125, 0.631591796875, 0.742645263671875, 0.85369873046875, 0.964752197265625, 1.0758056640625, 1.186859130859375, 1.29791259765625, 1.408966064453125, 1.52001953125, 1.631072998046875, 1.74212646484375, 1.853179931640625, 1.9642333984375, 2.075286865234375, 2.18634033203125, 2.297393798828125, 2.408447265625, 2.519500732421875, 2.63055419921875, 2.741607666015625, 2.8526611328125, 2.963714599609375, 3.07476806640625, 3.185821533203125, 3.296875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 8.0, 16.0, 15.0, 30.0, 49.0, 71.0, 113.0, 157.0, 184.0, 109.0, 69.0, 44.0, 29.0, 25.0, 11.0, 17.0, 9.0, 12.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.4000473022461, -87.19126892089844, -83.98249816894531, -80.77371978759766, -77.56494140625, -74.35617065429688, -71.14739227294922, -67.93861389160156, -64.72984313964844, -61.52106857299805, -58.31229019165039, -55.103515625, -51.894737243652344, -48.68596267700195, -45.47718811035156, -42.268409729003906, -39.05963134765625, -35.85085678100586, -32.6420783996582, -29.433303833007812, -26.22452735900879, -23.015750885009766, -19.806976318359375, -16.59819984436035, -13.389423370361328, -10.180646896362305, -6.971871376037598, -3.7630958557128906, -0.5543193817138672, 2.6544570922851562, 5.863231658935547, 9.07200813293457, 12.280792236328125, 15.489568710327148, 18.698345184326172, 21.907119750976562, 25.115896224975586, 28.32467269897461, 31.533447265625, 34.742225646972656, 37.95100021362305, 41.15977478027344, 44.368553161621094, 47.577327728271484, 50.786102294921875, 53.99488067626953, 57.20365524291992, 60.41242980957031, 63.62120819091797, 66.82998657226562, 70.03875732421875, 73.2475357055664, 76.45631408691406, 79.66508483886719, 82.87386322021484, 86.0826416015625, 89.29141235351562, 92.50019073486328, 95.7089614868164, 98.91773986816406, 102.12651824951172, 105.33529663085938, 108.5440673828125, 111.75284576416016, 114.96162414550781]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 2.0, 9.0, 8.0, 9.0, 10.0, 21.0, 20.0, 19.0, 27.0, 16.0, 23.0, 44.0, 32.0, 43.0, 30.0, 40.0, 54.0, 48.0, 44.0, 55.0, 40.0, 49.0, 46.0, 41.0, 37.0, 22.0, 28.0, 44.0, 26.0, 19.0, 17.0, 17.0, 14.0, 12.0, 10.0, 8.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.114906311035156, -47.572784423828125, -46.030662536621094, -44.4885368347168, -42.946414947509766, -41.404293060302734, -39.86216735839844, -38.320045471191406, -36.777923583984375, -35.235801696777344, -33.69367980957031, -32.151554107666016, -30.609432220458984, -29.067310333251953, -27.52518653869629, -25.983062744140625, -24.440940856933594, -22.898818969726562, -21.3566951751709, -19.814571380615234, -18.272449493408203, -16.730327606201172, -15.188203811645508, -13.64608097076416, -12.103958129882812, -10.561835289001465, -9.019712448120117, -7.4775896072387695, -5.935466766357422, -4.393343925476074, -2.8512210845947266, -1.309098243713379, 0.23302841186523438, 1.775151252746582, 3.3172740936279297, 4.859396934509277, 6.401519775390625, 7.943642616271973, 9.48576545715332, 11.027888298034668, 12.570011138916016, 14.112133979797363, 15.654256820678711, 17.196380615234375, 18.738502502441406, 20.280624389648438, 21.8227481842041, 23.364871978759766, 24.906993865966797, 26.449115753173828, 27.991239547729492, 29.533363342285156, 31.075485229492188, 32.61760711669922, 34.15972900390625, 35.70185470581055, 37.24397659301758, 38.78609848022461, 40.328224182128906, 41.87034606933594, 43.41246795654297, 44.95458984375, 46.49671173095703, 48.03883743286133, 49.58095932006836]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 5.0, 12.0, 15.0, 27.0, 40.0, 74.0, 89.0, 161.0, 199.0, 309.0, 482.0, 757.0, 1101.0, 1646.0, 2594.0, 4264.0, 6620.0, 10591.0, 17329.0, 29169.0, 48649.0, 82952.0, 144886.0, 232684.0, 191867.0, 110305.0, 64080.0, 37876.0, 22492.0, 13701.0, 8463.0, 5386.0, 3458.0, 2229.0, 1386.0, 956.0, 581.0, 370.0, 254.0, 157.0, 121.0, 69.0, 45.0, 40.0, 28.0, 11.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-64.1875, -62.2861328125, -60.384765625, -58.4833984375, -56.58203125, -54.6806640625, -52.779296875, -50.8779296875, -48.9765625, -47.0751953125, -45.173828125, -43.2724609375, -41.37109375, -39.4697265625, -37.568359375, -35.6669921875, -33.765625, -31.8642578125, -29.962890625, -28.0615234375, -26.16015625, -24.2587890625, -22.357421875, -20.4560546875, -18.5546875, -16.6533203125, -14.751953125, -12.8505859375, -10.94921875, -9.0478515625, -7.146484375, -5.2451171875, -3.34375, -1.4423828125, 0.458984375, 2.3603515625, 4.26171875, 6.1630859375, 8.064453125, 9.9658203125, 11.8671875, 13.7685546875, 15.669921875, 17.5712890625, 19.47265625, 21.3740234375, 23.275390625, 25.1767578125, 27.078125, 28.9794921875, 30.880859375, 32.7822265625, 34.68359375, 36.5849609375, 38.486328125, 40.3876953125, 42.2890625, 44.1904296875, 46.091796875, 47.9931640625, 49.89453125, 51.7958984375, 53.697265625, 55.5986328125, 57.5]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 9.0, 12.0, 8.0, 20.0, 13.0, 25.0, 27.0, 27.0, 36.0, 37.0, 34.0, 44.0, 38.0, 46.0, 54.0, 51.0, 58.0, 45.0, 36.0, 50.0, 46.0, 31.0, 38.0, 34.0, 26.0, 29.0, 20.0, 24.0, 15.0, 18.0, 5.0, 3.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21875, -39.74267578125, -38.2666015625, -36.79052734375, -35.314453125, -33.83837890625, -32.3623046875, -30.88623046875, -29.41015625, -27.93408203125, -26.4580078125, -24.98193359375, -23.505859375, -22.02978515625, -20.5537109375, -19.07763671875, -17.6015625, -16.12548828125, -14.6494140625, -13.17333984375, -11.697265625, -10.22119140625, -8.7451171875, -7.26904296875, -5.79296875, -4.31689453125, -2.8408203125, -1.36474609375, 0.111328125, 1.58740234375, 3.0634765625, 4.53955078125, 6.015625, 7.49169921875, 8.9677734375, 10.44384765625, 11.919921875, 13.39599609375, 14.8720703125, 16.34814453125, 17.82421875, 19.30029296875, 20.7763671875, 22.25244140625, 23.728515625, 25.20458984375, 26.6806640625, 28.15673828125, 29.6328125, 31.10888671875, 32.5849609375, 34.06103515625, 35.537109375, 37.01318359375, 38.4892578125, 39.96533203125, 41.44140625, 42.91748046875, 44.3935546875, 45.86962890625, 47.345703125, 48.82177734375, 50.2978515625, 51.77392578125, 53.25]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 11.0, 12.0, 23.0, 32.0, 38.0, 65.0, 118.0, 150.0, 232.0, 353.0, 535.0, 818.0, 1336.0, 2129.0, 3439.0, 5763.0, 10039.0, 18219.0, 34461.0, 69163.0, 154002.0, 345366.0, 214185.0, 90856.0, 44249.0, 22739.0, 12314.0, 6907.0, 4052.0, 2554.0, 1566.0, 985.0, 624.0, 409.0, 262.0, 202.0, 126.0, 78.0, 53.0, 22.0, 24.0, 12.0, 11.0, 5.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-96.5625, -93.6953125, -90.828125, -87.9609375, -85.09375, -82.2265625, -79.359375, -76.4921875, -73.625, -70.7578125, -67.890625, -65.0234375, -62.15625, -59.2890625, -56.421875, -53.5546875, -50.6875, -47.8203125, -44.953125, -42.0859375, -39.21875, -36.3515625, -33.484375, -30.6171875, -27.75, -24.8828125, -22.015625, -19.1484375, -16.28125, -13.4140625, -10.546875, -7.6796875, -4.8125, -1.9453125, 0.921875, 3.7890625, 6.65625, 9.5234375, 12.390625, 15.2578125, 18.125, 20.9921875, 23.859375, 26.7265625, 29.59375, 32.4609375, 35.328125, 38.1953125, 41.0625, 43.9296875, 46.796875, 49.6640625, 52.53125, 55.3984375, 58.265625, 61.1328125, 64.0, 66.8671875, 69.734375, 72.6015625, 75.46875, 78.3359375, 81.203125, 84.0703125, 86.9375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 4.0, 7.0, 9.0, 5.0, 8.0, 12.0, 17.0, 27.0, 27.0, 26.0, 49.0, 34.0, 35.0, 46.0, 37.0, 41.0, 36.0, 39.0, 40.0, 48.0, 46.0, 44.0, 35.0, 35.0, 28.0, 41.0, 26.0, 30.0, 30.0, 17.0, 22.0, 15.0, 15.0, 12.0, 15.0, 11.0, 5.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.41748046875, -31.1787109375, -29.93994140625, -28.701171875, -27.46240234375, -26.2236328125, -24.98486328125, -23.74609375, -22.50732421875, -21.2685546875, -20.02978515625, -18.791015625, -17.55224609375, -16.3134765625, -15.07470703125, -13.8359375, -12.59716796875, -11.3583984375, -10.11962890625, -8.880859375, -7.64208984375, -6.4033203125, -5.16455078125, -3.92578125, -2.68701171875, -1.4482421875, -0.20947265625, 1.029296875, 2.26806640625, 3.5068359375, 4.74560546875, 5.984375, 7.22314453125, 8.4619140625, 9.70068359375, 10.939453125, 12.17822265625, 13.4169921875, 14.65576171875, 15.89453125, 17.13330078125, 18.3720703125, 19.61083984375, 20.849609375, 22.08837890625, 23.3271484375, 24.56591796875, 25.8046875, 27.04345703125, 28.2822265625, 29.52099609375, 30.759765625, 31.99853515625, 33.2373046875, 34.47607421875, 35.71484375, 36.95361328125, 38.1923828125, 39.43115234375, 40.669921875, 41.90869140625, 43.1474609375, 44.38623046875, 45.625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 11.0, 13.0, 22.0, 25.0, 52.0, 52.0, 84.0, 146.0, 202.0, 350.0, 628.0, 1270.0, 3150.0, 9023.0, 36277.0, 582271.0, 369440.0, 31663.0, 8338.0, 2831.0, 1229.0, 562.0, 303.0, 202.0, 120.0, 77.0, 66.0, 40.0, 27.0, 21.0, 16.0, 9.0, 10.0, 7.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-580.0, -557.65625, -535.3125, -512.96875, -490.625, -468.28125, -445.9375, -423.59375, -401.25, -378.90625, -356.5625, -334.21875, -311.875, -289.53125, -267.1875, -244.84375, -222.5, -200.15625, -177.8125, -155.46875, -133.125, -110.78125, -88.4375, -66.09375, -43.75, -21.40625, 0.9375, 23.28125, 45.625, 67.96875, 90.3125, 112.65625, 135.0, 157.34375, 179.6875, 202.03125, 224.375, 246.71875, 269.0625, 291.40625, 313.75, 336.09375, 358.4375, 380.78125, 403.125, 425.46875, 447.8125, 470.15625, 492.5, 514.84375, 537.1875, 559.53125, 581.875, 604.21875, 626.5625, 648.90625, 671.25, 693.59375, 715.9375, 738.28125, 760.625, 782.96875, 805.3125, 827.65625, 850.0]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 16.0, 17.0, 19.0, 45.0, 86.0, 131.0, 167.0, 195.0, 123.0, 81.0, 47.0, 29.0, 17.0, 9.0, 6.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01904296875, -0.0185546875, -0.01806640625, -0.017578125, -0.01708984375, -0.0166015625, -0.01611328125, -0.015625, -0.01513671875, -0.0146484375, -0.01416015625, -0.013671875, -0.01318359375, -0.0126953125, -0.01220703125, -0.01171875, -0.01123046875, -0.0107421875, -0.01025390625, -0.009765625, -0.00927734375, -0.0087890625, -0.00830078125, -0.0078125, -0.00732421875, -0.0068359375, -0.00634765625, -0.005859375, -0.00537109375, -0.0048828125, -0.00439453125, -0.00390625, -0.00341796875, -0.0029296875, -0.00244140625, -0.001953125, -0.00146484375, -0.0009765625, -0.00048828125, 0.0, 0.00048828125, 0.0009765625, 0.00146484375, 0.001953125, 0.00244140625, 0.0029296875, 0.00341796875, 0.00390625, 0.00439453125, 0.0048828125, 0.00537109375, 0.005859375, 0.00634765625, 0.0068359375, 0.00732421875, 0.0078125, 0.00830078125, 0.0087890625, 0.00927734375, 0.009765625, 0.01025390625, 0.0107421875, 0.01123046875, 0.01171875, 0.01220703125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 13.0, 15.0, 25.0, 29.0, 37.0, 53.0, 73.0, 113.0, 144.0, 219.0, 355.0, 565.0, 895.0, 1612.0, 3279.0, 8632.0, 32096.0, 266337.0, 664056.0, 49395.0, 11728.0, 4126.0, 1926.0, 970.0, 656.0, 380.0, 245.0, 161.0, 117.0, 86.0, 51.0, 48.0, 28.0, 20.0, 21.0, 8.0, 13.0, 3.0, 10.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-565.0, -548.4453125, -531.890625, -515.3359375, -498.78125, -482.2265625, -465.671875, -449.1171875, -432.5625, -416.0078125, -399.453125, -382.8984375, -366.34375, -349.7890625, -333.234375, -316.6796875, -300.125, -283.5703125, -267.015625, -250.4609375, -233.90625, -217.3515625, -200.796875, -184.2421875, -167.6875, -151.1328125, -134.578125, -118.0234375, -101.46875, -84.9140625, -68.359375, -51.8046875, -35.25, -18.6953125, -2.140625, 14.4140625, 30.96875, 47.5234375, 64.078125, 80.6328125, 97.1875, 113.7421875, 130.296875, 146.8515625, 163.40625, 179.9609375, 196.515625, 213.0703125, 229.625, 246.1796875, 262.734375, 279.2890625, 295.84375, 312.3984375, 328.953125, 345.5078125, 362.0625, 378.6171875, 395.171875, 411.7265625, 428.28125, 444.8359375, 461.390625, 477.9453125, 494.5]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 20.0, 46.0, 66.0, 95.0, 137.0, 159.0, 122.0, 118.0, 75.0, 55.0, 30.0, 16.0, 13.0, 6.0, 4.0, 3.0, 1.0, 6.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.875, -108.10546875, -104.3359375, -100.56640625, -96.796875, -93.02734375, -89.2578125, -85.48828125, -81.71875, -77.94921875, -74.1796875, -70.41015625, -66.640625, -62.87109375, -59.1015625, -55.33203125, -51.5625, -47.79296875, -44.0234375, -40.25390625, -36.484375, -32.71484375, -28.9453125, -25.17578125, -21.40625, -17.63671875, -13.8671875, -10.09765625, -6.328125, -2.55859375, 1.2109375, 4.98046875, 8.75, 12.51953125, 16.2890625, 20.05859375, 23.828125, 27.59765625, 31.3671875, 35.13671875, 38.90625, 42.67578125, 46.4453125, 50.21484375, 53.984375, 57.75390625, 61.5234375, 65.29296875, 69.0625, 72.83203125, 76.6015625, 80.37109375, 84.140625, 87.91015625, 91.6796875, 95.44921875, 99.21875, 102.98828125, 106.7578125, 110.52734375, 114.296875, 118.06640625, 121.8359375, 125.60546875, 129.375]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 16.0, 34.0, 121.0, 248.0, 223.0, 126.0, 54.0, 70.0, 28.0, 14.0, 17.0, 14.0, 6.0, 9.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.37152862548828, -68.08378601074219, -61.796043395996094, -55.508304595947266, -49.22056198120117, -42.93281936645508, -36.64508056640625, -30.357337951660156, -24.069595336914062, -17.78185272216797, -11.494112014770508, -5.206371307373047, 1.0813713073730469, 7.369113922119141, 13.656852722167969, 19.944595336914062, 26.232337951660156, 32.52008056640625, 38.807823181152344, 45.09556198120117, 51.383304595947266, 57.67104721069336, 63.95878601074219, 70.24652862548828, 76.53427124023438, 82.82201385498047, 89.10975646972656, 95.39749145507812, 101.68524169921875, 107.97297668457031, 114.2607192993164, 120.5484619140625, 126.83621215820312, 133.1239471435547, 139.4116973876953, 145.69943237304688, 151.9871826171875, 158.27491760253906, 164.56265258789062, 170.85040283203125, 177.13815307617188, 183.42588806152344, 189.71363830566406, 196.00137329101562, 202.28912353515625, 208.5768585205078, 214.86459350585938, 221.15234375, 227.44007873535156, 233.72781372070312, 240.01556396484375, 246.3032989501953, 252.59104919433594, 258.8787841796875, 265.1665344238281, 271.45428466796875, 277.74200439453125, 284.0297546386719, 290.3174743652344, 296.605224609375, 302.8929748535156, 309.18072509765625, 315.46844482421875, 321.7561950683594, 328.0439453125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 7.0, 9.0, 7.0, 6.0, 14.0, 11.0, 18.0, 19.0, 19.0, 27.0, 26.0, 28.0, 36.0, 31.0, 42.0, 33.0, 39.0, 45.0, 39.0, 50.0, 40.0, 32.0, 45.0, 44.0, 42.0, 30.0, 29.0, 30.0, 28.0, 30.0, 22.0, 17.0, 17.0, 14.0, 15.0, 12.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-55.0633544921875, -53.438804626464844, -51.81425476074219, -50.18970489501953, -48.56515884399414, -46.940608978271484, -45.31605911254883, -43.69150924682617, -42.06696319580078, -40.442413330078125, -38.81786346435547, -37.19331359863281, -35.56876754760742, -33.944217681884766, -32.31966781616211, -30.695117950439453, -29.070568084716797, -27.44601821899414, -25.821470260620117, -24.19692039489746, -22.572372436523438, -20.94782257080078, -19.323272705078125, -17.69872283935547, -16.074174880981445, -14.449625968933105, -12.825077056884766, -11.20052719116211, -9.57597827911377, -7.95142936706543, -6.326879501342773, -4.702330589294434, -3.0777816772460938, -1.4532325267791748, 0.17131662368774414, 1.7958660125732422, 3.420414924621582, 5.044963836669922, 6.669513702392578, 8.294062614440918, 9.918611526489258, 11.543160438537598, 13.167709350585938, 14.792259216308594, 16.41680908203125, 18.041357040405273, 19.66590690612793, 21.290454864501953, 22.91500473022461, 24.539554595947266, 26.16410255432129, 27.788652420043945, 29.41320037841797, 31.037750244140625, 32.66230010986328, 34.28684997558594, 35.911399841308594, 37.53594970703125, 39.160499572753906, 40.78504943847656, 42.40959548950195, 44.03414535522461, 45.658695220947266, 47.28324508666992, 48.90779113769531]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 10.0, 17.0, 26.0, 43.0, 51.0, 87.0, 95.0, 157.0, 287.0, 526.0, 809.0, 1576.0, 2754.0, 4767.0, 9286.0, 18129.0, 37079.0, 84075.0, 232381.0, 1317713.0, 1985944.0, 306407.0, 101585.0, 44773.0, 21665.0, 11050.0, 5778.0, 3063.0, 1617.0, 984.0, 590.0, 334.0, 201.0, 161.0, 90.0, 63.0, 43.0, 20.0, 16.0, 15.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.5625, -95.39453125, -92.2265625, -89.05859375, -85.890625, -82.72265625, -79.5546875, -76.38671875, -73.21875, -70.05078125, -66.8828125, -63.71484375, -60.546875, -57.37890625, -54.2109375, -51.04296875, -47.875, -44.70703125, -41.5390625, -38.37109375, -35.203125, -32.03515625, -28.8671875, -25.69921875, -22.53125, -19.36328125, -16.1953125, -13.02734375, -9.859375, -6.69140625, -3.5234375, -0.35546875, 2.8125, 5.98046875, 9.1484375, 12.31640625, 15.484375, 18.65234375, 21.8203125, 24.98828125, 28.15625, 31.32421875, 34.4921875, 37.66015625, 40.828125, 43.99609375, 47.1640625, 50.33203125, 53.5, 56.66796875, 59.8359375, 63.00390625, 66.171875, 69.33984375, 72.5078125, 75.67578125, 78.84375, 82.01171875, 85.1796875, 88.34765625, 91.515625, 94.68359375, 97.8515625, 101.01953125, 104.1875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 9.0, 17.0, 20.0, 13.0, 25.0, 27.0, 29.0, 45.0, 44.0, 29.0, 43.0, 51.0, 51.0, 52.0, 65.0, 52.0, 48.0, 55.0, 38.0, 46.0, 41.0, 31.0, 29.0, 27.0, 29.0, 13.0, 14.0, 16.0, 6.0, 5.0, 7.0, 5.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -33.10986328125, -32.0634765625, -31.01708984375, -29.970703125, -28.92431640625, -27.8779296875, -26.83154296875, -25.78515625, -24.73876953125, -23.6923828125, -22.64599609375, -21.599609375, -20.55322265625, -19.5068359375, -18.46044921875, -17.4140625, -16.36767578125, -15.3212890625, -14.27490234375, -13.228515625, -12.18212890625, -11.1357421875, -10.08935546875, -9.04296875, -7.99658203125, -6.9501953125, -5.90380859375, -4.857421875, -3.81103515625, -2.7646484375, -1.71826171875, -0.671875, 0.37451171875, 1.4208984375, 2.46728515625, 3.513671875, 4.56005859375, 5.6064453125, 6.65283203125, 7.69921875, 8.74560546875, 9.7919921875, 10.83837890625, 11.884765625, 12.93115234375, 13.9775390625, 15.02392578125, 16.0703125, 17.11669921875, 18.1630859375, 19.20947265625, 20.255859375, 21.30224609375, 22.3486328125, 23.39501953125, 24.44140625, 25.48779296875, 26.5341796875, 27.58056640625, 28.626953125, 29.67333984375, 30.7197265625, 31.76611328125, 32.8125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 3.0, 11.0, 10.0, 8.0, 18.0, 32.0, 41.0, 65.0, 108.0, 136.0, 187.0, 291.0, 450.0, 689.0, 1091.0, 1765.0, 2739.0, 4534.0, 7938.0, 13572.0, 25865.0, 52170.0, 119297.0, 333108.0, 1432035.0, 1594912.0, 360423.0, 125944.0, 54529.0, 26980.0, 14574.0, 8053.0, 4756.0, 2924.0, 1797.0, 1095.0, 708.0, 484.0, 289.0, 216.0, 156.0, 104.0, 59.0, 47.0, 20.0, 13.0, 19.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-77.625, -75.4091796875, -73.193359375, -70.9775390625, -68.76171875, -66.5458984375, -64.330078125, -62.1142578125, -59.8984375, -57.6826171875, -55.466796875, -53.2509765625, -51.03515625, -48.8193359375, -46.603515625, -44.3876953125, -42.171875, -39.9560546875, -37.740234375, -35.5244140625, -33.30859375, -31.0927734375, -28.876953125, -26.6611328125, -24.4453125, -22.2294921875, -20.013671875, -17.7978515625, -15.58203125, -13.3662109375, -11.150390625, -8.9345703125, -6.71875, -4.5029296875, -2.287109375, -0.0712890625, 2.14453125, 4.3603515625, 6.576171875, 8.7919921875, 11.0078125, 13.2236328125, 15.439453125, 17.6552734375, 19.87109375, 22.0869140625, 24.302734375, 26.5185546875, 28.734375, 30.9501953125, 33.166015625, 35.3818359375, 37.59765625, 39.8134765625, 42.029296875, 44.2451171875, 46.4609375, 48.6767578125, 50.892578125, 53.1083984375, 55.32421875, 57.5400390625, 59.755859375, 61.9716796875, 64.1875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 4.0, 6.0, 9.0, 14.0, 18.0, 17.0, 24.0, 28.0, 37.0, 42.0, 63.0, 65.0, 79.0, 98.0, 113.0, 146.0, 161.0, 233.0, 267.0, 315.0, 341.0, 351.0, 288.0, 244.0, 192.0, 159.0, 161.0, 109.0, 77.0, 62.0, 62.0, 45.0, 44.0, 34.0, 24.0, 13.0, 29.0, 17.0, 11.0, 6.0, 10.0, 9.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.375, -12.91259765625, -12.4501953125, -11.98779296875, -11.525390625, -11.06298828125, -10.6005859375, -10.13818359375, -9.67578125, -9.21337890625, -8.7509765625, -8.28857421875, -7.826171875, -7.36376953125, -6.9013671875, -6.43896484375, -5.9765625, -5.51416015625, -5.0517578125, -4.58935546875, -4.126953125, -3.66455078125, -3.2021484375, -2.73974609375, -2.27734375, -1.81494140625, -1.3525390625, -0.89013671875, -0.427734375, 0.03466796875, 0.4970703125, 0.95947265625, 1.421875, 1.88427734375, 2.3466796875, 2.80908203125, 3.271484375, 3.73388671875, 4.1962890625, 4.65869140625, 5.12109375, 5.58349609375, 6.0458984375, 6.50830078125, 6.970703125, 7.43310546875, 7.8955078125, 8.35791015625, 8.8203125, 9.28271484375, 9.7451171875, 10.20751953125, 10.669921875, 11.13232421875, 11.5947265625, 12.05712890625, 12.51953125, 12.98193359375, 13.4443359375, 13.90673828125, 14.369140625, 14.83154296875, 15.2939453125, 15.75634765625, 16.21875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 5.0, 22.0, 31.0, 54.0, 74.0, 139.0, 249.0, 172.0, 99.0, 48.0, 24.0, 18.0, 7.0, 10.0, 9.0, 14.0, 1.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.17815399169922, -92.96552276611328, -89.75289154052734, -86.54025268554688, -83.32762145996094, -80.114990234375, -76.90235900878906, -73.68972778320312, -70.47709655761719, -67.26446533203125, -64.05183410644531, -60.83919906616211, -57.626564025878906, -54.41393280029297, -51.20130157470703, -47.988670349121094, -44.776031494140625, -41.56340026855469, -38.350765228271484, -35.13813400268555, -31.925500869750977, -28.712867736816406, -25.50023651123047, -22.2876033782959, -19.074970245361328, -15.862337112426758, -12.649704933166504, -9.43707275390625, -6.22443962097168, -3.0118064880371094, 0.20082473754882812, 3.4134578704833984, 6.6260833740234375, 9.838716506958008, 13.051348686218262, 16.263980865478516, 19.476613998413086, 22.689247131347656, 25.901878356933594, 29.114511489868164, 32.327144622802734, 35.53977584838867, 38.752410888671875, 41.96504211425781, 45.17767333984375, 48.39030838012695, 51.60293960571289, 54.815574645996094, 58.02820587158203, 61.24083709716797, 64.4534683227539, 67.66610717773438, 70.87873840332031, 74.09136962890625, 77.30400085449219, 80.51663208007812, 83.72926330566406, 86.94189453125, 90.15452575683594, 93.36715698242188, 96.57979583740234, 99.79242706298828, 103.00505828857422, 106.21768951416016, 109.43032836914062]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 10.0, 3.0, 6.0, 13.0, 10.0, 15.0, 28.0, 19.0, 33.0, 32.0, 31.0, 41.0, 44.0, 37.0, 42.0, 42.0, 53.0, 36.0, 34.0, 50.0, 51.0, 47.0, 34.0, 35.0, 31.0, 29.0, 29.0, 33.0, 16.0, 18.0, 13.0, 17.0, 18.0, 5.0, 13.0, 6.0, 7.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-33.818477630615234, -32.725120544433594, -31.631759643554688, -30.538400650024414, -29.44504165649414, -28.3516845703125, -27.258325576782227, -26.164966583251953, -25.07160758972168, -23.978248596191406, -22.884889602661133, -21.79153060913086, -20.69817352294922, -19.604812622070312, -18.511455535888672, -17.4180965423584, -16.324737548828125, -15.231378555297852, -14.138019561767578, -13.044661521911621, -11.951302528381348, -10.857943534851074, -9.764585494995117, -8.671226501464844, -7.57786750793457, -6.484508514404297, -5.391149997711182, -4.297791481018066, -3.204432487487793, -2.1110734939575195, -1.0177149772644043, 0.07564353942871094, 1.1690025329589844, 2.2623612880706787, 3.355720043182373, 4.449078559875488, 5.542437553405762, 6.635796546936035, 7.72915506362915, 8.822513580322266, 9.915872573852539, 11.009231567382812, 12.102590560913086, 13.195948600769043, 14.289307594299316, 15.38266658782959, 16.476024627685547, 17.56938362121582, 18.662742614746094, 19.756101608276367, 20.84946060180664, 21.942819595336914, 23.036178588867188, 24.129535675048828, 25.2228946685791, 26.316253662109375, 27.40961265563965, 28.502971649169922, 29.596330642700195, 30.68968963623047, 31.78304672241211, 32.876407623291016, 33.969764709472656, 35.06312561035156, 36.1564826965332]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 14.0, 8.0, 19.0, 15.0, 44.0, 42.0, 62.0, 73.0, 119.0, 174.0, 238.0, 393.0, 530.0, 756.0, 1187.0, 1835.0, 2796.0, 4473.0, 7599.0, 13198.0, 24240.0, 49443.0, 117412.0, 355463.0, 280555.0, 94810.0, 41925.0, 21297.0, 11482.0, 6724.0, 4035.0, 2545.0, 1642.0, 1088.0, 721.0, 494.0, 336.0, 219.0, 161.0, 123.0, 73.0, 64.0, 37.0, 26.0, 23.0, 16.0, 11.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-33.0625, -32.0869140625, -31.111328125, -30.1357421875, -29.16015625, -28.1845703125, -27.208984375, -26.2333984375, -25.2578125, -24.2822265625, -23.306640625, -22.3310546875, -21.35546875, -20.3798828125, -19.404296875, -18.4287109375, -17.453125, -16.4775390625, -15.501953125, -14.5263671875, -13.55078125, -12.5751953125, -11.599609375, -10.6240234375, -9.6484375, -8.6728515625, -7.697265625, -6.7216796875, -5.74609375, -4.7705078125, -3.794921875, -2.8193359375, -1.84375, -0.8681640625, 0.107421875, 1.0830078125, 2.05859375, 3.0341796875, 4.009765625, 4.9853515625, 5.9609375, 6.9365234375, 7.912109375, 8.8876953125, 9.86328125, 10.8388671875, 11.814453125, 12.7900390625, 13.765625, 14.7412109375, 15.716796875, 16.6923828125, 17.66796875, 18.6435546875, 19.619140625, 20.5947265625, 21.5703125, 22.5458984375, 23.521484375, 24.4970703125, 25.47265625, 26.4482421875, 27.423828125, 28.3994140625, 29.375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 10.0, 12.0, 18.0, 23.0, 22.0, 33.0, 31.0, 38.0, 35.0, 47.0, 53.0, 53.0, 47.0, 51.0, 58.0, 43.0, 39.0, 60.0, 46.0, 47.0, 27.0, 39.0, 31.0, 21.0, 16.0, 12.0, 16.0, 23.0, 10.0, 8.0, 5.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.375, -35.17333984375, -33.9716796875, -32.77001953125, -31.568359375, -30.36669921875, -29.1650390625, -27.96337890625, -26.76171875, -25.56005859375, -24.3583984375, -23.15673828125, -21.955078125, -20.75341796875, -19.5517578125, -18.35009765625, -17.1484375, -15.94677734375, -14.7451171875, -13.54345703125, -12.341796875, -11.14013671875, -9.9384765625, -8.73681640625, -7.53515625, -6.33349609375, -5.1318359375, -3.93017578125, -2.728515625, -1.52685546875, -0.3251953125, 0.87646484375, 2.078125, 3.27978515625, 4.4814453125, 5.68310546875, 6.884765625, 8.08642578125, 9.2880859375, 10.48974609375, 11.69140625, 12.89306640625, 14.0947265625, 15.29638671875, 16.498046875, 17.69970703125, 18.9013671875, 20.10302734375, 21.3046875, 22.50634765625, 23.7080078125, 24.90966796875, 26.111328125, 27.31298828125, 28.5146484375, 29.71630859375, 30.91796875, 32.11962890625, 33.3212890625, 34.52294921875, 35.724609375, 36.92626953125, 38.1279296875, 39.32958984375, 40.53125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 3.0, 10.0, 22.0, 25.0, 30.0, 52.0, 63.0, 83.0, 112.0, 141.0, 222.0, 278.0, 393.0, 544.0, 788.0, 1161.0, 1784.0, 2841.0, 4598.0, 8079.0, 17368.0, 50619.0, 289543.0, 548117.0, 74155.0, 22551.0, 10113.0, 5312.0, 3186.0, 2014.0, 1294.0, 883.0, 602.0, 437.0, 309.0, 225.0, 179.0, 128.0, 71.0, 56.0, 42.0, 32.0, 24.0, 16.0, 20.0, 1.0, 9.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.5, -41.08984375, -39.6796875, -38.26953125, -36.859375, -35.44921875, -34.0390625, -32.62890625, -31.21875, -29.80859375, -28.3984375, -26.98828125, -25.578125, -24.16796875, -22.7578125, -21.34765625, -19.9375, -18.52734375, -17.1171875, -15.70703125, -14.296875, -12.88671875, -11.4765625, -10.06640625, -8.65625, -7.24609375, -5.8359375, -4.42578125, -3.015625, -1.60546875, -0.1953125, 1.21484375, 2.625, 4.03515625, 5.4453125, 6.85546875, 8.265625, 9.67578125, 11.0859375, 12.49609375, 13.90625, 15.31640625, 16.7265625, 18.13671875, 19.546875, 20.95703125, 22.3671875, 23.77734375, 25.1875, 26.59765625, 28.0078125, 29.41796875, 30.828125, 32.23828125, 33.6484375, 35.05859375, 36.46875, 37.87890625, 39.2890625, 40.69921875, 42.109375, 43.51953125, 44.9296875, 46.33984375, 47.75]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 5.0, 9.0, 7.0, 7.0, 18.0, 20.0, 19.0, 19.0, 25.0, 17.0, 27.0, 24.0, 29.0, 35.0, 46.0, 44.0, 44.0, 35.0, 40.0, 43.0, 51.0, 43.0, 41.0, 42.0, 46.0, 29.0, 34.0, 24.0, 19.0, 22.0, 17.0, 21.0, 13.0, 10.0, 8.0, 8.0, 7.0, 9.0, 10.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-22.296875, -21.63671875, -20.9765625, -20.31640625, -19.65625, -18.99609375, -18.3359375, -17.67578125, -17.015625, -16.35546875, -15.6953125, -15.03515625, -14.375, -13.71484375, -13.0546875, -12.39453125, -11.734375, -11.07421875, -10.4140625, -9.75390625, -9.09375, -8.43359375, -7.7734375, -7.11328125, -6.453125, -5.79296875, -5.1328125, -4.47265625, -3.8125, -3.15234375, -2.4921875, -1.83203125, -1.171875, -0.51171875, 0.1484375, 0.80859375, 1.46875, 2.12890625, 2.7890625, 3.44921875, 4.109375, 4.76953125, 5.4296875, 6.08984375, 6.75, 7.41015625, 8.0703125, 8.73046875, 9.390625, 10.05078125, 10.7109375, 11.37109375, 12.03125, 12.69140625, 13.3515625, 14.01171875, 14.671875, 15.33203125, 15.9921875, 16.65234375, 17.3125, 17.97265625, 18.6328125, 19.29296875, 19.953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0, 10.0, 7.0, 10.0, 19.0, 23.0, 32.0, 54.0, 94.0, 120.0, 153.0, 269.0, 383.0, 564.0, 825.0, 1153.0, 1829.0, 2829.0, 4489.0, 7754.0, 15155.0, 33058.0, 122195.0, 679081.0, 112071.0, 31979.0, 14176.0, 7334.0, 4579.0, 2696.0, 1914.0, 1163.0, 869.0, 593.0, 339.0, 244.0, 161.0, 116.0, 57.0, 31.0, 57.0, 34.0, 17.0, 9.0, 6.0, 1.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.10546875, -6.872314453125, -6.63916015625, -6.406005859375, -6.1728515625, -5.939697265625, -5.70654296875, -5.473388671875, -5.240234375, -5.007080078125, -4.77392578125, -4.540771484375, -4.3076171875, -4.074462890625, -3.84130859375, -3.608154296875, -3.375, -3.141845703125, -2.90869140625, -2.675537109375, -2.4423828125, -2.209228515625, -1.97607421875, -1.742919921875, -1.509765625, -1.276611328125, -1.04345703125, -0.810302734375, -0.5771484375, -0.343994140625, -0.11083984375, 0.122314453125, 0.35546875, 0.588623046875, 0.82177734375, 1.054931640625, 1.2880859375, 1.521240234375, 1.75439453125, 1.987548828125, 2.220703125, 2.453857421875, 2.68701171875, 2.920166015625, 3.1533203125, 3.386474609375, 3.61962890625, 3.852783203125, 4.0859375, 4.319091796875, 4.55224609375, 4.785400390625, 5.0185546875, 5.251708984375, 5.48486328125, 5.718017578125, 5.951171875, 6.184326171875, 6.41748046875, 6.650634765625, 6.8837890625, 7.116943359375, 7.35009765625, 7.583251953125, 7.81640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 13.0, 22.0, 18.0, 36.0, 54.0, 78.0, 96.0, 128.0, 126.0, 108.0, 79.0, 61.0, 40.0, 28.0, 21.0, 24.0, 14.0, 12.0, 8.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007476806640625, -0.0007257759571075439, -0.0007038712501525879, -0.0006819665431976318, -0.0006600618362426758, -0.0006381571292877197, -0.0006162524223327637, -0.0005943477153778076, -0.0005724430084228516, -0.0005505383014678955, -0.0005286335945129395, -0.0005067288875579834, -0.00048482418060302734, -0.0004629194736480713, -0.00044101476669311523, -0.0004191100597381592, -0.0003972053527832031, -0.00037530064582824707, -0.000353395938873291, -0.00033149123191833496, -0.0003095865249633789, -0.00028768181800842285, -0.0002657771110534668, -0.00024387240409851074, -0.0002219676971435547, -0.00020006299018859863, -0.00017815828323364258, -0.00015625357627868652, -0.00013434886932373047, -0.00011244416236877441, -9.053945541381836e-05, -6.86347484588623e-05, -4.673004150390625e-05, -2.4825334548950195e-05, -2.9206275939941406e-06, 1.8984079360961914e-05, 4.088878631591797e-05, 6.279349327087402e-05, 8.469820022583008e-05, 0.00010660290718078613, 0.0001285076141357422, 0.00015041232109069824, 0.0001723170280456543, 0.00019422173500061035, 0.0002161264419555664, 0.00023803114891052246, 0.0002599358558654785, 0.00028184056282043457, 0.0003037452697753906, 0.0003256499767303467, 0.00034755468368530273, 0.0003694593906402588, 0.00039136409759521484, 0.0004132688045501709, 0.00043517351150512695, 0.000457078218460083, 0.00047898292541503906, 0.0005008876323699951, 0.0005227923393249512, 0.0005446970462799072, 0.0005666017532348633, 0.0005885064601898193, 0.0006104111671447754, 0.0006323158740997314, 0.0006542205810546875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 16.0, 11.0, 21.0, 35.0, 39.0, 80.0, 124.0, 155.0, 245.0, 353.0, 568.0, 853.0, 1417.0, 2378.0, 3931.0, 7068.0, 12783.0, 24680.0, 51554.0, 129294.0, 481238.0, 196545.0, 67494.0, 30906.0, 15759.0, 8611.0, 4902.0, 2874.0, 1690.0, 1030.0, 636.0, 460.0, 251.0, 155.0, 132.0, 80.0, 54.0, 39.0, 23.0, 22.0, 10.0, 12.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.5185546875, -6.298828125, -6.0791015625, -5.859375, -5.6396484375, -5.419921875, -5.2001953125, -4.98046875, -4.7607421875, -4.541015625, -4.3212890625, -4.1015625, -3.8818359375, -3.662109375, -3.4423828125, -3.22265625, -3.0029296875, -2.783203125, -2.5634765625, -2.34375, -2.1240234375, -1.904296875, -1.6845703125, -1.46484375, -1.2451171875, -1.025390625, -0.8056640625, -0.5859375, -0.3662109375, -0.146484375, 0.0732421875, 0.29296875, 0.5126953125, 0.732421875, 0.9521484375, 1.171875, 1.3916015625, 1.611328125, 1.8310546875, 2.05078125, 2.2705078125, 2.490234375, 2.7099609375, 2.9296875, 3.1494140625, 3.369140625, 3.5888671875, 3.80859375, 4.0283203125, 4.248046875, 4.4677734375, 4.6875, 4.9072265625, 5.126953125, 5.3466796875, 5.56640625, 5.7861328125, 6.005859375, 6.2255859375, 6.4453125, 6.6650390625, 6.884765625, 7.1044921875, 7.32421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 6.0, 6.0, 14.0, 10.0, 18.0, 22.0, 30.0, 33.0, 31.0, 31.0, 55.0, 54.0, 59.0, 82.0, 72.0, 81.0, 58.0, 55.0, 40.0, 38.0, 41.0, 30.0, 22.0, 16.0, 18.0, 14.0, 17.0, 9.0, 9.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5556640625, -1.508880615234375, -1.46209716796875, -1.415313720703125, -1.3685302734375, -1.321746826171875, -1.27496337890625, -1.228179931640625, -1.181396484375, -1.134613037109375, -1.08782958984375, -1.041046142578125, -0.9942626953125, -0.947479248046875, -0.90069580078125, -0.853912353515625, -0.80712890625, -0.760345458984375, -0.71356201171875, -0.666778564453125, -0.6199951171875, -0.573211669921875, -0.52642822265625, -0.479644775390625, -0.432861328125, -0.386077880859375, -0.33929443359375, -0.292510986328125, -0.2457275390625, -0.198944091796875, -0.15216064453125, -0.105377197265625, -0.05859375, -0.011810302734375, 0.03497314453125, 0.081756591796875, 0.1285400390625, 0.175323486328125, 0.22210693359375, 0.268890380859375, 0.315673828125, 0.362457275390625, 0.40924072265625, 0.456024169921875, 0.5028076171875, 0.549591064453125, 0.59637451171875, 0.643157958984375, 0.68994140625, 0.736724853515625, 0.78350830078125, 0.830291748046875, 0.8770751953125, 0.923858642578125, 0.97064208984375, 1.017425537109375, 1.064208984375, 1.110992431640625, 1.15777587890625, 1.204559326171875, 1.2513427734375, 1.298126220703125, 1.34490966796875, 1.391693115234375, 1.4384765625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 6.0, 10.0, 11.0, 25.0, 40.0, 81.0, 132.0, 262.0, 176.0, 103.0, 50.0, 24.0, 21.0, 8.0, 11.0, 8.0, 6.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.99330139160156, -82.90961456298828, -79.825927734375, -76.74223327636719, -73.6585464477539, -70.57485961914062, -67.49116516113281, -64.40747833251953, -61.32379150390625, -58.24010467529297, -55.15641403198242, -52.072723388671875, -48.989036560058594, -45.90534973144531, -42.821659088134766, -39.73796844482422, -36.65428161621094, -33.570594787597656, -30.48690414428711, -27.403215408325195, -24.31952667236328, -21.235837936401367, -18.152149200439453, -15.068460464477539, -11.984771728515625, -8.901082992553711, -5.817394256591797, -2.733705520629883, 0.34998321533203125, 3.4336719512939453, 6.517360687255859, 9.601049423217773, 12.684730529785156, 15.76841926574707, 18.852108001708984, 21.9357967376709, 25.019485473632812, 28.103174209594727, 31.18686294555664, 34.27055358886719, 37.35424041748047, 40.43792724609375, 43.5216178894043, 46.605308532714844, 49.688995361328125, 52.772682189941406, 55.85637283325195, 58.9400634765625, 62.02375030517578, 65.10743713378906, 68.19113159179688, 71.27481842041016, 74.35850524902344, 77.44219207763672, 80.52587890625, 83.60957336425781, 86.6932601928711, 89.77694702148438, 92.86064147949219, 95.94432830810547, 99.02801513671875, 102.11170196533203, 105.19538879394531, 108.27908325195312, 111.3627700805664]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 4.0, 9.0, 9.0, 4.0, 11.0, 9.0, 21.0, 26.0, 24.0, 28.0, 33.0, 34.0, 36.0, 44.0, 37.0, 38.0, 43.0, 55.0, 41.0, 33.0, 47.0, 49.0, 43.0, 38.0, 36.0, 33.0, 27.0, 29.0, 33.0, 13.0, 20.0, 16.0, 15.0, 15.0, 11.0, 12.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-31.8544921875, -30.825944900512695, -29.79739761352539, -28.768850326538086, -27.74030303955078, -26.71175765991211, -25.683210372924805, -24.6546630859375, -23.626115798950195, -22.59756851196289, -21.569021224975586, -20.54047393798828, -19.51192855834961, -18.483379364013672, -17.454833984375, -16.426286697387695, -15.39773941040039, -14.369192123413086, -13.340644836425781, -12.312098503112793, -11.283551216125488, -10.255003929138184, -9.226457595825195, -8.19791030883789, -7.169363021850586, -6.140815734863281, -5.112268924713135, -4.083722114562988, -3.0551748275756836, -2.026627540588379, -0.9980807304382324, 0.030466079711914062, 1.0590133666992188, 2.0875604152679443, 3.11610746383667, 4.144654273986816, 5.173201560974121, 6.201748847961426, 7.230295658111572, 8.258842468261719, 9.287389755249023, 10.315937042236328, 11.344484329223633, 12.373030662536621, 13.401577949523926, 14.43012523651123, 15.458671569824219, 16.487218856811523, 17.515766143798828, 18.544313430786133, 19.572860717773438, 20.601408004760742, 21.629955291748047, 22.65850067138672, 23.687047958374023, 24.715595245361328, 25.744142532348633, 26.772689819335938, 27.801237106323242, 28.829784393310547, 29.85832977294922, 30.886878967285156, 31.915424346923828, 32.9439697265625, 33.97251892089844]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 3.0, 13.0, 8.0, 21.0, 33.0, 41.0, 47.0, 90.0, 134.0, 210.0, 340.0, 557.0, 854.0, 1445.0, 2401.0, 4053.0, 7291.0, 13404.0, 25349.0, 48792.0, 97091.0, 199653.0, 301239.0, 170172.0, 83717.0, 42258.0, 22028.0, 11649.0, 6400.0, 3574.0, 2250.0, 1252.0, 790.0, 487.0, 346.0, 186.0, 125.0, 84.0, 56.0, 39.0, 20.0, 19.0, 13.0, 11.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.1875, -52.5146484375, -50.841796875, -49.1689453125, -47.49609375, -45.8232421875, -44.150390625, -42.4775390625, -40.8046875, -39.1318359375, -37.458984375, -35.7861328125, -34.11328125, -32.4404296875, -30.767578125, -29.0947265625, -27.421875, -25.7490234375, -24.076171875, -22.4033203125, -20.73046875, -19.0576171875, -17.384765625, -15.7119140625, -14.0390625, -12.3662109375, -10.693359375, -9.0205078125, -7.34765625, -5.6748046875, -4.001953125, -2.3291015625, -0.65625, 1.0166015625, 2.689453125, 4.3623046875, 6.03515625, 7.7080078125, 9.380859375, 11.0537109375, 12.7265625, 14.3994140625, 16.072265625, 17.7451171875, 19.41796875, 21.0908203125, 22.763671875, 24.4365234375, 26.109375, 27.7822265625, 29.455078125, 31.1279296875, 32.80078125, 34.4736328125, 36.146484375, 37.8193359375, 39.4921875, 41.1650390625, 42.837890625, 44.5107421875, 46.18359375, 47.8564453125, 49.529296875, 51.2021484375, 52.875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 2.0, 5.0, 8.0, 9.0, 12.0, 17.0, 21.0, 28.0, 27.0, 28.0, 44.0, 34.0, 38.0, 32.0, 47.0, 53.0, 54.0, 49.0, 42.0, 47.0, 48.0, 45.0, 39.0, 38.0, 32.0, 36.0, 25.0, 21.0, 21.0, 15.0, 12.0, 12.0, 18.0, 5.0, 7.0, 8.0, 7.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.5, -28.540771484375, -27.58154296875, -26.622314453125, -25.6630859375, -24.703857421875, -23.74462890625, -22.785400390625, -21.826171875, -20.866943359375, -19.90771484375, -18.948486328125, -17.9892578125, -17.030029296875, -16.07080078125, -15.111572265625, -14.15234375, -13.193115234375, -12.23388671875, -11.274658203125, -10.3154296875, -9.356201171875, -8.39697265625, -7.437744140625, -6.478515625, -5.519287109375, -4.56005859375, -3.600830078125, -2.6416015625, -1.682373046875, -0.72314453125, 0.236083984375, 1.1953125, 2.154541015625, 3.11376953125, 4.072998046875, 5.0322265625, 5.991455078125, 6.95068359375, 7.909912109375, 8.869140625, 9.828369140625, 10.78759765625, 11.746826171875, 12.7060546875, 13.665283203125, 14.62451171875, 15.583740234375, 16.54296875, 17.502197265625, 18.46142578125, 19.420654296875, 20.3798828125, 21.339111328125, 22.29833984375, 23.257568359375, 24.216796875, 25.176025390625, 26.13525390625, 27.094482421875, 28.0537109375, 29.012939453125, 29.97216796875, 30.931396484375, 31.890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 13.0, 26.0, 28.0, 25.0, 54.0, 69.0, 116.0, 170.0, 266.0, 399.0, 642.0, 1014.0, 1693.0, 2729.0, 4895.0, 8727.0, 16672.0, 34556.0, 76801.0, 186792.0, 353061.0, 200543.0, 83159.0, 36548.0, 17656.0, 9260.0, 5062.0, 2931.0, 1708.0, 1006.0, 650.0, 447.0, 269.0, 186.0, 117.0, 71.0, 66.0, 46.0, 22.0, 15.0, 14.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.625, -51.74609375, -49.8671875, -47.98828125, -46.109375, -44.23046875, -42.3515625, -40.47265625, -38.59375, -36.71484375, -34.8359375, -32.95703125, -31.078125, -29.19921875, -27.3203125, -25.44140625, -23.5625, -21.68359375, -19.8046875, -17.92578125, -16.046875, -14.16796875, -12.2890625, -10.41015625, -8.53125, -6.65234375, -4.7734375, -2.89453125, -1.015625, 0.86328125, 2.7421875, 4.62109375, 6.5, 8.37890625, 10.2578125, 12.13671875, 14.015625, 15.89453125, 17.7734375, 19.65234375, 21.53125, 23.41015625, 25.2890625, 27.16796875, 29.046875, 30.92578125, 32.8046875, 34.68359375, 36.5625, 38.44140625, 40.3203125, 42.19921875, 44.078125, 45.95703125, 47.8359375, 49.71484375, 51.59375, 53.47265625, 55.3515625, 57.23046875, 59.109375, 60.98828125, 62.8671875, 64.74609375, 66.625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 0.0, 4.0, 9.0, 9.0, 17.0, 10.0, 20.0, 18.0, 18.0, 29.0, 19.0, 32.0, 37.0, 23.0, 30.0, 34.0, 32.0, 39.0, 50.0, 37.0, 32.0, 41.0, 31.0, 38.0, 37.0, 38.0, 32.0, 34.0, 30.0, 24.0, 22.0, 24.0, 36.0, 16.0, 18.0, 14.0, 13.0, 10.0, 5.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.925537109375, -18.31982421875, -17.714111328125, -17.1083984375, -16.502685546875, -15.89697265625, -15.291259765625, -14.685546875, -14.079833984375, -13.47412109375, -12.868408203125, -12.2626953125, -11.656982421875, -11.05126953125, -10.445556640625, -9.83984375, -9.234130859375, -8.62841796875, -8.022705078125, -7.4169921875, -6.811279296875, -6.20556640625, -5.599853515625, -4.994140625, -4.388427734375, -3.78271484375, -3.177001953125, -2.5712890625, -1.965576171875, -1.35986328125, -0.754150390625, -0.1484375, 0.457275390625, 1.06298828125, 1.668701171875, 2.2744140625, 2.880126953125, 3.48583984375, 4.091552734375, 4.697265625, 5.302978515625, 5.90869140625, 6.514404296875, 7.1201171875, 7.725830078125, 8.33154296875, 8.937255859375, 9.54296875, 10.148681640625, 10.75439453125, 11.360107421875, 11.9658203125, 12.571533203125, 13.17724609375, 13.782958984375, 14.388671875, 14.994384765625, 15.60009765625, 16.205810546875, 16.8115234375, 17.417236328125, 18.02294921875, 18.628662109375, 19.234375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 13.0, 13.0, 22.0, 44.0, 56.0, 80.0, 155.0, 241.0, 367.0, 588.0, 1092.0, 1799.0, 3410.0, 7117.0, 16405.0, 45572.0, 194369.0, 645535.0, 84180.0, 26267.0, 10572.0, 4673.0, 2532.0, 1391.0, 778.0, 443.0, 303.0, 196.0, 119.0, 73.0, 38.0, 27.0, 25.0, 14.0, 12.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-136.875, -132.349609375, -127.82421875, -123.298828125, -118.7734375, -114.248046875, -109.72265625, -105.197265625, -100.671875, -96.146484375, -91.62109375, -87.095703125, -82.5703125, -78.044921875, -73.51953125, -68.994140625, -64.46875, -59.943359375, -55.41796875, -50.892578125, -46.3671875, -41.841796875, -37.31640625, -32.791015625, -28.265625, -23.740234375, -19.21484375, -14.689453125, -10.1640625, -5.638671875, -1.11328125, 3.412109375, 7.9375, 12.462890625, 16.98828125, 21.513671875, 26.0390625, 30.564453125, 35.08984375, 39.615234375, 44.140625, 48.666015625, 53.19140625, 57.716796875, 62.2421875, 66.767578125, 71.29296875, 75.818359375, 80.34375, 84.869140625, 89.39453125, 93.919921875, 98.4453125, 102.970703125, 107.49609375, 112.021484375, 116.546875, 121.072265625, 125.59765625, 130.123046875, 134.6484375, 139.173828125, 143.69921875, 148.224609375, 152.75]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 18.0, 19.0, 27.0, 42.0, 48.0, 54.0, 74.0, 118.0, 167.0, 118.0, 80.0, 49.0, 43.0, 40.0, 19.0, 21.0, 15.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004241943359375, -0.004114627838134766, -0.003987312316894531, -0.003859996795654297, -0.0037326812744140625, -0.003605365753173828, -0.0034780502319335938, -0.0033507347106933594, -0.003223419189453125, -0.0030961036682128906, -0.0029687881469726562, -0.002841472625732422, -0.0027141571044921875, -0.002586841583251953, -0.0024595260620117188, -0.0023322105407714844, -0.00220489501953125, -0.0020775794982910156, -0.0019502639770507812, -0.0018229484558105469, -0.0016956329345703125, -0.0015683174133300781, -0.0014410018920898438, -0.0013136863708496094, -0.001186370849609375, -0.0010590553283691406, -0.0009317398071289062, -0.0008044242858886719, -0.0006771087646484375, -0.0005497932434082031, -0.00042247772216796875, -0.0002951622009277344, -0.0001678466796875, -4.0531158447265625e-05, 8.678436279296875e-05, 0.00021409988403320312, 0.0003414154052734375, 0.0004687309265136719, 0.0005960464477539062, 0.0007233619689941406, 0.000850677490234375, 0.0009779930114746094, 0.0011053085327148438, 0.0012326240539550781, 0.0013599395751953125, 0.0014872550964355469, 0.0016145706176757812, 0.0017418861389160156, 0.00186920166015625, 0.0019965171813964844, 0.0021238327026367188, 0.002251148223876953, 0.0023784637451171875, 0.002505779266357422, 0.0026330947875976562, 0.0027604103088378906, 0.002887725830078125, 0.0030150413513183594, 0.0031423568725585938, 0.003269672393798828, 0.0033969879150390625, 0.003524303436279297, 0.0036516189575195312, 0.0037789344787597656, 0.00390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 10.0, 6.0, 16.0, 22.0, 31.0, 42.0, 54.0, 82.0, 117.0, 161.0, 217.0, 352.0, 541.0, 755.0, 1196.0, 1859.0, 3086.0, 5670.0, 11301.0, 27150.0, 86720.0, 623612.0, 203747.0, 45907.0, 17182.0, 7825.0, 4052.0, 2461.0, 1459.0, 963.0, 618.0, 391.0, 298.0, 203.0, 133.0, 87.0, 55.0, 55.0, 36.0, 19.0, 19.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.625, -100.1416015625, -96.658203125, -93.1748046875, -89.69140625, -86.2080078125, -82.724609375, -79.2412109375, -75.7578125, -72.2744140625, -68.791015625, -65.3076171875, -61.82421875, -58.3408203125, -54.857421875, -51.3740234375, -47.890625, -44.4072265625, -40.923828125, -37.4404296875, -33.95703125, -30.4736328125, -26.990234375, -23.5068359375, -20.0234375, -16.5400390625, -13.056640625, -9.5732421875, -6.08984375, -2.6064453125, 0.876953125, 4.3603515625, 7.84375, 11.3271484375, 14.810546875, 18.2939453125, 21.77734375, 25.2607421875, 28.744140625, 32.2275390625, 35.7109375, 39.1943359375, 42.677734375, 46.1611328125, 49.64453125, 53.1279296875, 56.611328125, 60.0947265625, 63.578125, 67.0615234375, 70.544921875, 74.0283203125, 77.51171875, 80.9951171875, 84.478515625, 87.9619140625, 91.4453125, 94.9287109375, 98.412109375, 101.8955078125, 105.37890625, 108.8623046875, 112.345703125, 115.8291015625, 119.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 3.0, 10.0, 11.0, 11.0, 18.0, 27.0, 36.0, 41.0, 59.0, 86.0, 68.0, 101.0, 129.0, 81.0, 65.0, 49.0, 42.0, 29.0, 28.0, 21.0, 15.0, 11.0, 6.0, 5.0, 5.0, 2.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-25.296875, -24.55419921875, -23.8115234375, -23.06884765625, -22.326171875, -21.58349609375, -20.8408203125, -20.09814453125, -19.35546875, -18.61279296875, -17.8701171875, -17.12744140625, -16.384765625, -15.64208984375, -14.8994140625, -14.15673828125, -13.4140625, -12.67138671875, -11.9287109375, -11.18603515625, -10.443359375, -9.70068359375, -8.9580078125, -8.21533203125, -7.47265625, -6.72998046875, -5.9873046875, -5.24462890625, -4.501953125, -3.75927734375, -3.0166015625, -2.27392578125, -1.53125, -0.78857421875, -0.0458984375, 0.69677734375, 1.439453125, 2.18212890625, 2.9248046875, 3.66748046875, 4.41015625, 5.15283203125, 5.8955078125, 6.63818359375, 7.380859375, 8.12353515625, 8.8662109375, 9.60888671875, 10.3515625, 11.09423828125, 11.8369140625, 12.57958984375, 13.322265625, 14.06494140625, 14.8076171875, 15.55029296875, 16.29296875, 17.03564453125, 17.7783203125, 18.52099609375, 19.263671875, 20.00634765625, 20.7490234375, 21.49169921875, 22.234375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 8.0, 15.0, 28.0, 39.0, 90.0, 163.0, 199.0, 145.0, 100.0, 63.0, 29.0, 22.0, 17.0, 17.0, 9.0, 9.0, 7.0, 10.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.20444107055664, -44.77104187011719, -42.337642669677734, -39.90424346923828, -37.470848083496094, -35.03744888305664, -32.60404968261719, -30.170652389526367, -27.737253189086914, -25.30385398864746, -22.87045669555664, -20.437057495117188, -18.003658294677734, -15.570261001586914, -13.136861801147461, -10.70346450805664, -8.270065307617188, -5.836667060852051, -3.403268337249756, -0.9698696136474609, 1.4635286331176758, 3.8969268798828125, 6.330326080322266, 8.763723373413086, 11.197122573852539, 13.630520820617676, 16.063919067382812, 18.497318267822266, 20.93071746826172, 23.36411476135254, 25.797513961791992, 28.230911254882812, 30.664306640625, 33.09770584106445, 35.531105041503906, 37.964500427246094, 40.39789962768555, 42.831298828125, 45.26469802856445, 47.698097229003906, 50.131492614746094, 52.56489181518555, 54.998291015625, 57.43168640136719, 59.86508560180664, 62.298484802246094, 64.73188781738281, 67.165283203125, 69.59867858886719, 72.03207397460938, 74.4654769897461, 76.89887237548828, 79.332275390625, 81.76567077636719, 84.19906616210938, 86.6324691772461, 89.06587219238281, 91.499267578125, 93.93267059326172, 96.3660659790039, 98.79946899414062, 101.23286437988281, 103.666259765625, 106.09966278076172, 108.5330581665039]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 2.0, 2.0, 6.0, 5.0, 11.0, 12.0, 8.0, 15.0, 19.0, 18.0, 14.0, 25.0, 23.0, 34.0, 31.0, 34.0, 48.0, 40.0, 43.0, 39.0, 36.0, 42.0, 41.0, 39.0, 44.0, 36.0, 31.0, 24.0, 29.0, 21.0, 25.0, 26.0, 30.0, 26.0, 15.0, 9.0, 18.0, 21.0, 13.0, 11.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-25.71710777282715, -24.87038803100586, -24.02366828918457, -23.17694854736328, -22.330230712890625, -21.483510971069336, -20.636791229248047, -19.790071487426758, -18.94335174560547, -18.09663200378418, -17.24991226196289, -16.403194427490234, -15.556474685668945, -14.709754943847656, -13.863035202026367, -13.016315460205078, -12.169597625732422, -11.322877883911133, -10.47615909576416, -9.629439353942871, -8.782720565795898, -7.936000823974609, -7.08928108215332, -6.2425618171691895, -5.395842552185059, -4.549123287200928, -3.7024037837982178, -2.855684280395508, -2.008965015411377, -1.162245750427246, -0.31552600860595703, 0.5311932563781738, 1.3779125213623047, 2.2246317863464355, 3.0713512897491455, 3.9180707931518555, 4.764790058135986, 5.611509323120117, 6.458229064941406, 7.304948329925537, 8.151667594909668, 8.998387336730957, 9.84510612487793, 10.691825866699219, 11.538545608520508, 12.38526439666748, 13.23198413848877, 14.078702926635742, 14.925422668457031, 15.77214241027832, 16.61886215209961, 17.465579986572266, 18.312299728393555, 19.159019470214844, 20.005739212036133, 20.852458953857422, 21.699176788330078, 22.545896530151367, 23.392616271972656, 24.239334106445312, 25.0860538482666, 25.93277359008789, 26.77949333190918, 27.62621307373047, 28.472932815551758]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 19.0, 34.0, 41.0, 72.0, 107.0, 182.0, 294.0, 478.0, 740.0, 1254.0, 1955.0, 3116.0, 4900.0, 8415.0, 14353.0, 25923.0, 48884.0, 102827.0, 255584.0, 1039556.0, 1976235.0, 412552.0, 141092.0, 66518.0, 35528.0, 20361.0, 12365.0, 7363.0, 4681.0, 3005.0, 1978.0, 1318.0, 881.0, 588.0, 361.0, 253.0, 169.0, 94.0, 76.0, 44.0, 26.0, 13.0, 14.0, 6.0, 4.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.15625, -44.67822265625, -43.2001953125, -41.72216796875, -40.244140625, -38.76611328125, -37.2880859375, -35.81005859375, -34.33203125, -32.85400390625, -31.3759765625, -29.89794921875, -28.419921875, -26.94189453125, -25.4638671875, -23.98583984375, -22.5078125, -21.02978515625, -19.5517578125, -18.07373046875, -16.595703125, -15.11767578125, -13.6396484375, -12.16162109375, -10.68359375, -9.20556640625, -7.7275390625, -6.24951171875, -4.771484375, -3.29345703125, -1.8154296875, -0.33740234375, 1.140625, 2.61865234375, 4.0966796875, 5.57470703125, 7.052734375, 8.53076171875, 10.0087890625, 11.48681640625, 12.96484375, 14.44287109375, 15.9208984375, 17.39892578125, 18.876953125, 20.35498046875, 21.8330078125, 23.31103515625, 24.7890625, 26.26708984375, 27.7451171875, 29.22314453125, 30.701171875, 32.17919921875, 33.6572265625, 35.13525390625, 36.61328125, 38.09130859375, 39.5693359375, 41.04736328125, 42.525390625, 44.00341796875, 45.4814453125, 46.95947265625, 48.4375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 9.0, 6.0, 9.0, 10.0, 13.0, 13.0, 19.0, 25.0, 31.0, 29.0, 32.0, 31.0, 35.0, 55.0, 44.0, 45.0, 41.0, 44.0, 52.0, 45.0, 35.0, 41.0, 39.0, 36.0, 31.0, 25.0, 20.0, 28.0, 21.0, 23.0, 17.0, 10.0, 13.0, 18.0, 7.0, 3.0, 7.0, 11.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.1328125, -13.6336669921875, -13.134521484375, -12.6353759765625, -12.13623046875, -11.6370849609375, -11.137939453125, -10.6387939453125, -10.1396484375, -9.6405029296875, -9.141357421875, -8.6422119140625, -8.14306640625, -7.6439208984375, -7.144775390625, -6.6456298828125, -6.146484375, -5.6473388671875, -5.148193359375, -4.6490478515625, -4.14990234375, -3.6507568359375, -3.151611328125, -2.6524658203125, -2.1533203125, -1.6541748046875, -1.155029296875, -0.6558837890625, -0.15673828125, 0.3424072265625, 0.841552734375, 1.3406982421875, 1.83984375, 2.3389892578125, 2.838134765625, 3.3372802734375, 3.83642578125, 4.3355712890625, 4.834716796875, 5.3338623046875, 5.8330078125, 6.3321533203125, 6.831298828125, 7.3304443359375, 7.82958984375, 8.3287353515625, 8.827880859375, 9.3270263671875, 9.826171875, 10.3253173828125, 10.824462890625, 11.3236083984375, 11.82275390625, 12.3218994140625, 12.821044921875, 13.3201904296875, 13.8193359375, 14.3184814453125, 14.817626953125, 15.3167724609375, 15.81591796875, 16.3150634765625, 16.814208984375, 17.3133544921875, 17.8125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 4.0, 15.0, 11.0, 17.0, 28.0, 47.0, 48.0, 78.0, 102.0, 169.0, 215.0, 365.0, 545.0, 738.0, 1240.0, 1937.0, 3279.0, 5513.0, 9966.0, 18634.0, 38437.0, 87295.0, 227787.0, 791324.0, 2095055.0, 586415.0, 181791.0, 71399.0, 33302.0, 16586.0, 8835.0, 4905.0, 3045.0, 1839.0, 1140.0, 766.0, 469.0, 283.0, 188.0, 147.0, 92.0, 71.0, 45.0, 33.0, 28.0, 21.0, 12.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-45.65625, -44.2890625, -42.921875, -41.5546875, -40.1875, -38.8203125, -37.453125, -36.0859375, -34.71875, -33.3515625, -31.984375, -30.6171875, -29.25, -27.8828125, -26.515625, -25.1484375, -23.78125, -22.4140625, -21.046875, -19.6796875, -18.3125, -16.9453125, -15.578125, -14.2109375, -12.84375, -11.4765625, -10.109375, -8.7421875, -7.375, -6.0078125, -4.640625, -3.2734375, -1.90625, -0.5390625, 0.828125, 2.1953125, 3.5625, 4.9296875, 6.296875, 7.6640625, 9.03125, 10.3984375, 11.765625, 13.1328125, 14.5, 15.8671875, 17.234375, 18.6015625, 19.96875, 21.3359375, 22.703125, 24.0703125, 25.4375, 26.8046875, 28.171875, 29.5390625, 30.90625, 32.2734375, 33.640625, 35.0078125, 36.375, 37.7421875, 39.109375, 40.4765625, 41.84375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 2.0, 4.0, 6.0, 7.0, 13.0, 18.0, 23.0, 30.0, 43.0, 57.0, 71.0, 93.0, 126.0, 169.0, 209.0, 234.0, 299.0, 349.0, 386.0, 376.0, 306.0, 255.0, 177.0, 161.0, 136.0, 110.0, 74.0, 72.0, 66.0, 32.0, 35.0, 28.0, 24.0, 21.0, 14.0, 6.0, 9.0, 9.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.1015625, -8.7752685546875, -8.448974609375, -8.1226806640625, -7.79638671875, -7.4700927734375, -7.143798828125, -6.8175048828125, -6.4912109375, -6.1649169921875, -5.838623046875, -5.5123291015625, -5.18603515625, -4.8597412109375, -4.533447265625, -4.2071533203125, -3.880859375, -3.5545654296875, -3.228271484375, -2.9019775390625, -2.57568359375, -2.2493896484375, -1.923095703125, -1.5968017578125, -1.2705078125, -0.9442138671875, -0.617919921875, -0.2916259765625, 0.03466796875, 0.3609619140625, 0.687255859375, 1.0135498046875, 1.33984375, 1.6661376953125, 1.992431640625, 2.3187255859375, 2.64501953125, 2.9713134765625, 3.297607421875, 3.6239013671875, 3.9501953125, 4.2764892578125, 4.602783203125, 4.9290771484375, 5.25537109375, 5.5816650390625, 5.907958984375, 6.2342529296875, 6.560546875, 6.8868408203125, 7.213134765625, 7.5394287109375, 7.86572265625, 8.1920166015625, 8.518310546875, 8.8446044921875, 9.1708984375, 9.4971923828125, 9.823486328125, 10.1497802734375, 10.47607421875, 10.8023681640625, 11.128662109375, 11.4549560546875, 11.78125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 9.0, 18.0, 30.0, 46.0, 75.0, 133.0, 219.0, 188.0, 104.0, 62.0, 33.0, 17.0, 10.0, 13.0, 9.0, 2.0, 9.0, 1.0, 6.0, 0.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.93971633911133, -59.09362030029297, -57.247520446777344, -55.401424407958984, -53.55532455444336, -51.709228515625, -49.863128662109375, -48.017032623291016, -46.170936584472656, -44.3248405456543, -42.47874069213867, -40.63264465332031, -38.78654479980469, -36.94044876098633, -35.09435272216797, -33.248252868652344, -31.40215301513672, -29.556055068969727, -27.709957122802734, -25.863861083984375, -24.01776123046875, -22.17166519165039, -20.3255672454834, -18.479469299316406, -16.633371353149414, -14.787273406982422, -12.94117546081543, -11.095078468322754, -9.248980522155762, -7.4028825759887695, -5.556785583496094, -3.7106876373291016, -1.8645858764648438, -0.018488168716430664, 1.8276095390319824, 3.6737070083618164, 5.519804954528809, 7.365902900695801, 9.211999893188477, 11.058097839355469, 12.904195785522461, 14.750293731689453, 16.596391677856445, 18.442489624023438, 20.288585662841797, 22.134685516357422, 23.98078155517578, 25.826879501342773, 27.672977447509766, 29.519075393676758, 31.36517333984375, 33.21126937866211, 35.057369232177734, 36.903465270996094, 38.74956512451172, 40.59566116333008, 42.44175720214844, 44.2878532409668, 46.13395309448242, 47.98004913330078, 49.826148986816406, 51.672245025634766, 53.518341064453125, 55.36444091796875, 57.210540771484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 2.0, 3.0, 10.0, 4.0, 11.0, 15.0, 13.0, 16.0, 20.0, 31.0, 15.0, 31.0, 34.0, 37.0, 38.0, 27.0, 35.0, 26.0, 36.0, 41.0, 57.0, 43.0, 44.0, 29.0, 31.0, 30.0, 33.0, 38.0, 28.0, 34.0, 26.0, 15.0, 21.0, 20.0, 11.0, 13.0, 14.0, 8.0, 3.0, 6.0, 16.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-16.732433319091797, -16.187957763671875, -15.64348030090332, -15.099003791809082, -14.554527282714844, -14.010050773620605, -13.465574264526367, -12.921097755432129, -12.37662124633789, -11.832144737243652, -11.287668228149414, -10.743191719055176, -10.198715209960938, -9.6542387008667, -9.109762191772461, -8.565285682678223, -8.020809173583984, -7.476332664489746, -6.931856155395508, -6.3873796463012695, -5.842903137207031, -5.298426628112793, -4.753950119018555, -4.209473609924316, -3.664997100830078, -3.12052059173584, -2.5760440826416016, -2.0315675735473633, -1.487091064453125, -0.9426145553588867, -0.39813804626464844, 0.14633846282958984, 0.6908130645751953, 1.2352895736694336, 1.7797660827636719, 2.32424259185791, 2.8687191009521484, 3.4131956100463867, 3.957672119140625, 4.502148628234863, 5.046625137329102, 5.59110164642334, 6.135578155517578, 6.680054664611816, 7.224531173706055, 7.769007682800293, 8.313484191894531, 8.85796070098877, 9.402437210083008, 9.946913719177246, 10.491390228271484, 11.035866737365723, 11.580343246459961, 12.1248197555542, 12.669296264648438, 13.213772773742676, 13.758249282836914, 14.302725791931152, 14.84720230102539, 15.391678810119629, 15.936155319213867, 16.480632781982422, 17.025108337402344, 17.569583892822266, 18.11406135559082]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 13.0, 27.0, 40.0, 67.0, 96.0, 123.0, 190.0, 320.0, 470.0, 669.0, 1003.0, 1544.0, 2269.0, 3507.0, 5651.0, 8949.0, 14912.0, 26156.0, 48729.0, 100854.0, 249221.0, 321440.0, 126595.0, 58621.0, 31227.0, 17548.0, 10353.0, 6316.0, 4007.0, 2597.0, 1636.0, 1158.0, 719.0, 527.0, 307.0, 193.0, 152.0, 96.0, 75.0, 54.0, 32.0, 26.0, 16.0, 16.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-16.203125, -15.698974609375, -15.19482421875, -14.690673828125, -14.1865234375, -13.682373046875, -13.17822265625, -12.674072265625, -12.169921875, -11.665771484375, -11.16162109375, -10.657470703125, -10.1533203125, -9.649169921875, -9.14501953125, -8.640869140625, -8.13671875, -7.632568359375, -7.12841796875, -6.624267578125, -6.1201171875, -5.615966796875, -5.11181640625, -4.607666015625, -4.103515625, -3.599365234375, -3.09521484375, -2.591064453125, -2.0869140625, -1.582763671875, -1.07861328125, -0.574462890625, -0.0703125, 0.433837890625, 0.93798828125, 1.442138671875, 1.9462890625, 2.450439453125, 2.95458984375, 3.458740234375, 3.962890625, 4.467041015625, 4.97119140625, 5.475341796875, 5.9794921875, 6.483642578125, 6.98779296875, 7.491943359375, 7.99609375, 8.500244140625, 9.00439453125, 9.508544921875, 10.0126953125, 10.516845703125, 11.02099609375, 11.525146484375, 12.029296875, 12.533447265625, 13.03759765625, 13.541748046875, 14.0458984375, 14.550048828125, 15.05419921875, 15.558349609375, 16.0625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 5.0, 10.0, 4.0, 7.0, 14.0, 18.0, 22.0, 30.0, 24.0, 18.0, 27.0, 37.0, 24.0, 23.0, 40.0, 35.0, 42.0, 36.0, 42.0, 44.0, 47.0, 42.0, 35.0, 34.0, 33.0, 27.0, 29.0, 28.0, 29.0, 33.0, 30.0, 14.0, 17.0, 11.0, 13.0, 9.0, 8.0, 10.0, 11.0, 4.0, 6.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.234375, -15.70654296875, -15.1787109375, -14.65087890625, -14.123046875, -13.59521484375, -13.0673828125, -12.53955078125, -12.01171875, -11.48388671875, -10.9560546875, -10.42822265625, -9.900390625, -9.37255859375, -8.8447265625, -8.31689453125, -7.7890625, -7.26123046875, -6.7333984375, -6.20556640625, -5.677734375, -5.14990234375, -4.6220703125, -4.09423828125, -3.56640625, -3.03857421875, -2.5107421875, -1.98291015625, -1.455078125, -0.92724609375, -0.3994140625, 0.12841796875, 0.65625, 1.18408203125, 1.7119140625, 2.23974609375, 2.767578125, 3.29541015625, 3.8232421875, 4.35107421875, 4.87890625, 5.40673828125, 5.9345703125, 6.46240234375, 6.990234375, 7.51806640625, 8.0458984375, 8.57373046875, 9.1015625, 9.62939453125, 10.1572265625, 10.68505859375, 11.212890625, 11.74072265625, 12.2685546875, 12.79638671875, 13.32421875, 13.85205078125, 14.3798828125, 14.90771484375, 15.435546875, 15.96337890625, 16.4912109375, 17.01904296875, 17.546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 6.0, 15.0, 20.0, 33.0, 42.0, 52.0, 80.0, 97.0, 135.0, 194.0, 329.0, 456.0, 737.0, 1113.0, 1743.0, 3037.0, 5157.0, 9515.0, 20686.0, 65137.0, 531693.0, 320011.0, 50395.0, 17658.0, 8288.0, 4572.0, 2621.0, 1571.0, 1018.0, 655.0, 451.0, 324.0, 214.0, 144.0, 105.0, 77.0, 44.0, 40.0, 26.0, 11.0, 12.0, 14.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.453125, -29.554931640625, -28.65673828125, -27.758544921875, -26.8603515625, -25.962158203125, -25.06396484375, -24.165771484375, -23.267578125, -22.369384765625, -21.47119140625, -20.572998046875, -19.6748046875, -18.776611328125, -17.87841796875, -16.980224609375, -16.08203125, -15.183837890625, -14.28564453125, -13.387451171875, -12.4892578125, -11.591064453125, -10.69287109375, -9.794677734375, -8.896484375, -7.998291015625, -7.10009765625, -6.201904296875, -5.3037109375, -4.405517578125, -3.50732421875, -2.609130859375, -1.7109375, -0.812744140625, 0.08544921875, 0.983642578125, 1.8818359375, 2.780029296875, 3.67822265625, 4.576416015625, 5.474609375, 6.372802734375, 7.27099609375, 8.169189453125, 9.0673828125, 9.965576171875, 10.86376953125, 11.761962890625, 12.66015625, 13.558349609375, 14.45654296875, 15.354736328125, 16.2529296875, 17.151123046875, 18.04931640625, 18.947509765625, 19.845703125, 20.743896484375, 21.64208984375, 22.540283203125, 23.4384765625, 24.336669921875, 25.23486328125, 26.133056640625, 27.03125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 7.0, 2.0, 3.0, 9.0, 7.0, 14.0, 12.0, 15.0, 13.0, 23.0, 21.0, 25.0, 36.0, 19.0, 37.0, 39.0, 31.0, 43.0, 44.0, 28.0, 31.0, 47.0, 44.0, 37.0, 38.0, 37.0, 41.0, 32.0, 26.0, 24.0, 27.0, 25.0, 22.0, 13.0, 12.0, 22.0, 16.0, 14.0, 15.0, 15.0, 6.0, 5.0, 8.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.59375, -10.2406005859375, -9.887451171875, -9.5343017578125, -9.18115234375, -8.8280029296875, -8.474853515625, -8.1217041015625, -7.7685546875, -7.4154052734375, -7.062255859375, -6.7091064453125, -6.35595703125, -6.0028076171875, -5.649658203125, -5.2965087890625, -4.943359375, -4.5902099609375, -4.237060546875, -3.8839111328125, -3.53076171875, -3.1776123046875, -2.824462890625, -2.4713134765625, -2.1181640625, -1.7650146484375, -1.411865234375, -1.0587158203125, -0.70556640625, -0.3524169921875, 0.000732421875, 0.3538818359375, 0.70703125, 1.0601806640625, 1.413330078125, 1.7664794921875, 2.11962890625, 2.4727783203125, 2.825927734375, 3.1790771484375, 3.5322265625, 3.8853759765625, 4.238525390625, 4.5916748046875, 4.94482421875, 5.2979736328125, 5.651123046875, 6.0042724609375, 6.357421875, 6.7105712890625, 7.063720703125, 7.4168701171875, 7.77001953125, 8.1231689453125, 8.476318359375, 8.8294677734375, 9.1826171875, 9.5357666015625, 9.888916015625, 10.2420654296875, 10.59521484375, 10.9483642578125, 11.301513671875, 11.6546630859375, 12.0078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 16.0, 17.0, 24.0, 32.0, 44.0, 48.0, 83.0, 124.0, 210.0, 275.0, 432.0, 682.0, 1072.0, 1871.0, 3164.0, 6019.0, 13050.0, 35150.0, 203258.0, 674906.0, 68532.0, 20548.0, 8704.0, 4213.0, 2300.0, 1402.0, 797.0, 503.0, 342.0, 248.0, 134.0, 98.0, 56.0, 38.0, 35.0, 34.0, 15.0, 21.0, 14.0, 4.0, 9.0, 7.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0], "bins": [-4.296875, -4.1676025390625, -4.038330078125, -3.9090576171875, -3.77978515625, -3.6505126953125, -3.521240234375, -3.3919677734375, -3.2626953125, -3.1334228515625, -3.004150390625, -2.8748779296875, -2.74560546875, -2.6163330078125, -2.487060546875, -2.3577880859375, -2.228515625, -2.0992431640625, -1.969970703125, -1.8406982421875, -1.71142578125, -1.5821533203125, -1.452880859375, -1.3236083984375, -1.1943359375, -1.0650634765625, -0.935791015625, -0.8065185546875, -0.67724609375, -0.5479736328125, -0.418701171875, -0.2894287109375, -0.16015625, -0.0308837890625, 0.098388671875, 0.2276611328125, 0.35693359375, 0.4862060546875, 0.615478515625, 0.7447509765625, 0.8740234375, 1.0032958984375, 1.132568359375, 1.2618408203125, 1.39111328125, 1.5203857421875, 1.649658203125, 1.7789306640625, 1.908203125, 2.0374755859375, 2.166748046875, 2.2960205078125, 2.42529296875, 2.5545654296875, 2.683837890625, 2.8131103515625, 2.9423828125, 3.0716552734375, 3.200927734375, 3.3302001953125, 3.45947265625, 3.5887451171875, 3.718017578125, 3.8472900390625, 3.9765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 11.0, 12.0, 33.0, 22.0, 26.0, 42.0, 52.0, 73.0, 110.0, 131.0, 98.0, 98.0, 71.0, 32.0, 40.0, 33.0, 30.0, 15.0, 12.0, 5.0, 15.0, 8.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00026035308837890625, -0.00025286152958869934, -0.00024536997079849243, -0.00023787841200828552, -0.0002303868532180786, -0.0002228952944278717, -0.0002154037356376648, -0.00020791217684745789, -0.00020042061805725098, -0.00019292905926704407, -0.00018543750047683716, -0.00017794594168663025, -0.00017045438289642334, -0.00016296282410621643, -0.00015547126531600952, -0.0001479797065258026, -0.0001404881477355957, -0.0001329965889453888, -0.00012550503015518188, -0.00011801347136497498, -0.00011052191257476807, -0.00010303035378456116, -9.553879499435425e-05, -8.804723620414734e-05, -8.055567741394043e-05, -7.306411862373352e-05, -6.557255983352661e-05, -5.80810010433197e-05, -5.058944225311279e-05, -4.3097883462905884e-05, -3.5606324672698975e-05, -2.8114765882492065e-05, -2.0623207092285156e-05, -1.3131648302078247e-05, -5.640089511871338e-06, 1.8514692783355713e-06, 9.34302806854248e-06, 1.683458685874939e-05, 2.43261456489563e-05, 3.181770443916321e-05, 3.930926322937012e-05, 4.6800822019577026e-05, 5.4292380809783936e-05, 6.178393959999084e-05, 6.927549839019775e-05, 7.676705718040466e-05, 8.425861597061157e-05, 9.175017476081848e-05, 9.924173355102539e-05, 0.0001067332923412323, 0.00011422485113143921, 0.00012171640992164612, 0.00012920796871185303, 0.00013669952750205994, 0.00014419108629226685, 0.00015168264508247375, 0.00015917420387268066, 0.00016666576266288757, 0.00017415732145309448, 0.0001816488802433014, 0.0001891404390335083, 0.0001966319978237152, 0.00020412355661392212, 0.00021161511540412903, 0.00021910667419433594]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 14.0, 13.0, 20.0, 27.0, 33.0, 44.0, 69.0, 108.0, 144.0, 192.0, 282.0, 440.0, 597.0, 914.0, 1294.0, 1869.0, 3176.0, 5313.0, 9636.0, 18454.0, 40534.0, 110283.0, 485846.0, 240589.0, 67764.0, 28072.0, 13661.0, 7324.0, 4192.0, 2548.0, 1628.0, 1054.0, 709.0, 503.0, 335.0, 246.0, 166.0, 151.0, 97.0, 70.0, 40.0, 39.0, 19.0, 11.0, 11.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.783477783203125, -2.69000244140625, -2.596527099609375, -2.5030517578125, -2.409576416015625, -2.31610107421875, -2.222625732421875, -2.129150390625, -2.035675048828125, -1.94219970703125, -1.848724365234375, -1.7552490234375, -1.661773681640625, -1.56829833984375, -1.474822998046875, -1.38134765625, -1.287872314453125, -1.19439697265625, -1.100921630859375, -1.0074462890625, -0.913970947265625, -0.82049560546875, -0.727020263671875, -0.633544921875, -0.540069580078125, -0.44659423828125, -0.353118896484375, -0.2596435546875, -0.166168212890625, -0.07269287109375, 0.020782470703125, 0.1142578125, 0.207733154296875, 0.30120849609375, 0.394683837890625, 0.4881591796875, 0.581634521484375, 0.67510986328125, 0.768585205078125, 0.862060546875, 0.955535888671875, 1.04901123046875, 1.142486572265625, 1.2359619140625, 1.329437255859375, 1.42291259765625, 1.516387939453125, 1.60986328125, 1.703338623046875, 1.79681396484375, 1.890289306640625, 1.9837646484375, 2.077239990234375, 2.17071533203125, 2.264190673828125, 2.357666015625, 2.451141357421875, 2.54461669921875, 2.638092041015625, 2.7315673828125, 2.825042724609375, 2.91851806640625, 3.011993408203125, 3.10546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 6.0, 5.0, 9.0, 12.0, 9.0, 22.0, 26.0, 24.0, 32.0, 54.0, 75.0, 91.0, 98.0, 107.0, 89.0, 68.0, 58.0, 42.0, 30.0, 26.0, 25.0, 19.0, 12.0, 10.0, 7.0, 5.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4809608459472656, -0.46265411376953125, -0.4443473815917969, -0.4260406494140625, -0.4077339172363281, -0.38942718505859375, -0.3711204528808594, -0.352813720703125, -0.3345069885253906, -0.31620025634765625, -0.2978935241699219, -0.2795867919921875, -0.2612800598144531, -0.24297332763671875, -0.22466659545898438, -0.20635986328125, -0.18805313110351562, -0.16974639892578125, -0.15143966674804688, -0.1331329345703125, -0.11482620239257812, -0.09651947021484375, -0.07821273803710938, -0.059906005859375, -0.041599273681640625, -0.02329254150390625, -0.004985809326171875, 0.0133209228515625, 0.031627655029296875, 0.04993438720703125, 0.06824111938476562, 0.0865478515625, 0.10485458374023438, 0.12316131591796875, 0.14146804809570312, 0.1597747802734375, 0.17808151245117188, 0.19638824462890625, 0.21469497680664062, 0.233001708984375, 0.2513084411621094, 0.26961517333984375, 0.2879219055175781, 0.3062286376953125, 0.3245353698730469, 0.34284210205078125, 0.3611488342285156, 0.37945556640625, 0.3977622985839844, 0.41606903076171875, 0.4343757629394531, 0.4526824951171875, 0.4709892272949219, 0.48929595947265625, 0.5076026916503906, 0.525909423828125, 0.5442161560058594, 0.5625228881835938, 0.5808296203613281, 0.5991363525390625, 0.6174430847167969, 0.6357498168945312, 0.6540565490722656, 0.67236328125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 22.0, 23.0, 62.0, 102.0, 174.0, 212.0, 136.0, 92.0, 50.0, 29.0, 16.0, 14.0, 8.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.39835739135742, -51.70405960083008, -50.009761810302734, -48.315460205078125, -46.62116241455078, -44.92686462402344, -43.232566833496094, -41.53826904296875, -39.843971252441406, -38.14967346191406, -36.45537567138672, -34.761077880859375, -33.066776275634766, -31.372478485107422, -29.678180694580078, -27.983882904052734, -26.289581298828125, -24.59528350830078, -22.900983810424805, -21.20668601989746, -19.512386322021484, -17.81808853149414, -16.123790740966797, -14.429491996765137, -12.735193252563477, -11.040894508361816, -9.346595764160156, -7.6522979736328125, -5.957999229431152, -4.263700485229492, -2.5694026947021484, -0.8751039505004883, 0.8191947937011719, 2.513493299484253, 4.207791805267334, 5.902090072631836, 7.596388816833496, 9.290687561035156, 10.9849853515625, 12.67928409576416, 14.37358283996582, 16.067880630493164, 17.76218032836914, 19.456478118896484, 21.150775909423828, 22.845075607299805, 24.53937339782715, 26.233673095703125, 27.92797088623047, 29.622268676757812, 31.31656837463379, 33.0108642578125, 34.70516586303711, 36.39946365356445, 38.0937614440918, 39.78805923461914, 41.48236083984375, 43.176658630371094, 44.87095642089844, 46.56525421142578, 48.25955581665039, 49.953853607177734, 51.64815139770508, 53.34244918823242, 55.036746978759766]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 7.0, 4.0, 4.0, 6.0, 5.0, 7.0, 9.0, 17.0, 9.0, 22.0, 20.0, 24.0, 24.0, 33.0, 33.0, 33.0, 37.0, 29.0, 33.0, 26.0, 36.0, 41.0, 53.0, 45.0, 44.0, 33.0, 27.0, 25.0, 37.0, 38.0, 22.0, 38.0, 31.0, 16.0, 17.0, 18.0, 14.0, 12.0, 15.0, 9.0, 3.0, 7.0, 12.0, 7.0, 3.0, 6.0, 1.0, 2.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-15.665393829345703, -15.15869140625, -14.65198802947998, -14.145284652709961, -13.638582229614258, -13.131879806518555, -12.625176429748535, -12.118473052978516, -11.611770629882812, -11.10506820678711, -10.59836483001709, -10.09166145324707, -9.584959030151367, -9.078256607055664, -8.571553230285645, -8.064849853515625, -7.558147430419922, -7.0514445304870605, -6.544741630554199, -6.038038730621338, -5.531335830688477, -5.024632930755615, -4.517930030822754, -4.011227130889893, -3.5045242309570312, -2.99782133102417, -2.4911184310913086, -1.9844155311584473, -1.477712631225586, -0.9710097312927246, -0.4643068313598633, 0.04239606857299805, 0.5490989685058594, 1.0558018684387207, 1.562504768371582, 2.0692076683044434, 2.5759105682373047, 3.082613468170166, 3.5893163681030273, 4.096019268035889, 4.60272216796875, 5.109425067901611, 5.616127967834473, 6.122830867767334, 6.629533767700195, 7.136236667633057, 7.642939567565918, 8.149642944335938, 8.65634536743164, 9.163047790527344, 9.669751167297363, 10.176454544067383, 10.683156967163086, 11.189859390258789, 11.696562767028809, 12.203266143798828, 12.709968566894531, 13.216670989990234, 13.723374366760254, 14.230077743530273, 14.736780166625977, 15.24348258972168, 15.7501859664917, 16.25688934326172, 16.763591766357422]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 8.0, 7.0, 11.0, 16.0, 16.0, 30.0, 49.0, 64.0, 98.0, 138.0, 207.0, 263.0, 416.0, 590.0, 856.0, 1280.0, 1799.0, 2509.0, 3825.0, 5784.0, 8598.0, 13086.0, 20376.0, 33094.0, 55176.0, 92360.0, 156194.0, 218395.0, 169619.0, 101678.0, 60311.0, 36651.0, 22562.0, 14188.0, 9243.0, 6034.0, 4110.0, 2810.0, 1861.0, 1242.0, 899.0, 612.0, 436.0, 306.0, 261.0, 141.0, 121.0, 69.0, 47.0, 43.0, 26.0, 19.0, 8.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0], "bins": [-24.09375, -23.3310546875, -22.568359375, -21.8056640625, -21.04296875, -20.2802734375, -19.517578125, -18.7548828125, -17.9921875, -17.2294921875, -16.466796875, -15.7041015625, -14.94140625, -14.1787109375, -13.416015625, -12.6533203125, -11.890625, -11.1279296875, -10.365234375, -9.6025390625, -8.83984375, -8.0771484375, -7.314453125, -6.5517578125, -5.7890625, -5.0263671875, -4.263671875, -3.5009765625, -2.73828125, -1.9755859375, -1.212890625, -0.4501953125, 0.3125, 1.0751953125, 1.837890625, 2.6005859375, 3.36328125, 4.1259765625, 4.888671875, 5.6513671875, 6.4140625, 7.1767578125, 7.939453125, 8.7021484375, 9.46484375, 10.2275390625, 10.990234375, 11.7529296875, 12.515625, 13.2783203125, 14.041015625, 14.8037109375, 15.56640625, 16.3291015625, 17.091796875, 17.8544921875, 18.6171875, 19.3798828125, 20.142578125, 20.9052734375, 21.66796875, 22.4306640625, 23.193359375, 23.9560546875, 24.71875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 3.0, 5.0, 4.0, 12.0, 9.0, 10.0, 17.0, 15.0, 19.0, 24.0, 20.0, 25.0, 30.0, 37.0, 32.0, 34.0, 38.0, 32.0, 47.0, 40.0, 48.0, 53.0, 43.0, 46.0, 32.0, 28.0, 33.0, 34.0, 29.0, 40.0, 20.0, 21.0, 16.0, 8.0, 15.0, 7.0, 14.0, 7.0, 8.0, 11.0, 10.0, 5.0, 3.0, 1.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.09375, -13.60546875, -13.1171875, -12.62890625, -12.140625, -11.65234375, -11.1640625, -10.67578125, -10.1875, -9.69921875, -9.2109375, -8.72265625, -8.234375, -7.74609375, -7.2578125, -6.76953125, -6.28125, -5.79296875, -5.3046875, -4.81640625, -4.328125, -3.83984375, -3.3515625, -2.86328125, -2.375, -1.88671875, -1.3984375, -0.91015625, -0.421875, 0.06640625, 0.5546875, 1.04296875, 1.53125, 2.01953125, 2.5078125, 2.99609375, 3.484375, 3.97265625, 4.4609375, 4.94921875, 5.4375, 5.92578125, 6.4140625, 6.90234375, 7.390625, 7.87890625, 8.3671875, 8.85546875, 9.34375, 9.83203125, 10.3203125, 10.80859375, 11.296875, 11.78515625, 12.2734375, 12.76171875, 13.25, 13.73828125, 14.2265625, 14.71484375, 15.203125, 15.69140625, 16.1796875, 16.66796875, 17.15625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 12.0, 17.0, 25.0, 32.0, 41.0, 61.0, 86.0, 120.0, 189.0, 292.0, 476.0, 722.0, 1116.0, 1607.0, 2758.0, 4496.0, 7549.0, 12888.0, 22985.0, 42117.0, 80661.0, 169902.0, 295626.0, 199904.0, 94368.0, 47836.0, 26152.0, 14639.0, 8508.0, 5072.0, 2999.0, 1895.0, 1125.0, 788.0, 501.0, 295.0, 199.0, 142.0, 90.0, 68.0, 53.0, 47.0, 26.0, 18.0, 10.0, 13.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-28.34375, -27.417724609375, -26.49169921875, -25.565673828125, -24.6396484375, -23.713623046875, -22.78759765625, -21.861572265625, -20.935546875, -20.009521484375, -19.08349609375, -18.157470703125, -17.2314453125, -16.305419921875, -15.37939453125, -14.453369140625, -13.52734375, -12.601318359375, -11.67529296875, -10.749267578125, -9.8232421875, -8.897216796875, -7.97119140625, -7.045166015625, -6.119140625, -5.193115234375, -4.26708984375, -3.341064453125, -2.4150390625, -1.489013671875, -0.56298828125, 0.363037109375, 1.2890625, 2.215087890625, 3.14111328125, 4.067138671875, 4.9931640625, 5.919189453125, 6.84521484375, 7.771240234375, 8.697265625, 9.623291015625, 10.54931640625, 11.475341796875, 12.4013671875, 13.327392578125, 14.25341796875, 15.179443359375, 16.10546875, 17.031494140625, 17.95751953125, 18.883544921875, 19.8095703125, 20.735595703125, 21.66162109375, 22.587646484375, 23.513671875, 24.439697265625, 25.36572265625, 26.291748046875, 27.2177734375, 28.143798828125, 29.06982421875, 29.995849609375, 30.921875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 9.0, 11.0, 17.0, 15.0, 21.0, 22.0, 22.0, 25.0, 22.0, 34.0, 39.0, 30.0, 47.0, 32.0, 39.0, 38.0, 34.0, 44.0, 38.0, 41.0, 30.0, 40.0, 29.0, 32.0, 24.0, 30.0, 24.0, 21.0, 28.0, 19.0, 21.0, 14.0, 14.0, 5.0, 11.0, 12.0, 8.0, 8.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.8907470703125, -9.578369140625, -9.2659912109375, -8.95361328125, -8.6412353515625, -8.328857421875, -8.0164794921875, -7.7041015625, -7.3917236328125, -7.079345703125, -6.7669677734375, -6.45458984375, -6.1422119140625, -5.829833984375, -5.5174560546875, -5.205078125, -4.8927001953125, -4.580322265625, -4.2679443359375, -3.95556640625, -3.6431884765625, -3.330810546875, -3.0184326171875, -2.7060546875, -2.3936767578125, -2.081298828125, -1.7689208984375, -1.45654296875, -1.1441650390625, -0.831787109375, -0.5194091796875, -0.20703125, 0.1053466796875, 0.417724609375, 0.7301025390625, 1.04248046875, 1.3548583984375, 1.667236328125, 1.9796142578125, 2.2919921875, 2.6043701171875, 2.916748046875, 3.2291259765625, 3.54150390625, 3.8538818359375, 4.166259765625, 4.4786376953125, 4.791015625, 5.1033935546875, 5.415771484375, 5.7281494140625, 6.04052734375, 6.3529052734375, 6.665283203125, 6.9776611328125, 7.2900390625, 7.6024169921875, 7.914794921875, 8.2271728515625, 8.53955078125, 8.8519287109375, 9.164306640625, 9.4766845703125, 9.7890625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 3.0, 9.0, 10.0, 14.0, 21.0, 28.0, 34.0, 48.0, 104.0, 119.0, 207.0, 268.0, 430.0, 735.0, 1118.0, 1797.0, 3302.0, 6097.0, 12726.0, 28803.0, 78195.0, 385852.0, 393992.0, 77688.0, 29482.0, 13068.0, 6316.0, 3246.0, 1767.0, 1068.0, 691.0, 411.0, 281.0, 198.0, 134.0, 92.0, 53.0, 41.0, 31.0, 29.0, 24.0, 3.0, 7.0, 3.0, 1.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.65625, -34.607666015625, -33.55908203125, -32.510498046875, -31.4619140625, -30.413330078125, -29.36474609375, -28.316162109375, -27.267578125, -26.218994140625, -25.17041015625, -24.121826171875, -23.0732421875, -22.024658203125, -20.97607421875, -19.927490234375, -18.87890625, -17.830322265625, -16.78173828125, -15.733154296875, -14.6845703125, -13.635986328125, -12.58740234375, -11.538818359375, -10.490234375, -9.441650390625, -8.39306640625, -7.344482421875, -6.2958984375, -5.247314453125, -4.19873046875, -3.150146484375, -2.1015625, -1.052978515625, -0.00439453125, 1.044189453125, 2.0927734375, 3.141357421875, 4.18994140625, 5.238525390625, 6.287109375, 7.335693359375, 8.38427734375, 9.432861328125, 10.4814453125, 11.530029296875, 12.57861328125, 13.627197265625, 14.67578125, 15.724365234375, 16.77294921875, 17.821533203125, 18.8701171875, 19.918701171875, 20.96728515625, 22.015869140625, 23.064453125, 24.113037109375, 25.16162109375, 26.210205078125, 27.2587890625, 28.307373046875, 29.35595703125, 30.404541015625, 31.453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 10.0, 13.0, 11.0, 29.0, 27.0, 25.0, 49.0, 62.0, 100.0, 104.0, 117.0, 99.0, 80.0, 53.0, 41.0, 51.0, 27.0, 19.0, 25.0, 9.0, 10.0, 7.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00165557861328125, -0.001608729362487793, -0.001561880111694336, -0.001515030860900879, -0.0014681816101074219, -0.0014213323593139648, -0.0013744831085205078, -0.0013276338577270508, -0.0012807846069335938, -0.0012339353561401367, -0.0011870861053466797, -0.0011402368545532227, -0.0010933876037597656, -0.0010465383529663086, -0.0009996891021728516, -0.0009528398513793945, -0.0009059906005859375, -0.0008591413497924805, -0.0008122920989990234, -0.0007654428482055664, -0.0007185935974121094, -0.0006717443466186523, -0.0006248950958251953, -0.0005780458450317383, -0.0005311965942382812, -0.0004843473434448242, -0.0004374980926513672, -0.00039064884185791016, -0.0003437995910644531, -0.0002969503402709961, -0.00025010108947753906, -0.00020325183868408203, -0.000156402587890625, -0.00010955333709716797, -6.270408630371094e-05, -1.5854835510253906e-05, 3.0994415283203125e-05, 7.784366607666016e-05, 0.0001246929168701172, 0.00017154216766357422, 0.00021839141845703125, 0.0002652406692504883, 0.0003120899200439453, 0.00035893917083740234, 0.0004057884216308594, 0.0004526376724243164, 0.0004994869232177734, 0.0005463361740112305, 0.0005931854248046875, 0.0006400346755981445, 0.0006868839263916016, 0.0007337331771850586, 0.0007805824279785156, 0.0008274316787719727, 0.0008742809295654297, 0.0009211301803588867, 0.0009679794311523438, 0.0010148286819458008, 0.0010616779327392578, 0.0011085271835327148, 0.0011553764343261719, 0.001202225685119629, 0.001249074935913086, 0.001295924186706543, 0.0013427734375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 14.0, 13.0, 20.0, 21.0, 35.0, 29.0, 70.0, 76.0, 129.0, 162.0, 240.0, 294.0, 547.0, 818.0, 1285.0, 2196.0, 3854.0, 7454.0, 16290.0, 42596.0, 170728.0, 600082.0, 134186.0, 37027.0, 14568.0, 6707.0, 3554.0, 2003.0, 1183.0, 782.0, 514.0, 312.0, 215.0, 148.0, 102.0, 82.0, 66.0, 49.0, 31.0, 23.0, 19.0, 3.0, 5.0, 1.0, 6.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0], "bins": [-30.21875, -29.341064453125, -28.46337890625, -27.585693359375, -26.7080078125, -25.830322265625, -24.95263671875, -24.074951171875, -23.197265625, -22.319580078125, -21.44189453125, -20.564208984375, -19.6865234375, -18.808837890625, -17.93115234375, -17.053466796875, -16.17578125, -15.298095703125, -14.42041015625, -13.542724609375, -12.6650390625, -11.787353515625, -10.90966796875, -10.031982421875, -9.154296875, -8.276611328125, -7.39892578125, -6.521240234375, -5.6435546875, -4.765869140625, -3.88818359375, -3.010498046875, -2.1328125, -1.255126953125, -0.37744140625, 0.500244140625, 1.3779296875, 2.255615234375, 3.13330078125, 4.010986328125, 4.888671875, 5.766357421875, 6.64404296875, 7.521728515625, 8.3994140625, 9.277099609375, 10.15478515625, 11.032470703125, 11.91015625, 12.787841796875, 13.66552734375, 14.543212890625, 15.4208984375, 16.298583984375, 17.17626953125, 18.053955078125, 18.931640625, 19.809326171875, 20.68701171875, 21.564697265625, 22.4423828125, 23.320068359375, 24.19775390625, 25.075439453125, 25.953125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 7.0, 16.0, 10.0, 14.0, 27.0, 30.0, 47.0, 57.0, 76.0, 112.0, 122.0, 99.0, 91.0, 67.0, 60.0, 39.0, 26.0, 17.0, 16.0, 8.0, 5.0, 10.0, 9.0, 0.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.37890625, -7.17645263671875, -6.9739990234375, -6.77154541015625, -6.569091796875, -6.36663818359375, -6.1641845703125, -5.96173095703125, -5.75927734375, -5.55682373046875, -5.3543701171875, -5.15191650390625, -4.949462890625, -4.74700927734375, -4.5445556640625, -4.34210205078125, -4.1396484375, -3.93719482421875, -3.7347412109375, -3.53228759765625, -3.329833984375, -3.12738037109375, -2.9249267578125, -2.72247314453125, -2.52001953125, -2.31756591796875, -2.1151123046875, -1.91265869140625, -1.710205078125, -1.50775146484375, -1.3052978515625, -1.10284423828125, -0.900390625, -0.69793701171875, -0.4954833984375, -0.29302978515625, -0.090576171875, 0.11187744140625, 0.3143310546875, 0.51678466796875, 0.71923828125, 0.92169189453125, 1.1241455078125, 1.32659912109375, 1.529052734375, 1.73150634765625, 1.9339599609375, 2.13641357421875, 2.3388671875, 2.54132080078125, 2.7437744140625, 2.94622802734375, 3.148681640625, 3.35113525390625, 3.5535888671875, 3.75604248046875, 3.95849609375, 4.16094970703125, 4.3634033203125, 4.56585693359375, 4.768310546875, 4.97076416015625, 5.1732177734375, 5.37567138671875, 5.578125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 6.0, 14.0, 24.0, 45.0, 74.0, 186.0, 282.0, 151.0, 76.0, 45.0, 23.0, 22.0, 14.0, 10.0, 8.0, 4.0, 3.0, 0.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.489105224609375, -54.691017150878906, -52.89292907714844, -51.09484100341797, -49.296749114990234, -47.498661041259766, -45.7005729675293, -43.90248489379883, -42.104393005371094, -40.306304931640625, -38.508216857910156, -36.71012878417969, -34.91203689575195, -33.113948822021484, -31.315860748291016, -29.517772674560547, -27.719684600830078, -25.92159652709961, -24.123506546020508, -22.32541847229004, -20.527328491210938, -18.72924041748047, -16.93115234375, -15.133063316345215, -13.33497428894043, -11.536885261535645, -9.73879623413086, -7.940708160400391, -6.1426191329956055, -4.34453010559082, -2.5464420318603516, -0.7483530044555664, 1.0497398376464844, 2.8478286266326904, 4.6459174156188965, 6.444005966186523, 8.242094993591309, 10.040184020996094, 11.838272094726562, 13.636361122131348, 15.434450149536133, 17.2325382232666, 19.030628204345703, 20.828716278076172, 22.62680435180664, 24.424894332885742, 26.22298240661621, 28.021072387695312, 29.81916046142578, 31.61724853515625, 33.41533660888672, 35.21342468261719, 37.01151657104492, 38.80960464477539, 40.60769271850586, 42.40578079223633, 44.20387268066406, 46.00196075439453, 47.800048828125, 49.59813690185547, 51.3962287902832, 53.19431686401367, 54.99240493774414, 56.79049301147461, 58.58858108520508]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 5.0, 5.0, 7.0, 5.0, 8.0, 11.0, 16.0, 21.0, 12.0, 32.0, 21.0, 25.0, 31.0, 35.0, 32.0, 41.0, 31.0, 31.0, 47.0, 50.0, 42.0, 50.0, 30.0, 42.0, 29.0, 28.0, 36.0, 33.0, 38.0, 29.0, 33.0, 21.0, 20.0, 15.0, 21.0, 9.0, 13.0, 5.0, 11.0, 6.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.24713134765625, -14.739377975463867, -14.2316255569458, -13.723873138427734, -13.216119766235352, -12.708366394042969, -12.200613975524902, -11.692861557006836, -11.185108184814453, -10.67735481262207, -10.169602394104004, -9.661849975585938, -9.154096603393555, -8.646343231201172, -8.138590812683105, -7.630837917327881, -7.123085021972656, -6.615332126617432, -6.107579231262207, -5.599826335906982, -5.092073440551758, -4.584320545196533, -4.076567649841309, -3.568814754486084, -3.0610618591308594, -2.5533089637756348, -2.04555606842041, -1.5378031730651855, -1.030050277709961, -0.5222973823547363, -0.014544486999511719, 0.4932084083557129, 1.0009613037109375, 1.508714199066162, 2.0164670944213867, 2.5242199897766113, 3.031972885131836, 3.5397257804870605, 4.047478675842285, 4.55523157119751, 5.062984466552734, 5.570737361907959, 6.078490257263184, 6.586243152618408, 7.093996047973633, 7.601748943328857, 8.109501838684082, 8.617254257202148, 9.125007629394531, 9.632761001586914, 10.14051342010498, 10.648265838623047, 11.15601921081543, 11.663772583007812, 12.171525001525879, 12.679277420043945, 13.187030792236328, 13.694784164428711, 14.202536582946777, 14.710289001464844, 15.218042373657227, 15.72579574584961, 16.23354721069336, 16.741300582885742, 17.249053955078125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 14.0, 15.0, 17.0, 46.0, 62.0, 104.0, 161.0, 230.0, 349.0, 585.0, 885.0, 1403.0, 2187.0, 3528.0, 5644.0, 9444.0, 16059.0, 28261.0, 54269.0, 113868.0, 295831.0, 1351047.0, 1706739.0, 344915.0, 123384.0, 57427.0, 30385.0, 17518.0, 10415.0, 6713.0, 4259.0, 2761.0, 1860.0, 1261.0, 845.0, 567.0, 389.0, 256.0, 185.0, 122.0, 91.0, 54.0, 40.0, 29.0, 15.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.440673828125, -23.60009765625, -22.759521484375, -21.9189453125, -21.078369140625, -20.23779296875, -19.397216796875, -18.556640625, -17.716064453125, -16.87548828125, -16.034912109375, -15.1943359375, -14.353759765625, -13.51318359375, -12.672607421875, -11.83203125, -10.991455078125, -10.15087890625, -9.310302734375, -8.4697265625, -7.629150390625, -6.78857421875, -5.947998046875, -5.107421875, -4.266845703125, -3.42626953125, -2.585693359375, -1.7451171875, -0.904541015625, -0.06396484375, 0.776611328125, 1.6171875, 2.457763671875, 3.29833984375, 4.138916015625, 4.9794921875, 5.820068359375, 6.66064453125, 7.501220703125, 8.341796875, 9.182373046875, 10.02294921875, 10.863525390625, 11.7041015625, 12.544677734375, 13.38525390625, 14.225830078125, 15.06640625, 15.906982421875, 16.74755859375, 17.588134765625, 18.4287109375, 19.269287109375, 20.10986328125, 20.950439453125, 21.791015625, 22.631591796875, 23.47216796875, 24.312744140625, 25.1533203125, 25.993896484375, 26.83447265625, 27.675048828125, 28.515625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 6.0, 5.0, 11.0, 17.0, 20.0, 12.0, 22.0, 23.0, 23.0, 22.0, 32.0, 38.0, 29.0, 47.0, 40.0, 49.0, 60.0, 54.0, 56.0, 24.0, 31.0, 38.0, 35.0, 36.0, 40.0, 30.0, 28.0, 21.0, 23.0, 23.0, 20.0, 14.0, 8.0, 11.0, 13.0, 8.0, 3.0, 1.0, 4.0, 6.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.3792724609375, -8.071044921875, -7.7628173828125, -7.45458984375, -7.1463623046875, -6.838134765625, -6.5299072265625, -6.2216796875, -5.9134521484375, -5.605224609375, -5.2969970703125, -4.98876953125, -4.6805419921875, -4.372314453125, -4.0640869140625, -3.755859375, -3.4476318359375, -3.139404296875, -2.8311767578125, -2.52294921875, -2.2147216796875, -1.906494140625, -1.5982666015625, -1.2900390625, -0.9818115234375, -0.673583984375, -0.3653564453125, -0.05712890625, 0.2510986328125, 0.559326171875, 0.8675537109375, 1.17578125, 1.4840087890625, 1.792236328125, 2.1004638671875, 2.40869140625, 2.7169189453125, 3.025146484375, 3.3333740234375, 3.6416015625, 3.9498291015625, 4.258056640625, 4.5662841796875, 4.87451171875, 5.1827392578125, 5.490966796875, 5.7991943359375, 6.107421875, 6.4156494140625, 6.723876953125, 7.0321044921875, 7.34033203125, 7.6485595703125, 7.956787109375, 8.2650146484375, 8.5732421875, 8.8814697265625, 9.189697265625, 9.4979248046875, 9.80615234375, 10.1143798828125, 10.422607421875, 10.7308349609375, 11.0390625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 6.0, 14.0, 17.0, 26.0, 54.0, 53.0, 91.0, 146.0, 191.0, 288.0, 403.0, 641.0, 1013.0, 1737.0, 2722.0, 4422.0, 7605.0, 13372.0, 25937.0, 52547.0, 125394.0, 365868.0, 1585128.0, 1441361.0, 340030.0, 118133.0, 50543.0, 24616.0, 12974.0, 7368.0, 4351.0, 2708.0, 1626.0, 970.0, 657.0, 429.0, 257.0, 181.0, 131.0, 89.0, 54.0, 35.0, 33.0, 13.0, 14.0, 9.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.953125, -23.1796875, -22.40625, -21.6328125, -20.859375, -20.0859375, -19.3125, -18.5390625, -17.765625, -16.9921875, -16.21875, -15.4453125, -14.671875, -13.8984375, -13.125, -12.3515625, -11.578125, -10.8046875, -10.03125, -9.2578125, -8.484375, -7.7109375, -6.9375, -6.1640625, -5.390625, -4.6171875, -3.84375, -3.0703125, -2.296875, -1.5234375, -0.75, 0.0234375, 0.796875, 1.5703125, 2.34375, 3.1171875, 3.890625, 4.6640625, 5.4375, 6.2109375, 6.984375, 7.7578125, 8.53125, 9.3046875, 10.078125, 10.8515625, 11.625, 12.3984375, 13.171875, 13.9453125, 14.71875, 15.4921875, 16.265625, 17.0390625, 17.8125, 18.5859375, 19.359375, 20.1328125, 20.90625, 21.6796875, 22.453125, 23.2265625, 24.0, 24.7734375, 25.546875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 5.0, 7.0, 12.0, 15.0, 21.0, 24.0, 32.0, 38.0, 50.0, 69.0, 75.0, 119.0, 144.0, 181.0, 235.0, 300.0, 348.0, 378.0, 396.0, 350.0, 276.0, 208.0, 168.0, 127.0, 111.0, 82.0, 50.0, 48.0, 41.0, 28.0, 30.0, 22.0, 14.0, 17.0, 10.0, 12.0, 8.0, 2.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21484375, -6.020263671875, -5.82568359375, -5.631103515625, -5.4365234375, -5.241943359375, -5.04736328125, -4.852783203125, -4.658203125, -4.463623046875, -4.26904296875, -4.074462890625, -3.8798828125, -3.685302734375, -3.49072265625, -3.296142578125, -3.1015625, -2.906982421875, -2.71240234375, -2.517822265625, -2.3232421875, -2.128662109375, -1.93408203125, -1.739501953125, -1.544921875, -1.350341796875, -1.15576171875, -0.961181640625, -0.7666015625, -0.572021484375, -0.37744140625, -0.182861328125, 0.01171875, 0.206298828125, 0.40087890625, 0.595458984375, 0.7900390625, 0.984619140625, 1.17919921875, 1.373779296875, 1.568359375, 1.762939453125, 1.95751953125, 2.152099609375, 2.3466796875, 2.541259765625, 2.73583984375, 2.930419921875, 3.125, 3.319580078125, 3.51416015625, 3.708740234375, 3.9033203125, 4.097900390625, 4.29248046875, 4.487060546875, 4.681640625, 4.876220703125, 5.07080078125, 5.265380859375, 5.4599609375, 5.654541015625, 5.84912109375, 6.043701171875, 6.23828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 9.0, 13.0, 18.0, 36.0, 60.0, 74.0, 160.0, 183.0, 168.0, 102.0, 61.0, 25.0, 27.0, 13.0, 11.0, 8.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.13579559326172, -31.24021339416504, -30.344633102416992, -29.449050903320312, -28.553468704223633, -27.657886505126953, -26.762306213378906, -25.866724014282227, -24.971141815185547, -24.075559616088867, -23.17997932434082, -22.28439712524414, -21.38881492614746, -20.49323272705078, -19.597652435302734, -18.702070236206055, -17.806489944458008, -16.910907745361328, -16.01532745361328, -15.119745254516602, -14.224163055419922, -13.328581809997559, -12.433000564575195, -11.537418365478516, -10.641837120056152, -9.746255874633789, -8.85067367553711, -7.955092430114746, -7.059510707855225, -6.163928985595703, -5.26834774017334, -4.372766017913818, -3.4771862030029297, -2.581604480743408, -1.6860229969024658, -0.7904415130615234, 0.10514020919799805, 1.0007219314575195, 1.8963031768798828, 2.7918848991394043, 3.687466621398926, 4.583048343658447, 5.478630065917969, 6.374211311340332, 7.2697930335998535, 8.165374755859375, 9.060956001281738, 9.956537246704102, 10.852119445800781, 11.747700691223145, 12.643282890319824, 13.538864135742188, 14.434446334838867, 15.33002758026123, 16.225608825683594, 17.121191024780273, 18.016773223876953, 18.912355422973633, 19.80793571472168, 20.70351791381836, 21.59910011291504, 22.49468231201172, 23.390262603759766, 24.285844802856445, 25.181425094604492]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 8.0, 10.0, 7.0, 7.0, 13.0, 17.0, 14.0, 19.0, 18.0, 34.0, 24.0, 34.0, 33.0, 38.0, 34.0, 45.0, 52.0, 55.0, 48.0, 39.0, 41.0, 40.0, 51.0, 47.0, 33.0, 37.0, 19.0, 26.0, 28.0, 24.0, 17.0, 21.0, 10.0, 16.0, 8.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.64921760559082, -10.291535377502441, -9.933853149414062, -9.576170921325684, -9.218488693237305, -8.860806465148926, -8.503124237060547, -8.145441055297852, -7.787759304046631, -7.430077075958252, -7.072394847869873, -6.714712142944336, -6.357029914855957, -5.999347686767578, -5.641665458679199, -5.28398323059082, -4.926301002502441, -4.5686187744140625, -4.210936546325684, -3.8532540798187256, -3.4955718517303467, -3.1378896236419678, -2.7802071571350098, -2.422524929046631, -2.064842700958252, -1.707160472869873, -1.3494781255722046, -0.9917957782745361, -0.6341135501861572, -0.2764313220977783, 0.08125114440917969, 0.4389333724975586, 0.7966146469116211, 1.154296875, 1.5119792222976685, 1.869661569595337, 2.227343797683716, 2.5850260257720947, 2.9427084922790527, 3.3003907203674316, 3.6580729484558105, 4.0157551765441895, 4.373437404632568, 4.7311201095581055, 5.088802337646484, 5.446484565734863, 5.804166793823242, 6.161849021911621, 6.51953125, 6.877213478088379, 7.234895706176758, 7.592577934265137, 7.950260162353516, 8.307942390441895, 8.665624618530273, 9.023307800292969, 9.380989074707031, 9.73867130279541, 10.096353530883789, 10.454035758972168, 10.811717987060547, 11.169400215148926, 11.527082443237305, 11.884765625, 12.242447853088379]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 11.0, 9.0, 17.0, 30.0, 37.0, 49.0, 88.0, 123.0, 181.0, 269.0, 419.0, 627.0, 1015.0, 1698.0, 2766.0, 4816.0, 8376.0, 15522.0, 30631.0, 65618.0, 162053.0, 408160.0, 195677.0, 75701.0, 34639.0, 17227.0, 9451.0, 5274.0, 2995.0, 1903.0, 1140.0, 730.0, 439.0, 290.0, 190.0, 115.0, 81.0, 62.0, 41.0, 29.0, 18.0, 9.0, 6.0, 5.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.1328125, -11.760498046875, -11.38818359375, -11.015869140625, -10.6435546875, -10.271240234375, -9.89892578125, -9.526611328125, -9.154296875, -8.781982421875, -8.40966796875, -8.037353515625, -7.6650390625, -7.292724609375, -6.92041015625, -6.548095703125, -6.17578125, -5.803466796875, -5.43115234375, -5.058837890625, -4.6865234375, -4.314208984375, -3.94189453125, -3.569580078125, -3.197265625, -2.824951171875, -2.45263671875, -2.080322265625, -1.7080078125, -1.335693359375, -0.96337890625, -0.591064453125, -0.21875, 0.153564453125, 0.52587890625, 0.898193359375, 1.2705078125, 1.642822265625, 2.01513671875, 2.387451171875, 2.759765625, 3.132080078125, 3.50439453125, 3.876708984375, 4.2490234375, 4.621337890625, 4.99365234375, 5.365966796875, 5.73828125, 6.110595703125, 6.48291015625, 6.855224609375, 7.2275390625, 7.599853515625, 7.97216796875, 8.344482421875, 8.716796875, 9.089111328125, 9.46142578125, 9.833740234375, 10.2060546875, 10.578369140625, 10.95068359375, 11.322998046875, 11.6953125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 7.0, 15.0, 13.0, 11.0, 29.0, 25.0, 29.0, 30.0, 37.0, 33.0, 36.0, 27.0, 42.0, 45.0, 56.0, 52.0, 45.0, 50.0, 44.0, 52.0, 38.0, 36.0, 35.0, 27.0, 23.0, 18.0, 19.0, 26.0, 14.0, 13.0, 9.0, 12.0, 4.0, 6.0, 12.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.597412109375, -10.24169921875, -9.885986328125, -9.5302734375, -9.174560546875, -8.81884765625, -8.463134765625, -8.107421875, -7.751708984375, -7.39599609375, -7.040283203125, -6.6845703125, -6.328857421875, -5.97314453125, -5.617431640625, -5.26171875, -4.906005859375, -4.55029296875, -4.194580078125, -3.8388671875, -3.483154296875, -3.12744140625, -2.771728515625, -2.416015625, -2.060302734375, -1.70458984375, -1.348876953125, -0.9931640625, -0.637451171875, -0.28173828125, 0.073974609375, 0.4296875, 0.785400390625, 1.14111328125, 1.496826171875, 1.8525390625, 2.208251953125, 2.56396484375, 2.919677734375, 3.275390625, 3.631103515625, 3.98681640625, 4.342529296875, 4.6982421875, 5.053955078125, 5.40966796875, 5.765380859375, 6.12109375, 6.476806640625, 6.83251953125, 7.188232421875, 7.5439453125, 7.899658203125, 8.25537109375, 8.611083984375, 8.966796875, 9.322509765625, 9.67822265625, 10.033935546875, 10.3896484375, 10.745361328125, 11.10107421875, 11.456787109375, 11.8125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 7.0, 11.0, 4.0, 13.0, 27.0, 30.0, 45.0, 68.0, 80.0, 150.0, 201.0, 290.0, 455.0, 700.0, 1045.0, 1675.0, 2843.0, 4881.0, 8826.0, 19038.0, 57179.0, 470535.0, 389048.0, 52570.0, 18043.0, 8601.0, 4746.0, 2785.0, 1623.0, 1002.0, 680.0, 422.0, 295.0, 196.0, 135.0, 95.0, 56.0, 40.0, 43.0, 22.0, 17.0, 7.0, 12.0, 2.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -18.04638671875, -17.4990234375, -16.95166015625, -16.404296875, -15.85693359375, -15.3095703125, -14.76220703125, -14.21484375, -13.66748046875, -13.1201171875, -12.57275390625, -12.025390625, -11.47802734375, -10.9306640625, -10.38330078125, -9.8359375, -9.28857421875, -8.7412109375, -8.19384765625, -7.646484375, -7.09912109375, -6.5517578125, -6.00439453125, -5.45703125, -4.90966796875, -4.3623046875, -3.81494140625, -3.267578125, -2.72021484375, -2.1728515625, -1.62548828125, -1.078125, -0.53076171875, 0.0166015625, 0.56396484375, 1.111328125, 1.65869140625, 2.2060546875, 2.75341796875, 3.30078125, 3.84814453125, 4.3955078125, 4.94287109375, 5.490234375, 6.03759765625, 6.5849609375, 7.13232421875, 7.6796875, 8.22705078125, 8.7744140625, 9.32177734375, 9.869140625, 10.41650390625, 10.9638671875, 11.51123046875, 12.05859375, 12.60595703125, 13.1533203125, 13.70068359375, 14.248046875, 14.79541015625, 15.3427734375, 15.89013671875, 16.4375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 11.0, 12.0, 14.0, 19.0, 19.0, 27.0, 14.0, 30.0, 35.0, 42.0, 53.0, 40.0, 40.0, 52.0, 39.0, 57.0, 61.0, 53.0, 58.0, 46.0, 41.0, 33.0, 32.0, 24.0, 32.0, 24.0, 20.0, 18.0, 16.0, 8.0, 4.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.963623046875, -7.70068359375, -7.437744140625, -7.1748046875, -6.911865234375, -6.64892578125, -6.385986328125, -6.123046875, -5.860107421875, -5.59716796875, -5.334228515625, -5.0712890625, -4.808349609375, -4.54541015625, -4.282470703125, -4.01953125, -3.756591796875, -3.49365234375, -3.230712890625, -2.9677734375, -2.704833984375, -2.44189453125, -2.178955078125, -1.916015625, -1.653076171875, -1.39013671875, -1.127197265625, -0.8642578125, -0.601318359375, -0.33837890625, -0.075439453125, 0.1875, 0.450439453125, 0.71337890625, 0.976318359375, 1.2392578125, 1.502197265625, 1.76513671875, 2.028076171875, 2.291015625, 2.553955078125, 2.81689453125, 3.079833984375, 3.3427734375, 3.605712890625, 3.86865234375, 4.131591796875, 4.39453125, 4.657470703125, 4.92041015625, 5.183349609375, 5.4462890625, 5.709228515625, 5.97216796875, 6.235107421875, 6.498046875, 6.760986328125, 7.02392578125, 7.286865234375, 7.5498046875, 7.812744140625, 8.07568359375, 8.338623046875, 8.6015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 6.0, 1.0, 3.0, 8.0, 10.0, 8.0, 14.0, 29.0, 29.0, 27.0, 53.0, 64.0, 108.0, 122.0, 176.0, 286.0, 443.0, 606.0, 914.0, 1406.0, 2322.0, 3689.0, 6589.0, 13571.0, 34996.0, 160650.0, 677451.0, 93475.0, 26079.0, 10898.0, 5509.0, 3310.0, 1930.0, 1214.0, 787.0, 575.0, 364.0, 237.0, 179.0, 121.0, 70.0, 64.0, 60.0, 32.0, 26.0, 16.0, 8.0, 7.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.4091796875, -1.362762451171875, -1.31634521484375, -1.269927978515625, -1.2235107421875, -1.177093505859375, -1.13067626953125, -1.084259033203125, -1.037841796875, -0.991424560546875, -0.94500732421875, -0.898590087890625, -0.8521728515625, -0.805755615234375, -0.75933837890625, -0.712921142578125, -0.66650390625, -0.620086669921875, -0.57366943359375, -0.527252197265625, -0.4808349609375, -0.434417724609375, -0.38800048828125, -0.341583251953125, -0.295166015625, -0.248748779296875, -0.20233154296875, -0.155914306640625, -0.1094970703125, -0.063079833984375, -0.01666259765625, 0.029754638671875, 0.076171875, 0.122589111328125, 0.16900634765625, 0.215423583984375, 0.2618408203125, 0.308258056640625, 0.35467529296875, 0.401092529296875, 0.447509765625, 0.493927001953125, 0.54034423828125, 0.586761474609375, 0.6331787109375, 0.679595947265625, 0.72601318359375, 0.772430419921875, 0.81884765625, 0.865264892578125, 0.91168212890625, 0.958099365234375, 1.0045166015625, 1.050933837890625, 1.09735107421875, 1.143768310546875, 1.190185546875, 1.236602783203125, 1.28302001953125, 1.329437255859375, 1.3758544921875, 1.422271728515625, 1.46868896484375, 1.515106201171875, 1.5615234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 4.0, 3.0, 4.0, 7.0, 3.0, 10.0, 11.0, 10.0, 30.0, 29.0, 40.0, 52.0, 73.0, 100.0, 148.0, 140.0, 91.0, 55.0, 48.0, 34.0, 23.0, 20.0, 12.0, 8.0, 6.0, 14.0, 4.0, 5.0, 8.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016510486602783203, -0.00015934742987155914, -0.00015358999371528625, -0.00014783255755901337, -0.00014207512140274048, -0.0001363176852464676, -0.0001305602490901947, -0.00012480281293392181, -0.00011904537677764893, -0.00011328794062137604, -0.00010753050446510315, -0.00010177306830883026, -9.601563215255737e-05, -9.025819599628448e-05, -8.45007598400116e-05, -7.874332368373871e-05, -7.298588752746582e-05, -6.722845137119293e-05, -6.147101521492004e-05, -5.5713579058647156e-05, -4.995614290237427e-05, -4.419870674610138e-05, -3.844127058982849e-05, -3.26838344335556e-05, -2.6926398277282715e-05, -2.1168962121009827e-05, -1.541152596473694e-05, -9.65408980846405e-06, -3.896653652191162e-06, 1.860782504081726e-06, 7.618218660354614e-06, 1.3375654816627502e-05, 1.913309097290039e-05, 2.489052712917328e-05, 3.064796328544617e-05, 3.6405399441719055e-05, 4.216283559799194e-05, 4.792027175426483e-05, 5.367770791053772e-05, 5.943514406681061e-05, 6.51925802230835e-05, 7.095001637935638e-05, 7.670745253562927e-05, 8.246488869190216e-05, 8.822232484817505e-05, 9.397976100444794e-05, 9.973719716072083e-05, 0.00010549463331699371, 0.0001112520694732666, 0.00011700950562953949, 0.00012276694178581238, 0.00012852437794208527, 0.00013428181409835815, 0.00014003925025463104, 0.00014579668641090393, 0.00015155412256717682, 0.0001573115587234497, 0.0001630689948797226, 0.00016882643103599548, 0.00017458386719226837, 0.00018034130334854126, 0.00018609873950481415, 0.00019185617566108704, 0.00019761361181735992, 0.0002033710479736328]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 9.0, 10.0, 8.0, 14.0, 30.0, 37.0, 56.0, 75.0, 140.0, 189.0, 340.0, 455.0, 688.0, 1144.0, 1860.0, 2968.0, 5498.0, 10564.0, 22848.0, 58716.0, 253352.0, 538668.0, 89852.0, 30715.0, 13693.0, 6838.0, 3897.0, 2259.0, 1346.0, 794.0, 491.0, 299.0, 210.0, 133.0, 118.0, 72.0, 54.0, 29.0, 34.0, 17.0, 11.0, 9.0, 4.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.107421875, -2.0457611083984375, -1.984100341796875, -1.9224395751953125, -1.86077880859375, -1.7991180419921875, -1.737457275390625, -1.6757965087890625, -1.6141357421875, -1.5524749755859375, -1.490814208984375, -1.4291534423828125, -1.36749267578125, -1.3058319091796875, -1.244171142578125, -1.1825103759765625, -1.120849609375, -1.0591888427734375, -0.997528076171875, -0.9358673095703125, -0.87420654296875, -0.8125457763671875, -0.750885009765625, -0.6892242431640625, -0.6275634765625, -0.5659027099609375, -0.504241943359375, -0.4425811767578125, -0.38092041015625, -0.3192596435546875, -0.257598876953125, -0.1959381103515625, -0.13427734375, -0.0726165771484375, -0.010955810546875, 0.0507049560546875, 0.11236572265625, 0.1740264892578125, 0.235687255859375, 0.2973480224609375, 0.3590087890625, 0.4206695556640625, 0.482330322265625, 0.5439910888671875, 0.60565185546875, 0.6673126220703125, 0.728973388671875, 0.7906341552734375, 0.852294921875, 0.9139556884765625, 0.975616455078125, 1.0372772216796875, 1.09893798828125, 1.1605987548828125, 1.222259521484375, 1.2839202880859375, 1.3455810546875, 1.4072418212890625, 1.468902587890625, 1.5305633544921875, 1.59222412109375, 1.6538848876953125, 1.715545654296875, 1.7772064208984375, 1.8388671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 5.0, 9.0, 9.0, 13.0, 26.0, 13.0, 31.0, 44.0, 55.0, 90.0, 87.0, 123.0, 118.0, 88.0, 55.0, 44.0, 29.0, 26.0, 19.0, 14.0, 12.0, 14.0, 12.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.37109375, -0.3590431213378906, -0.34699249267578125, -0.3349418640136719, -0.3228912353515625, -0.3108406066894531, -0.29878997802734375, -0.2867393493652344, -0.274688720703125, -0.2626380920410156, -0.25058746337890625, -0.23853683471679688, -0.2264862060546875, -0.21443557739257812, -0.20238494873046875, -0.19033432006835938, -0.17828369140625, -0.16623306274414062, -0.15418243408203125, -0.14213180541992188, -0.1300811767578125, -0.11803054809570312, -0.10597991943359375, -0.09392929077148438, -0.081878662109375, -0.06982803344726562, -0.05777740478515625, -0.045726776123046875, -0.0336761474609375, -0.021625518798828125, -0.00957489013671875, 0.002475738525390625, 0.0145263671875, 0.026576995849609375, 0.03862762451171875, 0.050678253173828125, 0.0627288818359375, 0.07477951049804688, 0.08683013916015625, 0.09888076782226562, 0.110931396484375, 0.12298202514648438, 0.13503265380859375, 0.14708328247070312, 0.1591339111328125, 0.17118453979492188, 0.18323516845703125, 0.19528579711914062, 0.20733642578125, 0.21938705444335938, 0.23143768310546875, 0.24348831176757812, 0.2555389404296875, 0.2675895690917969, 0.27964019775390625, 0.2916908264160156, 0.303741455078125, 0.3157920837402344, 0.32784271240234375, 0.3398933410644531, 0.3519439697265625, 0.3639945983886719, 0.37604522705078125, 0.3880958557128906, 0.400146484375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 11.0, 13.0, 24.0, 37.0, 63.0, 111.0, 163.0, 190.0, 143.0, 88.0, 47.0, 24.0, 21.0, 15.0, 9.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.92591667175293, -28.085140228271484, -27.24436378479004, -26.403587341308594, -25.56281089782715, -24.722034454345703, -23.881258010864258, -23.040481567382812, -22.199705123901367, -21.358928680419922, -20.518152236938477, -19.67737579345703, -18.836599349975586, -17.99582290649414, -17.155046463012695, -16.31427001953125, -15.473494529724121, -14.632718086242676, -13.79194164276123, -12.951165199279785, -12.11038875579834, -11.269613265991211, -10.428836822509766, -9.58806037902832, -8.747283935546875, -7.90650749206543, -7.065731048583984, -6.224954605102539, -5.384178161621094, -4.543402194976807, -3.7026257514953613, -2.861849308013916, -2.0210723876953125, -1.1802959442138672, -0.3395196199417114, 0.5012567043304443, 1.3420331478118896, 2.182809352874756, 3.023585796356201, 3.8643622398376465, 4.705138683319092, 5.545915126800537, 6.386691570281982, 7.2274675369262695, 8.068243980407715, 8.90902042388916, 9.749796867370605, 10.59057331085205, 11.431349754333496, 12.272126197814941, 13.112902641296387, 13.953679084777832, 14.794455528259277, 15.635231018066406, 16.47600746154785, 17.316783905029297, 18.157560348510742, 18.998336791992188, 19.839113235473633, 20.679889678955078, 21.520666122436523, 22.36144256591797, 23.202219009399414, 24.04299545288086, 24.883771896362305]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 8.0, 7.0, 5.0, 14.0, 19.0, 13.0, 21.0, 19.0, 30.0, 33.0, 30.0, 27.0, 46.0, 35.0, 43.0, 50.0, 58.0, 45.0, 39.0, 40.0, 41.0, 53.0, 40.0, 31.0, 45.0, 19.0, 26.0, 28.0, 20.0, 21.0, 16.0, 11.0, 15.0, 5.0, 11.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.068840980529785, -9.730722427368164, -9.39260482788086, -9.054487228393555, -8.716368675231934, -8.378250122070312, -8.040132522583008, -7.702014446258545, -7.363896369934082, -7.025778293609619, -6.687660217285156, -6.349542140960693, -6.0114240646362305, -5.673305988311768, -5.335187911987305, -4.997069835662842, -4.658951759338379, -4.320833683013916, -3.982715606689453, -3.6445975303649902, -3.3064794540405273, -2.9683613777160645, -2.6302433013916016, -2.2921252250671387, -1.9540071487426758, -1.615889072418213, -1.27777099609375, -0.9396529197692871, -0.6015348434448242, -0.26341676712036133, 0.07470130920410156, 0.41281938552856445, 0.7509374618530273, 1.0890555381774902, 1.4271736145019531, 1.765291690826416, 2.103409767150879, 2.441527843475342, 2.7796459197998047, 3.1177639961242676, 3.4558820724487305, 3.7940001487731934, 4.132118225097656, 4.470236301422119, 4.808354377746582, 5.146472454071045, 5.484590530395508, 5.822708606719971, 6.160826683044434, 6.4989447593688965, 6.837062835693359, 7.175180912017822, 7.513298988342285, 7.851417064666748, 8.189535140991211, 8.527652740478516, 8.865771293640137, 9.203889846801758, 9.542007446289062, 9.880125045776367, 10.218243598937988, 10.55636215209961, 10.894479751586914, 11.232597351074219, 11.57071590423584]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 9.0, 13.0, 18.0, 17.0, 35.0, 40.0, 76.0, 107.0, 135.0, 185.0, 328.0, 449.0, 657.0, 1033.0, 1540.0, 2530.0, 3907.0, 6403.0, 10764.0, 18591.0, 33235.0, 61526.0, 119096.0, 232087.0, 257294.0, 136919.0, 70737.0, 38407.0, 20730.0, 12127.0, 7158.0, 4509.0, 2782.0, 1657.0, 1082.0, 749.0, 499.0, 346.0, 219.0, 145.0, 110.0, 86.0, 72.0, 37.0, 36.0, 23.0, 21.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-18.703125, -18.13818359375, -17.5732421875, -17.00830078125, -16.443359375, -15.87841796875, -15.3134765625, -14.74853515625, -14.18359375, -13.61865234375, -13.0537109375, -12.48876953125, -11.923828125, -11.35888671875, -10.7939453125, -10.22900390625, -9.6640625, -9.09912109375, -8.5341796875, -7.96923828125, -7.404296875, -6.83935546875, -6.2744140625, -5.70947265625, -5.14453125, -4.57958984375, -4.0146484375, -3.44970703125, -2.884765625, -2.31982421875, -1.7548828125, -1.18994140625, -0.625, -0.06005859375, 0.5048828125, 1.06982421875, 1.634765625, 2.19970703125, 2.7646484375, 3.32958984375, 3.89453125, 4.45947265625, 5.0244140625, 5.58935546875, 6.154296875, 6.71923828125, 7.2841796875, 7.84912109375, 8.4140625, 8.97900390625, 9.5439453125, 10.10888671875, 10.673828125, 11.23876953125, 11.8037109375, 12.36865234375, 12.93359375, 13.49853515625, 14.0634765625, 14.62841796875, 15.193359375, 15.75830078125, 16.3232421875, 16.88818359375, 17.453125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 4.0, 4.0, 3.0, 3.0, 14.0, 8.0, 17.0, 12.0, 21.0, 25.0, 22.0, 34.0, 24.0, 46.0, 33.0, 43.0, 41.0, 46.0, 59.0, 52.0, 47.0, 57.0, 34.0, 46.0, 36.0, 24.0, 36.0, 35.0, 25.0, 36.0, 23.0, 19.0, 15.0, 5.0, 9.0, 6.0, 7.0, 3.0, 12.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.5614013671875, -8.263427734375, -7.9654541015625, -7.66748046875, -7.3695068359375, -7.071533203125, -6.7735595703125, -6.4755859375, -6.1776123046875, -5.879638671875, -5.5816650390625, -5.28369140625, -4.9857177734375, -4.687744140625, -4.3897705078125, -4.091796875, -3.7938232421875, -3.495849609375, -3.1978759765625, -2.89990234375, -2.6019287109375, -2.303955078125, -2.0059814453125, -1.7080078125, -1.4100341796875, -1.112060546875, -0.8140869140625, -0.51611328125, -0.2181396484375, 0.079833984375, 0.3778076171875, 0.67578125, 0.9737548828125, 1.271728515625, 1.5697021484375, 1.86767578125, 2.1656494140625, 2.463623046875, 2.7615966796875, 3.0595703125, 3.3575439453125, 3.655517578125, 3.9534912109375, 4.25146484375, 4.5494384765625, 4.847412109375, 5.1453857421875, 5.443359375, 5.7413330078125, 6.039306640625, 6.3372802734375, 6.63525390625, 6.9332275390625, 7.231201171875, 7.5291748046875, 7.8271484375, 8.1251220703125, 8.423095703125, 8.7210693359375, 9.01904296875, 9.3170166015625, 9.614990234375, 9.9129638671875, 10.2109375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 11.0, 9.0, 6.0, 11.0, 32.0, 29.0, 41.0, 49.0, 74.0, 141.0, 181.0, 257.0, 406.0, 545.0, 884.0, 1426.0, 2266.0, 3842.0, 6517.0, 11582.0, 20930.0, 40549.0, 85653.0, 192179.0, 320458.0, 188117.0, 84051.0, 40052.0, 20704.0, 11051.0, 6293.0, 3740.0, 2355.0, 1483.0, 879.0, 611.0, 350.0, 259.0, 165.0, 103.0, 96.0, 48.0, 32.0, 32.0, 28.0, 13.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.197998046875, -16.61474609375, -16.031494140625, -15.4482421875, -14.864990234375, -14.28173828125, -13.698486328125, -13.115234375, -12.531982421875, -11.94873046875, -11.365478515625, -10.7822265625, -10.198974609375, -9.61572265625, -9.032470703125, -8.44921875, -7.865966796875, -7.28271484375, -6.699462890625, -6.1162109375, -5.532958984375, -4.94970703125, -4.366455078125, -3.783203125, -3.199951171875, -2.61669921875, -2.033447265625, -1.4501953125, -0.866943359375, -0.28369140625, 0.299560546875, 0.8828125, 1.466064453125, 2.04931640625, 2.632568359375, 3.2158203125, 3.799072265625, 4.38232421875, 4.965576171875, 5.548828125, 6.132080078125, 6.71533203125, 7.298583984375, 7.8818359375, 8.465087890625, 9.04833984375, 9.631591796875, 10.21484375, 10.798095703125, 11.38134765625, 11.964599609375, 12.5478515625, 13.131103515625, 13.71435546875, 14.297607421875, 14.880859375, 15.464111328125, 16.04736328125, 16.630615234375, 17.2138671875, 17.797119140625, 18.38037109375, 18.963623046875, 19.546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 13.0, 10.0, 9.0, 11.0, 15.0, 18.0, 25.0, 20.0, 19.0, 28.0, 29.0, 34.0, 40.0, 33.0, 35.0, 49.0, 34.0, 38.0, 34.0, 38.0, 40.0, 49.0, 28.0, 34.0, 36.0, 33.0, 31.0, 25.0, 22.0, 25.0, 16.0, 19.0, 14.0, 17.0, 12.0, 8.0, 12.0, 11.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 4.0], "bins": [-5.984375, -5.81744384765625, -5.6505126953125, -5.48358154296875, -5.316650390625, -5.14971923828125, -4.9827880859375, -4.81585693359375, -4.64892578125, -4.48199462890625, -4.3150634765625, -4.14813232421875, -3.981201171875, -3.81427001953125, -3.6473388671875, -3.48040771484375, -3.3134765625, -3.14654541015625, -2.9796142578125, -2.81268310546875, -2.645751953125, -2.47882080078125, -2.3118896484375, -2.14495849609375, -1.97802734375, -1.81109619140625, -1.6441650390625, -1.47723388671875, -1.310302734375, -1.14337158203125, -0.9764404296875, -0.80950927734375, -0.642578125, -0.47564697265625, -0.3087158203125, -0.14178466796875, 0.025146484375, 0.19207763671875, 0.3590087890625, 0.52593994140625, 0.69287109375, 0.85980224609375, 1.0267333984375, 1.19366455078125, 1.360595703125, 1.52752685546875, 1.6944580078125, 1.86138916015625, 2.0283203125, 2.19525146484375, 2.3621826171875, 2.52911376953125, 2.696044921875, 2.86297607421875, 3.0299072265625, 3.19683837890625, 3.36376953125, 3.53070068359375, 3.6976318359375, 3.86456298828125, 4.031494140625, 4.19842529296875, 4.3653564453125, 4.53228759765625, 4.69921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 3.0, 6.0, 7.0, 5.0, 11.0, 12.0, 16.0, 20.0, 36.0, 44.0, 67.0, 84.0, 133.0, 161.0, 282.0, 357.0, 564.0, 905.0, 1610.0, 2709.0, 5262.0, 10458.0, 23640.0, 62052.0, 267276.0, 544440.0, 75331.0, 27423.0, 12024.0, 5916.0, 3044.0, 1710.0, 1013.0, 611.0, 413.0, 270.0, 184.0, 124.0, 90.0, 63.0, 45.0, 30.0, 24.0, 19.0, 13.0, 11.0, 11.0, 5.0, 10.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-13.09375, -12.7095947265625, -12.325439453125, -11.9412841796875, -11.55712890625, -11.1729736328125, -10.788818359375, -10.4046630859375, -10.0205078125, -9.6363525390625, -9.252197265625, -8.8680419921875, -8.48388671875, -8.0997314453125, -7.715576171875, -7.3314208984375, -6.947265625, -6.5631103515625, -6.178955078125, -5.7947998046875, -5.41064453125, -5.0264892578125, -4.642333984375, -4.2581787109375, -3.8740234375, -3.4898681640625, -3.105712890625, -2.7215576171875, -2.33740234375, -1.9532470703125, -1.569091796875, -1.1849365234375, -0.80078125, -0.4166259765625, -0.032470703125, 0.3516845703125, 0.73583984375, 1.1199951171875, 1.504150390625, 1.8883056640625, 2.2724609375, 2.6566162109375, 3.040771484375, 3.4249267578125, 3.80908203125, 4.1932373046875, 4.577392578125, 4.9615478515625, 5.345703125, 5.7298583984375, 6.114013671875, 6.4981689453125, 6.88232421875, 7.2664794921875, 7.650634765625, 8.0347900390625, 8.4189453125, 8.8031005859375, 9.187255859375, 9.5714111328125, 9.95556640625, 10.3397216796875, 10.723876953125, 11.1080322265625, 11.4921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 6.0, 11.0, 14.0, 20.0, 24.0, 23.0, 29.0, 47.0, 60.0, 61.0, 83.0, 126.0, 121.0, 86.0, 56.0, 36.0, 28.0, 24.0, 21.0, 28.0, 18.0, 9.0, 11.0, 8.0, 2.0, 13.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00049591064453125, -0.00048126280307769775, -0.0004666149616241455, -0.00045196712017059326, -0.000437319278717041, -0.00042267143726348877, -0.0004080235958099365, -0.0003933757543563843, -0.00037872791290283203, -0.0003640800714492798, -0.00034943222999572754, -0.0003347843885421753, -0.00032013654708862305, -0.0003054887056350708, -0.00029084086418151855, -0.0002761930227279663, -0.00026154518127441406, -0.0002468973398208618, -0.00023224949836730957, -0.00021760165691375732, -0.00020295381546020508, -0.00018830597400665283, -0.00017365813255310059, -0.00015901029109954834, -0.0001443624496459961, -0.00012971460819244385, -0.0001150667667388916, -0.00010041892528533936, -8.577108383178711e-05, -7.112324237823486e-05, -5.647540092468262e-05, -4.182755947113037e-05, -2.7179718017578125e-05, -1.2531876564025879e-05, 2.115964889526367e-06, 1.6763806343078613e-05, 3.141164779663086e-05, 4.6059489250183105e-05, 6.070733070373535e-05, 7.53551721572876e-05, 9.000301361083984e-05, 0.00010465085506439209, 0.00011929869651794434, 0.00013394653797149658, 0.00014859437942504883, 0.00016324222087860107, 0.00017789006233215332, 0.00019253790378570557, 0.0002071857452392578, 0.00022183358669281006, 0.0002364814281463623, 0.00025112926959991455, 0.0002657771110534668, 0.00028042495250701904, 0.0002950727939605713, 0.00030972063541412354, 0.0003243684768676758, 0.00033901631832122803, 0.0003536641597747803, 0.0003683120012283325, 0.00038295984268188477, 0.000397607684135437, 0.00041225552558898926, 0.0004269033670425415, 0.00044155120849609375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 11.0, 20.0, 20.0, 24.0, 45.0, 56.0, 80.0, 91.0, 127.0, 166.0, 262.0, 421.0, 594.0, 871.0, 1498.0, 2581.0, 5065.0, 11680.0, 33982.0, 152509.0, 691309.0, 101453.0, 25800.0, 9533.0, 4184.0, 2247.0, 1262.0, 835.0, 557.0, 388.0, 254.0, 164.0, 132.0, 76.0, 59.0, 40.0, 38.0, 32.0, 25.0, 14.0, 9.0, 4.0, 1.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.84375, -11.47802734375, -11.1123046875, -10.74658203125, -10.380859375, -10.01513671875, -9.6494140625, -9.28369140625, -8.91796875, -8.55224609375, -8.1865234375, -7.82080078125, -7.455078125, -7.08935546875, -6.7236328125, -6.35791015625, -5.9921875, -5.62646484375, -5.2607421875, -4.89501953125, -4.529296875, -4.16357421875, -3.7978515625, -3.43212890625, -3.06640625, -2.70068359375, -2.3349609375, -1.96923828125, -1.603515625, -1.23779296875, -0.8720703125, -0.50634765625, -0.140625, 0.22509765625, 0.5908203125, 0.95654296875, 1.322265625, 1.68798828125, 2.0537109375, 2.41943359375, 2.78515625, 3.15087890625, 3.5166015625, 3.88232421875, 4.248046875, 4.61376953125, 4.9794921875, 5.34521484375, 5.7109375, 6.07666015625, 6.4423828125, 6.80810546875, 7.173828125, 7.53955078125, 7.9052734375, 8.27099609375, 8.63671875, 9.00244140625, 9.3681640625, 9.73388671875, 10.099609375, 10.46533203125, 10.8310546875, 11.19677734375, 11.5625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 14.0, 17.0, 36.0, 31.0, 50.0, 44.0, 68.0, 110.0, 274.0, 71.0, 63.0, 49.0, 36.0, 31.0, 26.0, 14.0, 15.0, 3.0, 4.0, 1.0, 7.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.44049072265625, -2.3692626953125, -2.29803466796875, -2.226806640625, -2.15557861328125, -2.0843505859375, -2.01312255859375, -1.94189453125, -1.87066650390625, -1.7994384765625, -1.72821044921875, -1.656982421875, -1.58575439453125, -1.5145263671875, -1.44329833984375, -1.3720703125, -1.30084228515625, -1.2296142578125, -1.15838623046875, -1.087158203125, -1.01593017578125, -0.9447021484375, -0.87347412109375, -0.80224609375, -0.73101806640625, -0.6597900390625, -0.58856201171875, -0.517333984375, -0.44610595703125, -0.3748779296875, -0.30364990234375, -0.232421875, -0.16119384765625, -0.0899658203125, -0.01873779296875, 0.052490234375, 0.12371826171875, 0.1949462890625, 0.26617431640625, 0.33740234375, 0.40863037109375, 0.4798583984375, 0.55108642578125, 0.622314453125, 0.69354248046875, 0.7647705078125, 0.83599853515625, 0.9072265625, 0.97845458984375, 1.0496826171875, 1.12091064453125, 1.192138671875, 1.26336669921875, 1.3345947265625, 1.40582275390625, 1.47705078125, 1.54827880859375, 1.6195068359375, 1.69073486328125, 1.761962890625, 1.83319091796875, 1.9044189453125, 1.97564697265625, 2.046875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 2.0, 6.0, 8.0, 12.0, 23.0, 39.0, 65.0, 110.0, 200.0, 196.0, 120.0, 78.0, 37.0, 31.0, 23.0, 9.0, 5.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.816688537597656, -24.06675148010254, -23.316814422607422, -22.566877365112305, -21.816940307617188, -21.06700325012207, -20.317066192626953, -19.567127227783203, -18.81719207763672, -18.0672550201416, -17.317317962646484, -16.567380905151367, -15.81744384765625, -15.067506790161133, -14.3175687789917, -13.567631721496582, -12.817693710327148, -12.067756652832031, -11.317819595336914, -10.567882537841797, -9.81794548034668, -9.068008422851562, -8.318070411682129, -7.568133354187012, -6.8181962966918945, -6.068259239196777, -5.31832218170166, -4.568384647369385, -3.8184475898742676, -3.0685105323791504, -2.318572998046875, -1.5686359405517578, -0.8186969757080078, -0.06875979900360107, 0.6811773777008057, 1.431114673614502, 2.181051731109619, 2.9309887886047363, 3.6809263229370117, 4.430863380432129, 5.180800437927246, 5.930737495422363, 6.6806745529174805, 7.430612087249756, 8.180549621582031, 8.930486679077148, 9.680423736572266, 10.430360794067383, 11.1802978515625, 11.930234909057617, 12.680171966552734, 13.430109024047852, 14.180046081542969, 14.929983139038086, 15.67992115020752, 16.429859161376953, 17.179794311523438, 17.929731369018555, 18.679668426513672, 19.42960548400879, 20.179542541503906, 20.929479598999023, 21.67941665649414, 22.42935562133789, 23.179292678833008]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 7.0, 11.0, 15.0, 10.0, 15.0, 9.0, 19.0, 16.0, 27.0, 34.0, 36.0, 42.0, 39.0, 39.0, 41.0, 44.0, 43.0, 40.0, 41.0, 45.0, 56.0, 43.0, 40.0, 36.0, 34.0, 31.0, 22.0, 21.0, 21.0, 23.0, 19.0, 14.0, 9.0, 11.0, 10.0, 6.0, 3.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.164570808410645, -8.865348815917969, -8.566126823425293, -8.266904830932617, -7.967682838439941, -7.668460845947266, -7.369239330291748, -7.070017337799072, -6.7707953453063965, -6.471573352813721, -6.172351360321045, -5.873129367828369, -5.573907852172852, -5.274685859680176, -4.9754638671875, -4.676241874694824, -4.377019882202148, -4.077797889709473, -3.778575897216797, -3.4793541431427, -3.1801321506500244, -2.8809101581573486, -2.581688404083252, -2.282466411590576, -1.9832444190979004, -1.6840224266052246, -1.3848005533218384, -1.0855786800384521, -0.7863566875457764, -0.4871346950531006, -0.18791282176971436, 0.11130905151367188, 0.41053009033203125, 0.7097520232200623, 1.0089739561080933, 1.3081958293914795, 1.6074178218841553, 1.906639814376831, 2.2058615684509277, 2.5050835609436035, 2.8043055534362793, 3.103527545928955, 3.402749538421631, 3.7019712924957275, 4.001193046569824, 4.3004150390625, 4.599637031555176, 4.898859024047852, 5.198081016540527, 5.497303009033203, 5.796525001525879, 6.095746994018555, 6.3949689865112305, 6.694190979003906, 6.993412494659424, 7.2926344871521, 7.591856479644775, 7.891078472137451, 8.190299987792969, 8.489521980285645, 8.78874397277832, 9.087965965270996, 9.387187957763672, 9.686409950256348, 9.985631942749023]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 15.0, 24.0, 36.0, 59.0, 95.0, 123.0, 230.0, 328.0, 489.0, 756.0, 1113.0, 1719.0, 2665.0, 3909.0, 6234.0, 9989.0, 16227.0, 28798.0, 53212.0, 109456.0, 291117.0, 1312036.0, 1715292.0, 369835.0, 127603.0, 60237.0, 32100.0, 18615.0, 11280.0, 7063.0, 4612.0, 2920.0, 2008.0, 1341.0, 857.0, 591.0, 397.0, 265.0, 197.0, 129.0, 88.0, 59.0, 46.0, 32.0, 18.0, 20.0, 19.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-13.3203125, -12.862548828125, -12.40478515625, -11.947021484375, -11.4892578125, -11.031494140625, -10.57373046875, -10.115966796875, -9.658203125, -9.200439453125, -8.74267578125, -8.284912109375, -7.8271484375, -7.369384765625, -6.91162109375, -6.453857421875, -5.99609375, -5.538330078125, -5.08056640625, -4.622802734375, -4.1650390625, -3.707275390625, -3.24951171875, -2.791748046875, -2.333984375, -1.876220703125, -1.41845703125, -0.960693359375, -0.5029296875, -0.045166015625, 0.41259765625, 0.870361328125, 1.328125, 1.785888671875, 2.24365234375, 2.701416015625, 3.1591796875, 3.616943359375, 4.07470703125, 4.532470703125, 4.990234375, 5.447998046875, 5.90576171875, 6.363525390625, 6.8212890625, 7.279052734375, 7.73681640625, 8.194580078125, 8.65234375, 9.110107421875, 9.56787109375, 10.025634765625, 10.4833984375, 10.941162109375, 11.39892578125, 11.856689453125, 12.314453125, 12.772216796875, 13.22998046875, 13.687744140625, 14.1455078125, 14.603271484375, 15.06103515625, 15.518798828125, 15.9765625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 8.0, 4.0, 7.0, 11.0, 9.0, 23.0, 21.0, 12.0, 20.0, 27.0, 37.0, 39.0, 48.0, 43.0, 35.0, 39.0, 51.0, 54.0, 52.0, 52.0, 48.0, 40.0, 38.0, 42.0, 37.0, 23.0, 37.0, 21.0, 23.0, 18.0, 15.0, 16.0, 12.0, 13.0, 8.0, 4.0, 6.0, 1.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.58282470703125, -5.3843994140625, -5.18597412109375, -4.987548828125, -4.78912353515625, -4.5906982421875, -4.39227294921875, -4.19384765625, -3.99542236328125, -3.7969970703125, -3.59857177734375, -3.400146484375, -3.20172119140625, -3.0032958984375, -2.80487060546875, -2.6064453125, -2.40802001953125, -2.2095947265625, -2.01116943359375, -1.812744140625, -1.61431884765625, -1.4158935546875, -1.21746826171875, -1.01904296875, -0.82061767578125, -0.6221923828125, -0.42376708984375, -0.225341796875, -0.02691650390625, 0.1715087890625, 0.36993408203125, 0.568359375, 0.76678466796875, 0.9652099609375, 1.16363525390625, 1.362060546875, 1.56048583984375, 1.7589111328125, 1.95733642578125, 2.15576171875, 2.35418701171875, 2.5526123046875, 2.75103759765625, 2.949462890625, 3.14788818359375, 3.3463134765625, 3.54473876953125, 3.7431640625, 3.94158935546875, 4.1400146484375, 4.33843994140625, 4.536865234375, 4.73529052734375, 4.9337158203125, 5.13214111328125, 5.33056640625, 5.52899169921875, 5.7274169921875, 5.92584228515625, 6.124267578125, 6.32269287109375, 6.5211181640625, 6.71954345703125, 6.91796875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 11.0, 13.0, 18.0, 19.0, 31.0, 41.0, 72.0, 129.0, 163.0, 225.0, 332.0, 528.0, 906.0, 1376.0, 2276.0, 3842.0, 6604.0, 11988.0, 23540.0, 48818.0, 113676.0, 324946.0, 1356956.0, 1673821.0, 384524.0, 128510.0, 54166.0, 25503.0, 13225.0, 7187.0, 4214.0, 2501.0, 1489.0, 947.0, 543.0, 369.0, 274.0, 180.0, 124.0, 67.0, 37.0, 26.0, 20.0, 18.0, 11.0, 10.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.84375, -14.380859375, -13.91796875, -13.455078125, -12.9921875, -12.529296875, -12.06640625, -11.603515625, -11.140625, -10.677734375, -10.21484375, -9.751953125, -9.2890625, -8.826171875, -8.36328125, -7.900390625, -7.4375, -6.974609375, -6.51171875, -6.048828125, -5.5859375, -5.123046875, -4.66015625, -4.197265625, -3.734375, -3.271484375, -2.80859375, -2.345703125, -1.8828125, -1.419921875, -0.95703125, -0.494140625, -0.03125, 0.431640625, 0.89453125, 1.357421875, 1.8203125, 2.283203125, 2.74609375, 3.208984375, 3.671875, 4.134765625, 4.59765625, 5.060546875, 5.5234375, 5.986328125, 6.44921875, 6.912109375, 7.375, 7.837890625, 8.30078125, 8.763671875, 9.2265625, 9.689453125, 10.15234375, 10.615234375, 11.078125, 11.541015625, 12.00390625, 12.466796875, 12.9296875, 13.392578125, 13.85546875, 14.318359375, 14.78125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 16.0, 19.0, 24.0, 18.0, 37.0, 45.0, 46.0, 82.0, 92.0, 111.0, 148.0, 192.0, 210.0, 298.0, 372.0, 363.0, 413.0, 303.0, 280.0, 213.0, 161.0, 137.0, 93.0, 76.0, 72.0, 37.0, 25.0, 38.0, 27.0, 23.0, 16.0, 14.0, 15.0, 5.0, 7.0, 10.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.4664306640625, -3.354736328125, -3.2430419921875, -3.13134765625, -3.0196533203125, -2.907958984375, -2.7962646484375, -2.6845703125, -2.5728759765625, -2.461181640625, -2.3494873046875, -2.23779296875, -2.1260986328125, -2.014404296875, -1.9027099609375, -1.791015625, -1.6793212890625, -1.567626953125, -1.4559326171875, -1.34423828125, -1.2325439453125, -1.120849609375, -1.0091552734375, -0.8974609375, -0.7857666015625, -0.674072265625, -0.5623779296875, -0.45068359375, -0.3389892578125, -0.227294921875, -0.1156005859375, -0.00390625, 0.1077880859375, 0.219482421875, 0.3311767578125, 0.44287109375, 0.5545654296875, 0.666259765625, 0.7779541015625, 0.8896484375, 1.0013427734375, 1.113037109375, 1.2247314453125, 1.33642578125, 1.4481201171875, 1.559814453125, 1.6715087890625, 1.783203125, 1.8948974609375, 2.006591796875, 2.1182861328125, 2.22998046875, 2.3416748046875, 2.453369140625, 2.5650634765625, 2.6767578125, 2.7884521484375, 2.900146484375, 3.0118408203125, 3.12353515625, 3.2352294921875, 3.346923828125, 3.4586181640625, 3.5703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 3.0, 11.0, 13.0, 20.0, 25.0, 32.0, 62.0, 97.0, 136.0, 150.0, 135.0, 96.0, 66.0, 42.0, 25.0, 17.0, 15.0, 15.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.132898330688477, -13.702184677124023, -13.27147102355957, -12.8407564163208, -12.410042762756348, -11.979329109191895, -11.548614501953125, -11.117900848388672, -10.687187194824219, -10.256473541259766, -9.825759887695312, -9.395045280456543, -8.96433162689209, -8.533617973327637, -8.102903366088867, -7.672189712524414, -7.241476058959961, -6.810762405395508, -6.3800482749938965, -5.949334144592285, -5.518620491027832, -5.087906837463379, -4.657192707061768, -4.226478576660156, -3.795764923095703, -3.365051031112671, -2.9343371391296387, -2.5036232471466064, -2.072909355163574, -1.642195463180542, -1.2114815711975098, -0.7807676792144775, -0.3500537872314453, 0.08066010475158691, 0.5113739967346191, 0.9420878887176514, 1.3728017807006836, 1.8035156726837158, 2.234229564666748, 2.6649434566497803, 3.0956573486328125, 3.5263712406158447, 3.957085132598877, 4.387799263000488, 4.818512916564941, 5.2492265701293945, 5.679940700531006, 6.110654830932617, 6.54136848449707, 6.972082138061523, 7.402796268463135, 7.833510398864746, 8.2642240524292, 8.694937705993652, 9.125652313232422, 9.556365966796875, 9.987079620361328, 10.417793273925781, 10.848506927490234, 11.279221534729004, 11.709935188293457, 12.14064884185791, 12.57136344909668, 13.002077102661133, 13.432790756225586]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 8.0, 8.0, 9.0, 14.0, 12.0, 15.0, 12.0, 13.0, 13.0, 20.0, 16.0, 23.0, 22.0, 29.0, 39.0, 46.0, 27.0, 52.0, 47.0, 36.0, 46.0, 43.0, 51.0, 41.0, 30.0, 34.0, 42.0, 21.0, 34.0, 34.0, 20.0, 17.0, 22.0, 18.0, 12.0, 10.0, 16.0, 10.0, 8.0, 8.0, 4.0, 7.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.900868892669678, -5.703700542449951, -5.506531715393066, -5.30936336517334, -5.112194538116455, -4.9150261878967285, -4.717857360839844, -4.520689010620117, -4.323520660400391, -4.126352310180664, -3.9291834831237793, -3.7320151329040527, -3.534846305847168, -3.3376779556274414, -3.1405093669891357, -2.94334077835083, -2.7461719512939453, -2.5490033626556396, -2.351834774017334, -2.1546664237976074, -1.9574977159500122, -1.7603291273117065, -1.5631606578826904, -1.3659920692443848, -1.168823480606079, -0.9716548919677734, -0.7744863629341125, -0.5773178339004517, -0.380149245262146, -0.18298065662384033, 0.014187812805175781, 0.21135640144348145, 0.4085249900817871, 0.6056935787200928, 0.8028621077537537, 1.0000306367874146, 1.1971992254257202, 1.3943678140640259, 1.591536283493042, 1.7887048721313477, 1.9858734607696533, 2.183042049407959, 2.3802106380462646, 2.5773792266845703, 2.774547576904297, 2.9717164039611816, 3.168884754180908, 3.366053342819214, 3.5632219314575195, 3.760390520095825, 3.957559108734131, 4.154727458953857, 4.351896286010742, 4.549064636230469, 4.746232986450195, 4.94340181350708, 5.140570640563965, 5.337738990783691, 5.534907817840576, 5.732076168060303, 5.9292449951171875, 6.126413345336914, 6.323581695556641, 6.520750522613525, 6.717918872833252]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 14.0, 11.0, 29.0, 44.0, 65.0, 92.0, 129.0, 204.0, 297.0, 405.0, 593.0, 818.0, 1342.0, 1981.0, 3053.0, 4790.0, 7628.0, 12484.0, 21430.0, 39478.0, 81009.0, 194514.0, 353944.0, 166775.0, 71035.0, 35508.0, 19737.0, 11310.0, 6829.0, 4456.0, 2876.0, 1892.0, 1216.0, 825.0, 511.0, 368.0, 224.0, 197.0, 130.0, 88.0, 64.0, 43.0, 26.0, 26.0, 19.0, 13.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0], "bins": [-5.48046875, -5.31646728515625, -5.1524658203125, -4.98846435546875, -4.824462890625, -4.66046142578125, -4.4964599609375, -4.33245849609375, -4.16845703125, -4.00445556640625, -3.8404541015625, -3.67645263671875, -3.512451171875, -3.34844970703125, -3.1844482421875, -3.02044677734375, -2.8564453125, -2.69244384765625, -2.5284423828125, -2.36444091796875, -2.200439453125, -2.03643798828125, -1.8724365234375, -1.70843505859375, -1.54443359375, -1.38043212890625, -1.2164306640625, -1.05242919921875, -0.888427734375, -0.72442626953125, -0.5604248046875, -0.39642333984375, -0.232421875, -0.06842041015625, 0.0955810546875, 0.25958251953125, 0.423583984375, 0.58758544921875, 0.7515869140625, 0.91558837890625, 1.07958984375, 1.24359130859375, 1.4075927734375, 1.57159423828125, 1.735595703125, 1.89959716796875, 2.0635986328125, 2.22760009765625, 2.3916015625, 2.55560302734375, 2.7196044921875, 2.88360595703125, 3.047607421875, 3.21160888671875, 3.3756103515625, 3.53961181640625, 3.70361328125, 3.86761474609375, 4.0316162109375, 4.19561767578125, 4.359619140625, 4.52362060546875, 4.6876220703125, 4.85162353515625, 5.015625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 9.0, 8.0, 11.0, 11.0, 15.0, 14.0, 12.0, 16.0, 25.0, 20.0, 22.0, 26.0, 34.0, 33.0, 45.0, 37.0, 46.0, 48.0, 42.0, 32.0, 52.0, 45.0, 36.0, 28.0, 42.0, 38.0, 33.0, 23.0, 26.0, 22.0, 21.0, 17.0, 14.0, 9.0, 14.0, 17.0, 11.0, 3.0, 9.0, 4.0, 6.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.896240234375, -4.70263671875, -4.509033203125, -4.3154296875, -4.121826171875, -3.92822265625, -3.734619140625, -3.541015625, -3.347412109375, -3.15380859375, -2.960205078125, -2.7666015625, -2.572998046875, -2.37939453125, -2.185791015625, -1.9921875, -1.798583984375, -1.60498046875, -1.411376953125, -1.2177734375, -1.024169921875, -0.83056640625, -0.636962890625, -0.443359375, -0.249755859375, -0.05615234375, 0.137451171875, 0.3310546875, 0.524658203125, 0.71826171875, 0.911865234375, 1.10546875, 1.299072265625, 1.49267578125, 1.686279296875, 1.8798828125, 2.073486328125, 2.26708984375, 2.460693359375, 2.654296875, 2.847900390625, 3.04150390625, 3.235107421875, 3.4287109375, 3.622314453125, 3.81591796875, 4.009521484375, 4.203125, 4.396728515625, 4.59033203125, 4.783935546875, 4.9775390625, 5.171142578125, 5.36474609375, 5.558349609375, 5.751953125, 5.945556640625, 6.13916015625, 6.332763671875, 6.5263671875, 6.719970703125, 6.91357421875, 7.107177734375, 7.30078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 16.0, 17.0, 15.0, 22.0, 38.0, 47.0, 50.0, 91.0, 101.0, 152.0, 230.0, 301.0, 411.0, 635.0, 817.0, 1256.0, 1846.0, 2912.0, 4615.0, 8057.0, 15869.0, 41069.0, 167023.0, 611851.0, 123300.0, 34227.0, 14110.0, 7128.0, 4025.0, 2590.0, 1710.0, 1167.0, 768.0, 561.0, 418.0, 294.0, 222.0, 157.0, 129.0, 88.0, 55.0, 44.0, 30.0, 27.0, 20.0, 17.0, 5.0, 5.0, 1.0, 1.0, 6.0, 2.0, 2.0, 1.0], "bins": [-7.72265625, -7.49151611328125, -7.2603759765625, -7.02923583984375, -6.798095703125, -6.56695556640625, -6.3358154296875, -6.10467529296875, -5.87353515625, -5.64239501953125, -5.4112548828125, -5.18011474609375, -4.948974609375, -4.71783447265625, -4.4866943359375, -4.25555419921875, -4.0244140625, -3.79327392578125, -3.5621337890625, -3.33099365234375, -3.099853515625, -2.86871337890625, -2.6375732421875, -2.40643310546875, -2.17529296875, -1.94415283203125, -1.7130126953125, -1.48187255859375, -1.250732421875, -1.01959228515625, -0.7884521484375, -0.55731201171875, -0.326171875, -0.09503173828125, 0.1361083984375, 0.36724853515625, 0.598388671875, 0.82952880859375, 1.0606689453125, 1.29180908203125, 1.52294921875, 1.75408935546875, 1.9852294921875, 2.21636962890625, 2.447509765625, 2.67864990234375, 2.9097900390625, 3.14093017578125, 3.3720703125, 3.60321044921875, 3.8343505859375, 4.06549072265625, 4.296630859375, 4.52777099609375, 4.7589111328125, 4.99005126953125, 5.22119140625, 5.45233154296875, 5.6834716796875, 5.91461181640625, 6.145751953125, 6.37689208984375, 6.6080322265625, 6.83917236328125, 7.0703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 7.0, 5.0, 10.0, 6.0, 9.0, 12.0, 10.0, 14.0, 22.0, 11.0, 24.0, 21.0, 22.0, 29.0, 26.0, 38.0, 40.0, 36.0, 35.0, 36.0, 30.0, 31.0, 42.0, 35.0, 39.0, 36.0, 35.0, 31.0, 30.0, 33.0, 32.0, 23.0, 23.0, 25.0, 18.0, 16.0, 14.0, 14.0, 14.0, 11.0, 6.0, 8.0, 6.0, 8.0, 1.0, 10.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.693359375, -3.579315185546875, -3.46527099609375, -3.351226806640625, -3.2371826171875, -3.123138427734375, -3.00909423828125, -2.895050048828125, -2.781005859375, -2.666961669921875, -2.55291748046875, -2.438873291015625, -2.3248291015625, -2.210784912109375, -2.09674072265625, -1.982696533203125, -1.86865234375, -1.754608154296875, -1.64056396484375, -1.526519775390625, -1.4124755859375, -1.298431396484375, -1.18438720703125, -1.070343017578125, -0.956298828125, -0.842254638671875, -0.72821044921875, -0.614166259765625, -0.5001220703125, -0.386077880859375, -0.27203369140625, -0.157989501953125, -0.0439453125, 0.070098876953125, 0.18414306640625, 0.298187255859375, 0.4122314453125, 0.526275634765625, 0.64031982421875, 0.754364013671875, 0.868408203125, 0.982452392578125, 1.09649658203125, 1.210540771484375, 1.3245849609375, 1.438629150390625, 1.55267333984375, 1.666717529296875, 1.78076171875, 1.894805908203125, 2.00885009765625, 2.122894287109375, 2.2369384765625, 2.350982666015625, 2.46502685546875, 2.579071044921875, 2.693115234375, 2.807159423828125, 2.92120361328125, 3.035247802734375, 3.1492919921875, 3.263336181640625, 3.37738037109375, 3.491424560546875, 3.60546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [7.0, 1.0, 1.0, 3.0, 9.0, 7.0, 14.0, 7.0, 15.0, 10.0, 22.0, 25.0, 43.0, 63.0, 83.0, 75.0, 128.0, 191.0, 217.0, 302.0, 406.0, 567.0, 804.0, 1245.0, 1799.0, 2749.0, 4661.0, 8062.0, 16674.0, 44859.0, 282785.0, 576614.0, 61375.0, 20446.0, 9495.0, 5182.0, 3054.0, 1925.0, 1289.0, 870.0, 649.0, 498.0, 329.0, 263.0, 179.0, 130.0, 109.0, 79.0, 85.0, 30.0, 36.0, 32.0, 27.0, 5.0, 11.0, 9.0, 6.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.71435546875, -0.6913986206054688, -0.6684417724609375, -0.6454849243164062, -0.622528076171875, -0.5995712280273438, -0.5766143798828125, -0.5536575317382812, -0.53070068359375, -0.5077438354492188, -0.4847869873046875, -0.46183013916015625, -0.438873291015625, -0.41591644287109375, -0.3929595947265625, -0.37000274658203125, -0.3470458984375, -0.32408905029296875, -0.3011322021484375, -0.27817535400390625, -0.255218505859375, -0.23226165771484375, -0.2093048095703125, -0.18634796142578125, -0.16339111328125, -0.14043426513671875, -0.1174774169921875, -0.09452056884765625, -0.071563720703125, -0.04860687255859375, -0.0256500244140625, -0.00269317626953125, 0.020263671875, 0.04322052001953125, 0.0661773681640625, 0.08913421630859375, 0.112091064453125, 0.13504791259765625, 0.1580047607421875, 0.18096160888671875, 0.20391845703125, 0.22687530517578125, 0.2498321533203125, 0.27278900146484375, 0.295745849609375, 0.31870269775390625, 0.3416595458984375, 0.36461639404296875, 0.3875732421875, 0.41053009033203125, 0.4334869384765625, 0.45644378662109375, 0.479400634765625, 0.5023574829101562, 0.5253143310546875, 0.5482711791992188, 0.57122802734375, 0.5941848754882812, 0.6171417236328125, 0.6400985717773438, 0.663055419921875, 0.6860122680664062, 0.7089691162109375, 0.7319259643554688, 0.7548828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 3.0, 3.0, 16.0, 10.0, 12.0, 13.0, 19.0, 23.0, 28.0, 32.0, 41.0, 42.0, 89.0, 73.0, 102.0, 101.0, 86.0, 63.0, 49.0, 29.0, 35.0, 20.0, 25.0, 15.0, 16.0, 10.0, 4.0, 6.0, 2.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.649162292480469e-05, -4.508160054683685e-05, -4.367157816886902e-05, -4.2261555790901184e-05, -4.085153341293335e-05, -3.9441511034965515e-05, -3.803148865699768e-05, -3.6621466279029846e-05, -3.521144390106201e-05, -3.380142152309418e-05, -3.239139914512634e-05, -3.098137676715851e-05, -2.9571354389190674e-05, -2.816133201122284e-05, -2.6751309633255005e-05, -2.534128725528717e-05, -2.3931264877319336e-05, -2.25212424993515e-05, -2.1111220121383667e-05, -1.9701197743415833e-05, -1.8291175365447998e-05, -1.6881152987480164e-05, -1.547113060951233e-05, -1.4061108231544495e-05, -1.265108585357666e-05, -1.1241063475608826e-05, -9.831041097640991e-06, -8.421018719673157e-06, -7.010996341705322e-06, -5.600973963737488e-06, -4.190951585769653e-06, -2.780929207801819e-06, -1.3709068298339844e-06, 3.91155481338501e-08, 1.4491379261016846e-06, 2.859160304069519e-06, 4.2691826820373535e-06, 5.679205060005188e-06, 7.0892274379730225e-06, 8.499249815940857e-06, 9.909272193908691e-06, 1.1319294571876526e-05, 1.272931694984436e-05, 1.4139339327812195e-05, 1.554936170578003e-05, 1.6959384083747864e-05, 1.8369406461715698e-05, 1.9779428839683533e-05, 2.1189451217651367e-05, 2.25994735956192e-05, 2.4009495973587036e-05, 2.541951835155487e-05, 2.6829540729522705e-05, 2.823956310749054e-05, 2.9649585485458374e-05, 3.105960786342621e-05, 3.246963024139404e-05, 3.387965261936188e-05, 3.528967499732971e-05, 3.6699697375297546e-05, 3.810971975326538e-05, 3.9519742131233215e-05, 4.092976450920105e-05, 4.2339786887168884e-05, 4.374980926513672e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 7.0, 5.0, 13.0, 12.0, 14.0, 38.0, 29.0, 40.0, 75.0, 107.0, 134.0, 196.0, 307.0, 512.0, 735.0, 1228.0, 2107.0, 3567.0, 7112.0, 15590.0, 41167.0, 161007.0, 598566.0, 146928.0, 38381.0, 14853.0, 6878.0, 3588.0, 1950.0, 1188.0, 749.0, 500.0, 306.0, 198.0, 124.0, 96.0, 77.0, 44.0, 36.0, 28.0, 18.0, 9.0, 10.0, 8.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84375, -0.8169403076171875, -0.790130615234375, -0.7633209228515625, -0.73651123046875, -0.7097015380859375, -0.682891845703125, -0.6560821533203125, -0.6292724609375, -0.6024627685546875, -0.575653076171875, -0.5488433837890625, -0.52203369140625, -0.4952239990234375, -0.468414306640625, -0.4416046142578125, -0.414794921875, -0.3879852294921875, -0.361175537109375, -0.3343658447265625, -0.30755615234375, -0.2807464599609375, -0.253936767578125, -0.2271270751953125, -0.2003173828125, -0.1735076904296875, -0.146697998046875, -0.1198883056640625, -0.09307861328125, -0.0662689208984375, -0.039459228515625, -0.0126495361328125, 0.01416015625, 0.0409698486328125, 0.067779541015625, 0.0945892333984375, 0.12139892578125, 0.1482086181640625, 0.175018310546875, 0.2018280029296875, 0.2286376953125, 0.2554473876953125, 0.282257080078125, 0.3090667724609375, 0.33587646484375, 0.3626861572265625, 0.389495849609375, 0.4163055419921875, 0.443115234375, 0.4699249267578125, 0.496734619140625, 0.5235443115234375, 0.55035400390625, 0.5771636962890625, 0.603973388671875, 0.6307830810546875, 0.6575927734375, 0.6844024658203125, 0.711212158203125, 0.7380218505859375, 0.76483154296875, 0.7916412353515625, 0.818450927734375, 0.8452606201171875, 0.8720703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 10.0, 14.0, 28.0, 39.0, 41.0, 64.0, 81.0, 139.0, 135.0, 121.0, 99.0, 64.0, 45.0, 28.0, 25.0, 13.0, 8.0, 5.0, 5.0, 1.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2159423828125, -0.20925521850585938, -0.20256805419921875, -0.19588088989257812, -0.1891937255859375, -0.18250656127929688, -0.17581939697265625, -0.16913223266601562, -0.162445068359375, -0.15575790405273438, -0.14907073974609375, -0.14238357543945312, -0.1356964111328125, -0.12900924682617188, -0.12232208251953125, -0.11563491821289062, -0.10894775390625, -0.10226058959960938, -0.09557342529296875, -0.08888626098632812, -0.0821990966796875, -0.07551193237304688, -0.06882476806640625, -0.062137603759765625, -0.055450439453125, -0.048763275146484375, -0.04207611083984375, -0.035388946533203125, -0.0287017822265625, -0.022014617919921875, -0.01532745361328125, -0.008640289306640625, -0.001953125, 0.004734039306640625, 0.01142120361328125, 0.018108367919921875, 0.0247955322265625, 0.031482696533203125, 0.03816986083984375, 0.044857025146484375, 0.051544189453125, 0.058231353759765625, 0.06491851806640625, 0.07160568237304688, 0.0782928466796875, 0.08498001098632812, 0.09166717529296875, 0.09835433959960938, 0.10504150390625, 0.11172866821289062, 0.11841583251953125, 0.12510299682617188, 0.1317901611328125, 0.13847732543945312, 0.14516448974609375, 0.15185165405273438, 0.158538818359375, 0.16522598266601562, 0.17191314697265625, 0.17860031127929688, 0.1852874755859375, 0.19197463989257812, 0.19866180419921875, 0.20534896850585938, 0.2120361328125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 12.0, 17.0, 21.0, 21.0, 58.0, 72.0, 125.0, 149.0, 145.0, 118.0, 66.0, 47.0, 41.0, 20.0, 17.0, 14.0, 13.0, 3.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.395456314086914, -12.978555679321289, -12.56165599822998, -12.144755363464355, -11.727855682373047, -11.310955047607422, -10.894054412841797, -10.477154731750488, -10.06025505065918, -9.643354415893555, -9.226454734802246, -8.809554100036621, -8.392654418945312, -7.9757537841796875, -7.558853626251221, -7.141953468322754, -6.725052833557129, -6.308152675628662, -5.891252517700195, -5.47435188293457, -5.057452201843262, -4.640551567077637, -4.22365140914917, -3.806751251220703, -3.3898510932922363, -2.9729509353637695, -2.5560507774353027, -2.139150381088257, -1.72225022315979, -1.3053500652313232, -0.8884496688842773, -0.47154951095581055, -0.054648399353027344, 0.36225181818008423, 0.7791520357131958, 1.1960523128509521, 1.612952470779419, 2.0298526287078857, 2.4467530250549316, 2.8636531829833984, 3.2805533409118652, 3.697453498840332, 4.114353656768799, 4.531253814697266, 4.948154449462891, 5.365054130554199, 5.781954765319824, 6.198854923248291, 6.615755081176758, 7.032655239105225, 7.449555397033691, 7.866456031799316, 8.283355712890625, 8.70025634765625, 9.117156982421875, 9.534056663513184, 9.950956344604492, 10.367856979370117, 10.784756660461426, 11.20165729522705, 11.61855697631836, 12.035457611083984, 12.45235824584961, 12.869257926940918, 13.286158561706543]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 8.0, 9.0, 10.0, 12.0, 12.0, 16.0, 14.0, 11.0, 12.0, 21.0, 17.0, 23.0, 24.0, 28.0, 43.0, 43.0, 34.0, 41.0, 49.0, 42.0, 43.0, 47.0, 49.0, 40.0, 26.0, 44.0, 32.0, 29.0, 30.0, 33.0, 19.0, 18.0, 22.0, 16.0, 11.0, 12.0, 15.0, 11.0, 6.0, 7.0, 7.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.689723014831543, -5.49818754196167, -5.306651592254639, -5.115116119384766, -4.923580646514893, -4.7320451736450195, -4.540509223937988, -4.348973751068115, -4.157438278198242, -3.96590256690979, -3.774367094039917, -3.582831382751465, -3.391295909881592, -3.1997601985931396, -3.0082244873046875, -2.8166890144348145, -2.625153064727783, -2.433617353439331, -2.242081880569458, -2.050546169281006, -1.8590105772018433, -1.6674749851226807, -1.4759392738342285, -1.284403681755066, -1.0928680896759033, -0.9013324975967407, -0.7097968459129333, -0.518261194229126, -0.3267256021499634, -0.13519001007080078, 0.05634570121765137, 0.24788129329681396, 0.43941736221313477, 0.6309529542922974, 0.8224886059761047, 1.014024257659912, 1.2055598497390747, 1.3970954418182373, 1.5886311531066895, 1.780166745185852, 1.9717023372650146, 2.163238048553467, 2.35477352142334, 2.546309232711792, 2.737844944000244, 2.929380416870117, 3.1209161281585693, 3.3124518394470215, 3.5039873123168945, 3.6955230236053467, 3.8870584964752197, 4.078594207763672, 4.270129680633545, 4.461665153503418, 4.653201103210449, 4.844736576080322, 5.036272048950195, 5.227807521820068, 5.4193434715271, 5.610878944396973, 5.802414417266846, 5.993949890136719, 6.18548583984375, 6.377021312713623, 6.568557262420654]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 9.0, 12.0, 20.0, 28.0, 33.0, 49.0, 71.0, 92.0, 135.0, 213.0, 298.0, 394.0, 632.0, 932.0, 1259.0, 2016.0, 3233.0, 5167.0, 8430.0, 13917.0, 24070.0, 42085.0, 75946.0, 143736.0, 255341.0, 213851.0, 112162.0, 60422.0, 33923.0, 19227.0, 11379.0, 7002.0, 4310.0, 2706.0, 1701.0, 1172.0, 806.0, 564.0, 365.0, 242.0, 193.0, 131.0, 73.0, 56.0, 45.0, 33.0, 35.0, 15.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8046875, -9.46435546875, -9.1240234375, -8.78369140625, -8.443359375, -8.10302734375, -7.7626953125, -7.42236328125, -7.08203125, -6.74169921875, -6.4013671875, -6.06103515625, -5.720703125, -5.38037109375, -5.0400390625, -4.69970703125, -4.359375, -4.01904296875, -3.6787109375, -3.33837890625, -2.998046875, -2.65771484375, -2.3173828125, -1.97705078125, -1.63671875, -1.29638671875, -0.9560546875, -0.61572265625, -0.275390625, 0.06494140625, 0.4052734375, 0.74560546875, 1.0859375, 1.42626953125, 1.7666015625, 2.10693359375, 2.447265625, 2.78759765625, 3.1279296875, 3.46826171875, 3.80859375, 4.14892578125, 4.4892578125, 4.82958984375, 5.169921875, 5.51025390625, 5.8505859375, 6.19091796875, 6.53125, 6.87158203125, 7.2119140625, 7.55224609375, 7.892578125, 8.23291015625, 8.5732421875, 8.91357421875, 9.25390625, 9.59423828125, 9.9345703125, 10.27490234375, 10.615234375, 10.95556640625, 11.2958984375, 11.63623046875, 11.9765625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 8.0, 7.0, 9.0, 8.0, 17.0, 9.0, 17.0, 13.0, 15.0, 19.0, 17.0, 19.0, 22.0, 35.0, 39.0, 34.0, 42.0, 46.0, 46.0, 49.0, 39.0, 36.0, 54.0, 43.0, 41.0, 46.0, 38.0, 27.0, 25.0, 25.0, 25.0, 24.0, 21.0, 11.0, 15.0, 16.0, 7.0, 9.0, 14.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.57171630859375, -4.4012451171875, -4.23077392578125, -4.060302734375, -3.88983154296875, -3.7193603515625, -3.54888916015625, -3.37841796875, -3.20794677734375, -3.0374755859375, -2.86700439453125, -2.696533203125, -2.52606201171875, -2.3555908203125, -2.18511962890625, -2.0146484375, -1.84417724609375, -1.6737060546875, -1.50323486328125, -1.332763671875, -1.16229248046875, -0.9918212890625, -0.82135009765625, -0.65087890625, -0.48040771484375, -0.3099365234375, -0.13946533203125, 0.031005859375, 0.20147705078125, 0.3719482421875, 0.54241943359375, 0.712890625, 0.88336181640625, 1.0538330078125, 1.22430419921875, 1.394775390625, 1.56524658203125, 1.7357177734375, 1.90618896484375, 2.07666015625, 2.24713134765625, 2.4176025390625, 2.58807373046875, 2.758544921875, 2.92901611328125, 3.0994873046875, 3.26995849609375, 3.4404296875, 3.61090087890625, 3.7813720703125, 3.95184326171875, 4.122314453125, 4.29278564453125, 4.4632568359375, 4.63372802734375, 4.80419921875, 4.97467041015625, 5.1451416015625, 5.31561279296875, 5.486083984375, 5.65655517578125, 5.8270263671875, 5.99749755859375, 6.16796875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 9.0, 7.0, 9.0, 16.0, 27.0, 39.0, 59.0, 111.0, 143.0, 199.0, 317.0, 545.0, 829.0, 1428.0, 2432.0, 4454.0, 8191.0, 15394.0, 30532.0, 63515.0, 137460.0, 277221.0, 261268.0, 126015.0, 58374.0, 28140.0, 14222.0, 7605.0, 4147.0, 2276.0, 1331.0, 788.0, 521.0, 306.0, 216.0, 152.0, 92.0, 59.0, 32.0, 29.0, 14.0, 11.0, 6.0, 8.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3203125, -10.9422607421875, -10.564208984375, -10.1861572265625, -9.80810546875, -9.4300537109375, -9.052001953125, -8.6739501953125, -8.2958984375, -7.9178466796875, -7.539794921875, -7.1617431640625, -6.78369140625, -6.4056396484375, -6.027587890625, -5.6495361328125, -5.271484375, -4.8934326171875, -4.515380859375, -4.1373291015625, -3.75927734375, -3.3812255859375, -3.003173828125, -2.6251220703125, -2.2470703125, -1.8690185546875, -1.490966796875, -1.1129150390625, -0.73486328125, -0.3568115234375, 0.021240234375, 0.3992919921875, 0.77734375, 1.1553955078125, 1.533447265625, 1.9114990234375, 2.28955078125, 2.6676025390625, 3.045654296875, 3.4237060546875, 3.8017578125, 4.1798095703125, 4.557861328125, 4.9359130859375, 5.31396484375, 5.6920166015625, 6.070068359375, 6.4481201171875, 6.826171875, 7.2042236328125, 7.582275390625, 7.9603271484375, 8.33837890625, 8.7164306640625, 9.094482421875, 9.4725341796875, 9.8505859375, 10.2286376953125, 10.606689453125, 10.9847412109375, 11.36279296875, 11.7408447265625, 12.118896484375, 12.4969482421875, 12.875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 5.0, 12.0, 10.0, 8.0, 10.0, 14.0, 20.0, 18.0, 25.0, 22.0, 23.0, 27.0, 23.0, 27.0, 41.0, 41.0, 30.0, 38.0, 28.0, 35.0, 29.0, 38.0, 38.0, 28.0, 39.0, 50.0, 35.0, 29.0, 36.0, 20.0, 28.0, 28.0, 16.0, 14.0, 17.0, 16.0, 16.0, 6.0, 7.0, 10.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.888763427734375, -2.79315185546875, -2.697540283203125, -2.6019287109375, -2.506317138671875, -2.41070556640625, -2.315093994140625, -2.219482421875, -2.123870849609375, -2.02825927734375, -1.932647705078125, -1.8370361328125, -1.741424560546875, -1.64581298828125, -1.550201416015625, -1.45458984375, -1.358978271484375, -1.26336669921875, -1.167755126953125, -1.0721435546875, -0.976531982421875, -0.88092041015625, -0.785308837890625, -0.689697265625, -0.594085693359375, -0.49847412109375, -0.402862548828125, -0.3072509765625, -0.211639404296875, -0.11602783203125, -0.020416259765625, 0.0751953125, 0.170806884765625, 0.26641845703125, 0.362030029296875, 0.4576416015625, 0.553253173828125, 0.64886474609375, 0.744476318359375, 0.840087890625, 0.935699462890625, 1.03131103515625, 1.126922607421875, 1.2225341796875, 1.318145751953125, 1.41375732421875, 1.509368896484375, 1.60498046875, 1.700592041015625, 1.79620361328125, 1.891815185546875, 1.9874267578125, 2.083038330078125, 2.17864990234375, 2.274261474609375, 2.369873046875, 2.465484619140625, 2.56109619140625, 2.656707763671875, 2.7523193359375, 2.847930908203125, 2.94354248046875, 3.039154052734375, 3.134765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 6.0, 18.0, 18.0, 28.0, 36.0, 40.0, 64.0, 100.0, 129.0, 203.0, 268.0, 369.0, 559.0, 819.0, 1334.0, 2085.0, 3578.0, 6553.0, 12899.0, 29385.0, 83777.0, 702565.0, 128903.0, 39196.0, 16400.0, 7912.0, 4299.0, 2434.0, 1536.0, 979.0, 635.0, 396.0, 300.0, 202.0, 148.0, 97.0, 75.0, 56.0, 38.0, 32.0, 18.0, 17.0, 8.0, 9.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.62890625, -7.37164306640625, -7.1143798828125, -6.85711669921875, -6.599853515625, -6.34259033203125, -6.0853271484375, -5.82806396484375, -5.57080078125, -5.31353759765625, -5.0562744140625, -4.79901123046875, -4.541748046875, -4.28448486328125, -4.0272216796875, -3.76995849609375, -3.5126953125, -3.25543212890625, -2.9981689453125, -2.74090576171875, -2.483642578125, -2.22637939453125, -1.9691162109375, -1.71185302734375, -1.45458984375, -1.19732666015625, -0.9400634765625, -0.68280029296875, -0.425537109375, -0.16827392578125, 0.0889892578125, 0.34625244140625, 0.603515625, 0.86077880859375, 1.1180419921875, 1.37530517578125, 1.632568359375, 1.88983154296875, 2.1470947265625, 2.40435791015625, 2.66162109375, 2.91888427734375, 3.1761474609375, 3.43341064453125, 3.690673828125, 3.94793701171875, 4.2052001953125, 4.46246337890625, 4.7197265625, 4.97698974609375, 5.2342529296875, 5.49151611328125, 5.748779296875, 6.00604248046875, 6.2633056640625, 6.52056884765625, 6.77783203125, 7.03509521484375, 7.2923583984375, 7.54962158203125, 7.806884765625, 8.06414794921875, 8.3214111328125, 8.57867431640625, 8.8359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 4.0, 3.0, 6.0, 6.0, 5.0, 11.0, 7.0, 15.0, 16.0, 23.0, 22.0, 43.0, 42.0, 65.0, 106.0, 140.0, 143.0, 96.0, 41.0, 27.0, 26.0, 22.0, 22.0, 21.0, 17.0, 12.0, 9.0, 5.0, 4.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00020599365234375, -0.00019931793212890625, -0.0001926422119140625, -0.00018596649169921875, -0.000179290771484375, -0.00017261505126953125, -0.0001659393310546875, -0.00015926361083984375, -0.000152587890625, -0.00014591217041015625, -0.0001392364501953125, -0.00013256072998046875, -0.000125885009765625, -0.00011920928955078125, -0.0001125335693359375, -0.00010585784912109375, -9.918212890625e-05, -9.250640869140625e-05, -8.58306884765625e-05, -7.915496826171875e-05, -7.2479248046875e-05, -6.580352783203125e-05, -5.91278076171875e-05, -5.245208740234375e-05, -4.57763671875e-05, -3.910064697265625e-05, -3.24249267578125e-05, -2.574920654296875e-05, -1.9073486328125e-05, -1.239776611328125e-05, -5.7220458984375e-06, 9.5367431640625e-07, 7.62939453125e-06, 1.430511474609375e-05, 2.09808349609375e-05, 2.765655517578125e-05, 3.4332275390625e-05, 4.100799560546875e-05, 4.76837158203125e-05, 5.435943603515625e-05, 6.103515625e-05, 6.771087646484375e-05, 7.43865966796875e-05, 8.106231689453125e-05, 8.7738037109375e-05, 9.441375732421875e-05, 0.0001010894775390625, 0.00010776519775390625, 0.00011444091796875, 0.00012111663818359375, 0.0001277923583984375, 0.00013446807861328125, 0.000141143798828125, 0.00014781951904296875, 0.0001544952392578125, 0.00016117095947265625, 0.0001678466796875, 0.00017452239990234375, 0.0001811981201171875, 0.00018787384033203125, 0.000194549560546875, 0.00020122528076171875, 0.0002079010009765625, 0.00021457672119140625, 0.00022125244140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 10.0, 3.0, 9.0, 12.0, 22.0, 29.0, 39.0, 64.0, 119.0, 187.0, 312.0, 557.0, 999.0, 2076.0, 4506.0, 10952.0, 34397.0, 253884.0, 677185.0, 41015.0, 12383.0, 4871.0, 2222.0, 1216.0, 605.0, 324.0, 223.0, 117.0, 69.0, 56.0, 26.0, 21.0, 10.0, 11.0, 5.0, 3.0, 5.0, 2.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1875, -11.8297119140625, -11.471923828125, -11.1141357421875, -10.75634765625, -10.3985595703125, -10.040771484375, -9.6829833984375, -9.3251953125, -8.9674072265625, -8.609619140625, -8.2518310546875, -7.89404296875, -7.5362548828125, -7.178466796875, -6.8206787109375, -6.462890625, -6.1051025390625, -5.747314453125, -5.3895263671875, -5.03173828125, -4.6739501953125, -4.316162109375, -3.9583740234375, -3.6005859375, -3.2427978515625, -2.885009765625, -2.5272216796875, -2.16943359375, -1.8116455078125, -1.453857421875, -1.0960693359375, -0.73828125, -0.3804931640625, -0.022705078125, 0.3350830078125, 0.69287109375, 1.0506591796875, 1.408447265625, 1.7662353515625, 2.1240234375, 2.4818115234375, 2.839599609375, 3.1973876953125, 3.55517578125, 3.9129638671875, 4.270751953125, 4.6285400390625, 4.986328125, 5.3441162109375, 5.701904296875, 6.0596923828125, 6.41748046875, 6.7752685546875, 7.133056640625, 7.4908447265625, 7.8486328125, 8.2064208984375, 8.564208984375, 8.9219970703125, 9.27978515625, 9.6375732421875, 9.995361328125, 10.3531494140625, 10.7109375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 8.0, 2.0, 0.0, 7.0, 13.0, 12.0, 15.0, 31.0, 30.0, 38.0, 54.0, 104.0, 414.0, 62.0, 61.0, 39.0, 27.0, 22.0, 8.0, 17.0, 7.0, 9.0, 3.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.581390380859375, -1.51043701171875, -1.439483642578125, -1.3685302734375, -1.297576904296875, -1.22662353515625, -1.155670166015625, -1.084716796875, -1.013763427734375, -0.94281005859375, -0.871856689453125, -0.8009033203125, -0.729949951171875, -0.65899658203125, -0.588043212890625, -0.51708984375, -0.446136474609375, -0.37518310546875, -0.304229736328125, -0.2332763671875, -0.162322998046875, -0.09136962890625, -0.020416259765625, 0.050537109375, 0.121490478515625, 0.19244384765625, 0.263397216796875, 0.3343505859375, 0.405303955078125, 0.47625732421875, 0.547210693359375, 0.6181640625, 0.689117431640625, 0.76007080078125, 0.831024169921875, 0.9019775390625, 0.972930908203125, 1.04388427734375, 1.114837646484375, 1.185791015625, 1.256744384765625, 1.32769775390625, 1.398651123046875, 1.4696044921875, 1.540557861328125, 1.61151123046875, 1.682464599609375, 1.75341796875, 1.824371337890625, 1.89532470703125, 1.966278076171875, 2.0372314453125, 2.108184814453125, 2.17913818359375, 2.250091552734375, 2.321044921875, 2.391998291015625, 2.46295166015625, 2.533905029296875, 2.6048583984375, 2.675811767578125, 2.74676513671875, 2.817718505859375, 2.888671875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 3.0, 14.0, 8.0, 21.0, 28.0, 41.0, 70.0, 85.0, 119.0, 135.0, 119.0, 76.0, 59.0, 59.0, 34.0, 23.0, 17.0, 18.0, 7.0, 12.0, 5.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.509291648864746, -9.19890022277832, -8.888507843017578, -8.578115463256836, -8.26772403717041, -7.957332134246826, -7.646940231323242, -7.336548328399658, -7.026156425476074, -6.71576452255249, -6.405372619628906, -6.094980716705322, -5.784588813781738, -5.474196910858154, -5.16380500793457, -4.853413105010986, -4.543021202087402, -4.232629299163818, -3.9222373962402344, -3.6118454933166504, -3.3014535903930664, -2.9910616874694824, -2.6806697845458984, -2.3702778816223145, -2.0598859786987305, -1.7494940757751465, -1.4391021728515625, -1.1287102699279785, -0.8183183670043945, -0.5079264640808105, -0.19753456115722656, 0.11285734176635742, 0.423248291015625, 0.733640193939209, 1.044032096862793, 1.354423999786377, 1.664815902709961, 1.975207805633545, 2.285599708557129, 2.595991611480713, 2.906383514404297, 3.216775417327881, 3.527167320251465, 3.837559223175049, 4.147951126098633, 4.458343029022217, 4.768734931945801, 5.079126834869385, 5.389518737792969, 5.699910640716553, 6.010302543640137, 6.320694446563721, 6.631086349487305, 6.941478252410889, 7.251870155334473, 7.562262058258057, 7.872653961181641, 8.183046340942383, 8.493437767028809, 8.803829193115234, 9.114221572875977, 9.424613952636719, 9.735005378723145, 10.04539680480957, 10.355789184570312]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 10.0, 16.0, 13.0, 15.0, 23.0, 20.0, 31.0, 34.0, 33.0, 36.0, 36.0, 40.0, 48.0, 37.0, 39.0, 46.0, 43.0, 36.0, 42.0, 38.0, 38.0, 38.0, 35.0, 31.0, 36.0, 18.0, 18.0, 20.0, 13.0, 16.0, 11.0, 15.0, 12.0, 6.0, 6.0, 1.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.574677467346191, -5.398855209350586, -5.223033428192139, -5.047211170196533, -4.871389389038086, -4.6955671310424805, -4.519744873046875, -4.343923091888428, -4.1681013107299805, -3.992279291152954, -3.8164572715759277, -3.6406350135803223, -3.464813232421875, -3.2889909744262695, -3.113168954849243, -2.937346935272217, -2.7615246772766113, -2.585702657699585, -2.4098806381225586, -2.234058380126953, -2.058236598968506, -1.88241446018219, -1.706592321395874, -1.5307703018188477, -1.3549482822418213, -1.179126262664795, -1.0033042430877686, -0.8274821043014526, -0.6516600847244263, -0.4758380651473999, -0.300015926361084, -0.12419390678405762, 0.05162763595581055, 0.2274496853351593, 0.40327173471450806, 0.5790938138961792, 0.7549158334732056, 0.9307378530502319, 1.1065599918365479, 1.2823820114135742, 1.4582040309906006, 1.634026050567627, 1.8098480701446533, 1.9856702089309692, 2.161492347717285, 2.3373141288757324, 2.513136386871338, 2.6889584064483643, 2.8647804260253906, 3.040602445602417, 3.2164244651794434, 3.392246723175049, 3.568068504333496, 3.7438907623291016, 3.919712781906128, 4.095534801483154, 4.271356582641602, 4.447178840637207, 4.623000621795654, 4.79882287979126, 4.974644660949707, 5.1504669189453125, 5.326289176940918, 5.502110958099365, 5.677933216094971]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 16.0, 25.0, 34.0, 76.0, 109.0, 177.0, 200.0, 336.0, 428.0, 672.0, 1027.0, 1421.0, 2274.0, 3369.0, 5183.0, 8363.0, 13554.0, 23031.0, 40560.0, 77157.0, 168363.0, 532755.0, 1903913.0, 951203.0, 238137.0, 99249.0, 50509.0, 27582.0, 16097.0, 9871.0, 6218.0, 3952.0, 2698.0, 1796.0, 1159.0, 848.0, 570.0, 382.0, 280.0, 211.0, 141.0, 100.0, 58.0, 44.0, 43.0, 22.0, 24.0, 7.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.80078125, -7.53802490234375, -7.2752685546875, -7.01251220703125, -6.749755859375, -6.48699951171875, -6.2242431640625, -5.96148681640625, -5.69873046875, -5.43597412109375, -5.1732177734375, -4.91046142578125, -4.647705078125, -4.38494873046875, -4.1221923828125, -3.85943603515625, -3.5966796875, -3.33392333984375, -3.0711669921875, -2.80841064453125, -2.545654296875, -2.28289794921875, -2.0201416015625, -1.75738525390625, -1.49462890625, -1.23187255859375, -0.9691162109375, -0.70635986328125, -0.443603515625, -0.18084716796875, 0.0819091796875, 0.34466552734375, 0.607421875, 0.87017822265625, 1.1329345703125, 1.39569091796875, 1.658447265625, 1.92120361328125, 2.1839599609375, 2.44671630859375, 2.70947265625, 2.97222900390625, 3.2349853515625, 3.49774169921875, 3.760498046875, 4.02325439453125, 4.2860107421875, 4.54876708984375, 4.8115234375, 5.07427978515625, 5.3370361328125, 5.59979248046875, 5.862548828125, 6.12530517578125, 6.3880615234375, 6.65081787109375, 6.91357421875, 7.17633056640625, 7.4390869140625, 7.70184326171875, 7.964599609375, 8.22735595703125, 8.4901123046875, 8.75286865234375, 9.015625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 2.0, 2.0, 5.0, 6.0, 11.0, 11.0, 9.0, 9.0, 17.0, 9.0, 20.0, 16.0, 19.0, 31.0, 33.0, 22.0, 42.0, 42.0, 29.0, 47.0, 35.0, 34.0, 32.0, 36.0, 32.0, 41.0, 35.0, 49.0, 38.0, 36.0, 26.0, 30.0, 17.0, 38.0, 22.0, 15.0, 18.0, 17.0, 8.0, 18.0, 9.0, 10.0, 3.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.08984375, -2.98809814453125, -2.8863525390625, -2.78460693359375, -2.682861328125, -2.58111572265625, -2.4793701171875, -2.37762451171875, -2.27587890625, -2.17413330078125, -2.0723876953125, -1.97064208984375, -1.868896484375, -1.76715087890625, -1.6654052734375, -1.56365966796875, -1.4619140625, -1.36016845703125, -1.2584228515625, -1.15667724609375, -1.054931640625, -0.95318603515625, -0.8514404296875, -0.74969482421875, -0.64794921875, -0.54620361328125, -0.4444580078125, -0.34271240234375, -0.240966796875, -0.13922119140625, -0.0374755859375, 0.06427001953125, 0.166015625, 0.26776123046875, 0.3695068359375, 0.47125244140625, 0.572998046875, 0.67474365234375, 0.7764892578125, 0.87823486328125, 0.97998046875, 1.08172607421875, 1.1834716796875, 1.28521728515625, 1.386962890625, 1.48870849609375, 1.5904541015625, 1.69219970703125, 1.7939453125, 1.89569091796875, 1.9974365234375, 2.09918212890625, 2.200927734375, 2.30267333984375, 2.4044189453125, 2.50616455078125, 2.60791015625, 2.70965576171875, 2.8114013671875, 2.91314697265625, 3.014892578125, 3.11663818359375, 3.2183837890625, 3.32012939453125, 3.421875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 10.0, 23.0, 28.0, 39.0, 55.0, 104.0, 163.0, 265.0, 385.0, 709.0, 1224.0, 2165.0, 3829.0, 7228.0, 14262.0, 29875.0, 66650.0, 170353.0, 568512.0, 2094760.0, 848377.0, 227682.0, 84308.0, 36774.0, 17297.0, 8691.0, 4563.0, 2474.0, 1396.0, 828.0, 481.0, 261.0, 182.0, 113.0, 62.0, 50.0, 40.0, 24.0, 12.0, 7.0, 2.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.5421142578125, -9.240478515625, -8.9388427734375, -8.63720703125, -8.3355712890625, -8.033935546875, -7.7322998046875, -7.4306640625, -7.1290283203125, -6.827392578125, -6.5257568359375, -6.22412109375, -5.9224853515625, -5.620849609375, -5.3192138671875, -5.017578125, -4.7159423828125, -4.414306640625, -4.1126708984375, -3.81103515625, -3.5093994140625, -3.207763671875, -2.9061279296875, -2.6044921875, -2.3028564453125, -2.001220703125, -1.6995849609375, -1.39794921875, -1.0963134765625, -0.794677734375, -0.4930419921875, -0.19140625, 0.1102294921875, 0.411865234375, 0.7135009765625, 1.01513671875, 1.3167724609375, 1.618408203125, 1.9200439453125, 2.2216796875, 2.5233154296875, 2.824951171875, 3.1265869140625, 3.42822265625, 3.7298583984375, 4.031494140625, 4.3331298828125, 4.634765625, 4.9364013671875, 5.238037109375, 5.5396728515625, 5.84130859375, 6.1429443359375, 6.444580078125, 6.7462158203125, 7.0478515625, 7.3494873046875, 7.651123046875, 7.9527587890625, 8.25439453125, 8.5560302734375, 8.857666015625, 9.1593017578125, 9.4609375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 8.0, 14.0, 11.0, 14.0, 11.0, 23.0, 19.0, 17.0, 35.0, 52.0, 53.0, 69.0, 82.0, 101.0, 130.0, 169.0, 173.0, 239.0, 297.0, 348.0, 371.0, 309.0, 279.0, 285.0, 218.0, 161.0, 105.0, 103.0, 73.0, 67.0, 52.0, 29.0, 40.0, 24.0, 27.0, 10.0, 10.0, 20.0, 13.0, 4.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7553253173828125, -1.689361572265625, -1.6233978271484375, -1.55743408203125, -1.4914703369140625, -1.425506591796875, -1.3595428466796875, -1.2935791015625, -1.2276153564453125, -1.161651611328125, -1.0956878662109375, -1.02972412109375, -0.9637603759765625, -0.897796630859375, -0.8318328857421875, -0.765869140625, -0.6999053955078125, -0.633941650390625, -0.5679779052734375, -0.50201416015625, -0.4360504150390625, -0.370086669921875, -0.3041229248046875, -0.2381591796875, -0.1721954345703125, -0.106231689453125, -0.0402679443359375, 0.02569580078125, 0.0916595458984375, 0.157623291015625, 0.2235870361328125, 0.28955078125, 0.3555145263671875, 0.421478271484375, 0.4874420166015625, 0.55340576171875, 0.6193695068359375, 0.685333251953125, 0.7512969970703125, 0.8172607421875, 0.8832244873046875, 0.949188232421875, 1.0151519775390625, 1.08111572265625, 1.1470794677734375, 1.213043212890625, 1.2790069580078125, 1.344970703125, 1.4109344482421875, 1.476898193359375, 1.5428619384765625, 1.60882568359375, 1.6747894287109375, 1.740753173828125, 1.8067169189453125, 1.8726806640625, 1.9386444091796875, 2.004608154296875, 2.0705718994140625, 2.13653564453125, 2.2024993896484375, 2.268463134765625, 2.3344268798828125, 2.400390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 4.0, 12.0, 11.0, 15.0, 24.0, 28.0, 61.0, 81.0, 86.0, 125.0, 129.0, 92.0, 82.0, 51.0, 44.0, 20.0, 34.0, 28.0, 15.0, 7.0, 12.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.902103424072266, -7.678369998931885, -7.454636573791504, -7.230902671813965, -7.007169246673584, -6.783435821533203, -6.559702396392822, -6.335968971252441, -6.1122355461120605, -5.88850212097168, -5.664768695831299, -5.441035270690918, -5.217301368713379, -4.993567943572998, -4.769834518432617, -4.546101093292236, -4.3223676681518555, -4.098634243011475, -3.8749005794525146, -3.651167154312134, -3.427433729171753, -3.203700065612793, -2.979966640472412, -2.7562332153320312, -2.532499313354492, -2.3087658882141113, -2.0850322246551514, -1.8612987995147705, -1.6375653743743896, -1.4138318300247192, -1.1900982856750488, -0.966364860534668, -0.7426314353942871, -0.5188979506492615, -0.29516443610191345, -0.07143092155456543, 0.1523025631904602, 0.37603604793548584, 0.5997695922851562, 0.8235030174255371, 1.0472365617752075, 1.270970106124878, 1.4947035312652588, 1.7184370756149292, 1.9421706199645996, 2.1659040451049805, 2.3896374702453613, 2.613370895385742, 2.837104558944702, 3.060837984085083, 3.284571647644043, 3.508305072784424, 3.7320384979248047, 3.9557719230651855, 4.179505348205566, 4.4032392501831055, 4.626972675323486, 4.850706100463867, 5.074439525604248, 5.298172950744629, 5.521906852722168, 5.745640277862549, 5.96937370300293, 6.1931071281433105, 6.416840553283691]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 3.0, 6.0, 5.0, 8.0, 11.0, 13.0, 14.0, 19.0, 20.0, 32.0, 31.0, 39.0, 45.0, 39.0, 48.0, 36.0, 50.0, 51.0, 39.0, 44.0, 57.0, 48.0, 33.0, 38.0, 41.0, 41.0, 35.0, 24.0, 23.0, 14.0, 21.0, 15.0, 14.0, 8.0, 6.0, 11.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.606540203094482, -4.461686134338379, -4.316832542419434, -4.17197847366333, -4.027124404907227, -3.8822708129882812, -3.7374167442321777, -3.5925629138946533, -3.447709083557129, -3.3028552532196045, -3.15800142288208, -3.0131473541259766, -2.868293523788452, -2.7234396934509277, -2.578585624694824, -2.4337317943573, -2.2888779640197754, -2.144024133682251, -1.999170184135437, -1.854316234588623, -1.7094624042510986, -1.5646085739135742, -1.4197546243667603, -1.2749006748199463, -1.1300468444824219, -0.9851929545402527, -0.8403390645980835, -0.6954851746559143, -0.5506312847137451, -0.4057773947715759, -0.26092350482940674, -0.11606955528259277, 0.028784751892089844, 0.17363864183425903, 0.3184925317764282, 0.4633464217185974, 0.6082003116607666, 0.7530542016029358, 0.897908091545105, 1.042762041091919, 1.1876158714294434, 1.3324697017669678, 1.4773236513137817, 1.6221776008605957, 1.7670314311981201, 1.9118852615356445, 2.056739330291748, 2.2015931606292725, 2.346446990966797, 2.4913008213043213, 2.6361546516418457, 2.781008720397949, 2.9258625507354736, 3.070716381072998, 3.2155704498291016, 3.360424280166626, 3.5052781105041504, 3.650131940841675, 3.794985771179199, 3.9398398399353027, 4.084693908691406, 4.229547500610352, 4.374401569366455, 4.519255638122559, 4.664109230041504]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 12.0, 21.0, 29.0, 38.0, 46.0, 64.0, 91.0, 121.0, 176.0, 268.0, 353.0, 571.0, 754.0, 1106.0, 1664.0, 2516.0, 3597.0, 5852.0, 9080.0, 14845.0, 24953.0, 45135.0, 89633.0, 214765.0, 335465.0, 143629.0, 65457.0, 34685.0, 19806.0, 12089.0, 7339.0, 4666.0, 3119.0, 1984.0, 1382.0, 1013.0, 687.0, 415.0, 306.0, 235.0, 190.0, 133.0, 78.0, 46.0, 34.0, 28.0, 24.0, 20.0, 14.0, 9.0, 6.0, 2.0, 0.0, 1.0], "bins": [-3.2109375, -3.117279052734375, -3.02362060546875, -2.929962158203125, -2.8363037109375, -2.742645263671875, -2.64898681640625, -2.555328369140625, -2.461669921875, -2.368011474609375, -2.27435302734375, -2.180694580078125, -2.0870361328125, -1.993377685546875, -1.89971923828125, -1.806060791015625, -1.71240234375, -1.618743896484375, -1.52508544921875, -1.431427001953125, -1.3377685546875, -1.244110107421875, -1.15045166015625, -1.056793212890625, -0.963134765625, -0.869476318359375, -0.77581787109375, -0.682159423828125, -0.5885009765625, -0.494842529296875, -0.40118408203125, -0.307525634765625, -0.2138671875, -0.120208740234375, -0.02655029296875, 0.067108154296875, 0.1607666015625, 0.254425048828125, 0.34808349609375, 0.441741943359375, 0.535400390625, 0.629058837890625, 0.72271728515625, 0.816375732421875, 0.9100341796875, 1.003692626953125, 1.09735107421875, 1.191009521484375, 1.28466796875, 1.378326416015625, 1.47198486328125, 1.565643310546875, 1.6593017578125, 1.752960205078125, 1.84661865234375, 1.940277099609375, 2.033935546875, 2.127593994140625, 2.22125244140625, 2.314910888671875, 2.4085693359375, 2.502227783203125, 2.59588623046875, 2.689544677734375, 2.783203125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 4.0, 9.0, 8.0, 10.0, 16.0, 8.0, 17.0, 31.0, 32.0, 31.0, 23.0, 36.0, 37.0, 45.0, 39.0, 52.0, 57.0, 40.0, 43.0, 41.0, 42.0, 30.0, 39.0, 41.0, 38.0, 30.0, 32.0, 26.0, 25.0, 21.0, 15.0, 11.0, 10.0, 10.0, 8.0, 3.0, 12.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.43359375, -4.2991943359375, -4.164794921875, -4.0303955078125, -3.89599609375, -3.7615966796875, -3.627197265625, -3.4927978515625, -3.3583984375, -3.2239990234375, -3.089599609375, -2.9552001953125, -2.82080078125, -2.6864013671875, -2.552001953125, -2.4176025390625, -2.283203125, -2.1488037109375, -2.014404296875, -1.8800048828125, -1.74560546875, -1.6112060546875, -1.476806640625, -1.3424072265625, -1.2080078125, -1.0736083984375, -0.939208984375, -0.8048095703125, -0.67041015625, -0.5360107421875, -0.401611328125, -0.2672119140625, -0.1328125, 0.0015869140625, 0.135986328125, 0.2703857421875, 0.40478515625, 0.5391845703125, 0.673583984375, 0.8079833984375, 0.9423828125, 1.0767822265625, 1.211181640625, 1.3455810546875, 1.47998046875, 1.6143798828125, 1.748779296875, 1.8831787109375, 2.017578125, 2.1519775390625, 2.286376953125, 2.4207763671875, 2.55517578125, 2.6895751953125, 2.823974609375, 2.9583740234375, 3.0927734375, 3.2271728515625, 3.361572265625, 3.4959716796875, 3.63037109375, 3.7647705078125, 3.899169921875, 4.0335693359375, 4.16796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 12.0, 23.0, 20.0, 36.0, 37.0, 69.0, 72.0, 109.0, 145.0, 209.0, 249.0, 377.0, 520.0, 711.0, 1014.0, 1412.0, 2122.0, 2991.0, 4738.0, 7752.0, 14238.0, 31160.0, 101088.0, 570485.0, 212371.0, 49433.0, 19425.0, 9916.0, 5764.0, 3674.0, 2443.0, 1652.0, 1204.0, 839.0, 589.0, 458.0, 287.0, 241.0, 185.0, 141.0, 93.0, 58.0, 55.0, 25.0, 32.0, 21.0, 17.0, 7.0, 5.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0], "bins": [-4.51953125, -4.38140869140625, -4.2432861328125, -4.10516357421875, -3.967041015625, -3.82891845703125, -3.6907958984375, -3.55267333984375, -3.41455078125, -3.27642822265625, -3.1383056640625, -3.00018310546875, -2.862060546875, -2.72393798828125, -2.5858154296875, -2.44769287109375, -2.3095703125, -2.17144775390625, -2.0333251953125, -1.89520263671875, -1.757080078125, -1.61895751953125, -1.4808349609375, -1.34271240234375, -1.20458984375, -1.06646728515625, -0.9283447265625, -0.79022216796875, -0.652099609375, -0.51397705078125, -0.3758544921875, -0.23773193359375, -0.099609375, 0.03851318359375, 0.1766357421875, 0.31475830078125, 0.452880859375, 0.59100341796875, 0.7291259765625, 0.86724853515625, 1.00537109375, 1.14349365234375, 1.2816162109375, 1.41973876953125, 1.557861328125, 1.69598388671875, 1.8341064453125, 1.97222900390625, 2.1103515625, 2.24847412109375, 2.3865966796875, 2.52471923828125, 2.662841796875, 2.80096435546875, 2.9390869140625, 3.07720947265625, 3.21533203125, 3.35345458984375, 3.4915771484375, 3.62969970703125, 3.767822265625, 3.90594482421875, 4.0440673828125, 4.18218994140625, 4.3203125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 5.0, 8.0, 15.0, 5.0, 12.0, 9.0, 10.0, 22.0, 13.0, 16.0, 18.0, 24.0, 27.0, 34.0, 23.0, 44.0, 44.0, 32.0, 33.0, 27.0, 42.0, 36.0, 44.0, 33.0, 26.0, 43.0, 32.0, 34.0, 29.0, 27.0, 26.0, 26.0, 16.0, 19.0, 23.0, 17.0, 18.0, 12.0, 11.0, 5.0, 6.0, 11.0, 6.0, 9.0, 8.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.248046875, -2.178009033203125, -2.10797119140625, -2.037933349609375, -1.9678955078125, -1.897857666015625, -1.82781982421875, -1.757781982421875, -1.687744140625, -1.617706298828125, -1.54766845703125, -1.477630615234375, -1.4075927734375, -1.337554931640625, -1.26751708984375, -1.197479248046875, -1.12744140625, -1.057403564453125, -0.98736572265625, -0.917327880859375, -0.8472900390625, -0.777252197265625, -0.70721435546875, -0.637176513671875, -0.567138671875, -0.497100830078125, -0.42706298828125, -0.357025146484375, -0.2869873046875, -0.216949462890625, -0.14691162109375, -0.076873779296875, -0.0068359375, 0.063201904296875, 0.13323974609375, 0.203277587890625, 0.2733154296875, 0.343353271484375, 0.41339111328125, 0.483428955078125, 0.553466796875, 0.623504638671875, 0.69354248046875, 0.763580322265625, 0.8336181640625, 0.903656005859375, 0.97369384765625, 1.043731689453125, 1.11376953125, 1.183807373046875, 1.25384521484375, 1.323883056640625, 1.3939208984375, 1.463958740234375, 1.53399658203125, 1.604034423828125, 1.674072265625, 1.744110107421875, 1.81414794921875, 1.884185791015625, 1.9542236328125, 2.024261474609375, 2.09429931640625, 2.164337158203125, 2.234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 14.0, 4.0, 9.0, 16.0, 15.0, 33.0, 39.0, 47.0, 61.0, 65.0, 129.0, 149.0, 202.0, 298.0, 371.0, 569.0, 862.0, 1378.0, 2164.0, 4063.0, 7573.0, 17732.0, 62043.0, 732645.0, 164879.0, 29183.0, 10825.0, 5228.0, 2857.0, 1660.0, 1078.0, 712.0, 442.0, 308.0, 250.0, 187.0, 116.0, 99.0, 57.0, 67.0, 23.0, 28.0, 21.0, 20.0, 9.0, 12.0, 5.0, 2.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0], "bins": [-0.5810546875, -0.5638275146484375, -0.546600341796875, -0.5293731689453125, -0.51214599609375, -0.4949188232421875, -0.477691650390625, -0.4604644775390625, -0.4432373046875, -0.4260101318359375, -0.408782958984375, -0.3915557861328125, -0.37432861328125, -0.3571014404296875, -0.339874267578125, -0.3226470947265625, -0.305419921875, -0.2881927490234375, -0.270965576171875, -0.2537384033203125, -0.23651123046875, -0.2192840576171875, -0.202056884765625, -0.1848297119140625, -0.1676025390625, -0.1503753662109375, -0.133148193359375, -0.1159210205078125, -0.09869384765625, -0.0814666748046875, -0.064239501953125, -0.0470123291015625, -0.02978515625, -0.0125579833984375, 0.004669189453125, 0.0218963623046875, 0.03912353515625, 0.0563507080078125, 0.073577880859375, 0.0908050537109375, 0.1080322265625, 0.1252593994140625, 0.142486572265625, 0.1597137451171875, 0.17694091796875, 0.1941680908203125, 0.211395263671875, 0.2286224365234375, 0.245849609375, 0.2630767822265625, 0.280303955078125, 0.2975311279296875, 0.31475830078125, 0.3319854736328125, 0.349212646484375, 0.3664398193359375, 0.3836669921875, 0.4008941650390625, 0.418121337890625, 0.4353485107421875, 0.45257568359375, 0.4698028564453125, 0.487030029296875, 0.5042572021484375, 0.521484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 9.0, 11.0, 11.0, 16.0, 16.0, 32.0, 31.0, 36.0, 60.0, 77.0, 93.0, 75.0, 100.0, 91.0, 71.0, 47.0, 46.0, 33.0, 29.0, 15.0, 18.0, 16.0, 8.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.075599670410156e-05, -2.9988586902618408e-05, -2.9221177101135254e-05, -2.84537672996521e-05, -2.7686357498168945e-05, -2.691894769668579e-05, -2.6151537895202637e-05, -2.5384128093719482e-05, -2.4616718292236328e-05, -2.3849308490753174e-05, -2.308189868927002e-05, -2.2314488887786865e-05, -2.154707908630371e-05, -2.0779669284820557e-05, -2.0012259483337402e-05, -1.9244849681854248e-05, -1.8477439880371094e-05, -1.771003007888794e-05, -1.6942620277404785e-05, -1.617521047592163e-05, -1.5407800674438477e-05, -1.4640390872955322e-05, -1.3872981071472168e-05, -1.3105571269989014e-05, -1.233816146850586e-05, -1.1570751667022705e-05, -1.080334186553955e-05, -1.0035932064056396e-05, -9.268522262573242e-06, -8.501112461090088e-06, -7.733702659606934e-06, -6.966292858123779e-06, -6.198883056640625e-06, -5.431473255157471e-06, -4.664063453674316e-06, -3.896653652191162e-06, -3.129243850708008e-06, -2.3618340492248535e-06, -1.5944242477416992e-06, -8.270144462585449e-07, -5.960464477539063e-08, 7.078051567077637e-07, 1.475214958190918e-06, 2.2426247596740723e-06, 3.0100345611572266e-06, 3.777444362640381e-06, 4.544854164123535e-06, 5.3122639656066895e-06, 6.079673767089844e-06, 6.847083568572998e-06, 7.614493370056152e-06, 8.381903171539307e-06, 9.149312973022461e-06, 9.916722774505615e-06, 1.068413257598877e-05, 1.1451542377471924e-05, 1.2218952178955078e-05, 1.2986361980438232e-05, 1.3753771781921387e-05, 1.4521181583404541e-05, 1.5288591384887695e-05, 1.605600118637085e-05, 1.6823410987854004e-05, 1.7590820789337158e-05, 1.8358230590820312e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 8.0, 4.0, 8.0, 10.0, 20.0, 27.0, 30.0, 41.0, 74.0, 99.0, 121.0, 220.0, 336.0, 580.0, 883.0, 1459.0, 2421.0, 4342.0, 8168.0, 16315.0, 37262.0, 110316.0, 541823.0, 217340.0, 58495.0, 23371.0, 10985.0, 5760.0, 3171.0, 1899.0, 1088.0, 657.0, 401.0, 263.0, 192.0, 138.0, 76.0, 56.0, 32.0, 24.0, 16.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.5673828125, -0.5515022277832031, -0.5356216430664062, -0.5197410583496094, -0.5038604736328125, -0.4879798889160156, -0.47209930419921875, -0.4562187194824219, -0.440338134765625, -0.4244575500488281, -0.40857696533203125, -0.3926963806152344, -0.3768157958984375, -0.3609352111816406, -0.34505462646484375, -0.3291740417480469, -0.31329345703125, -0.2974128723144531, -0.28153228759765625, -0.2656517028808594, -0.2497711181640625, -0.23389053344726562, -0.21800994873046875, -0.20212936401367188, -0.186248779296875, -0.17036819458007812, -0.15448760986328125, -0.13860702514648438, -0.1227264404296875, -0.10684585571289062, -0.09096527099609375, -0.07508468627929688, -0.0592041015625, -0.043323516845703125, -0.02744293212890625, -0.011562347412109375, 0.0043182373046875, 0.020198822021484375, 0.03607940673828125, 0.051959991455078125, 0.067840576171875, 0.08372116088867188, 0.09960174560546875, 0.11548233032226562, 0.1313629150390625, 0.14724349975585938, 0.16312408447265625, 0.17900466918945312, 0.19488525390625, 0.21076583862304688, 0.22664642333984375, 0.24252700805664062, 0.2584075927734375, 0.2742881774902344, 0.29016876220703125, 0.3060493469238281, 0.321929931640625, 0.3378105163574219, 0.35369110107421875, 0.3695716857910156, 0.3854522705078125, 0.4013328552246094, 0.41721343994140625, 0.4330940246582031, 0.448974609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 5.0, 3.0, 9.0, 12.0, 11.0, 5.0, 13.0, 17.0, 24.0, 21.0, 32.0, 45.0, 54.0, 61.0, 74.0, 115.0, 93.0, 88.0, 55.0, 47.0, 44.0, 30.0, 27.0, 16.0, 14.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09173583984375, -0.08909988403320312, -0.08646392822265625, -0.08382797241210938, -0.0811920166015625, -0.07855606079101562, -0.07592010498046875, -0.07328414916992188, -0.070648193359375, -0.06801223754882812, -0.06537628173828125, -0.06274032592773438, -0.0601043701171875, -0.057468414306640625, -0.05483245849609375, -0.052196502685546875, -0.049560546875, -0.046924591064453125, -0.04428863525390625, -0.041652679443359375, -0.0390167236328125, -0.036380767822265625, -0.03374481201171875, -0.031108856201171875, -0.028472900390625, -0.025836944580078125, -0.02320098876953125, -0.020565032958984375, -0.0179290771484375, -0.015293121337890625, -0.01265716552734375, -0.010021209716796875, -0.00738525390625, -0.004749298095703125, -0.00211334228515625, 0.000522613525390625, 0.0031585693359375, 0.005794525146484375, 0.00843048095703125, 0.011066436767578125, 0.013702392578125, 0.016338348388671875, 0.01897430419921875, 0.021610260009765625, 0.0242462158203125, 0.026882171630859375, 0.02951812744140625, 0.032154083251953125, 0.0347900390625, 0.037425994873046875, 0.04006195068359375, 0.042697906494140625, 0.0453338623046875, 0.047969818115234375, 0.05060577392578125, 0.053241729736328125, 0.055877685546875, 0.058513641357421875, 0.06114959716796875, 0.06378555297851562, 0.0664215087890625, 0.06905746459960938, 0.07169342041015625, 0.07432937622070312, 0.07696533203125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 4.0, 8.0, 15.0, 14.0, 21.0, 27.0, 42.0, 79.0, 89.0, 102.0, 137.0, 105.0, 90.0, 57.0, 37.0, 29.0, 34.0, 23.0, 20.0, 15.0, 13.0, 5.0, 2.0, 5.0, 1.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5460124015808105, -7.327597618103027, -7.109182834625244, -6.890768051147461, -6.672353744506836, -6.453938961029053, -6.2355241775512695, -6.017109394073486, -5.798694610595703, -5.58027982711792, -5.361865043640137, -5.143450736999512, -4.9250359535217285, -4.706621170043945, -4.488206386566162, -4.269791603088379, -4.051377296447754, -3.8329625129699707, -3.6145479679107666, -3.3961331844329834, -3.1777184009552, -2.959303855895996, -2.740889072418213, -2.5224742889404297, -2.3040595054626465, -2.0856447219848633, -1.8672300577163696, -1.648815393447876, -1.4304006099700928, -1.2119859457015991, -0.9935712814331055, -0.7751564979553223, -0.5567417144775391, -0.33832699060440063, -0.1199122965335846, 0.09850239753723145, 0.3169171214103699, 0.5353318452835083, 0.753746509552002, 0.9721612930297852, 1.1905759572982788, 1.4089906215667725, 1.6274054050445557, 1.8458200693130493, 2.064234733581543, 2.282649517059326, 2.5010643005371094, 2.7194790840148926, 2.9378936290740967, 3.15630841255188, 3.374722957611084, 3.593137741088867, 3.8115525245666504, 4.029967308044434, 4.248381614685059, 4.466796875, 4.685211181640625, 4.903625965118408, 5.122040748596191, 5.340455055236816, 5.5588698387146, 5.777284622192383, 5.995699405670166, 6.214114189147949, 6.432528972625732]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 6.0, 7.0, 11.0, 14.0, 13.0, 21.0, 21.0, 37.0, 26.0, 39.0, 44.0, 41.0, 47.0, 36.0, 52.0, 46.0, 48.0, 39.0, 55.0, 47.0, 39.0, 33.0, 44.0, 40.0, 33.0, 27.0, 19.0, 13.0, 21.0, 15.0, 15.0, 6.0, 9.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.454493522644043, -4.313096523284912, -4.1717000007629395, -4.030303001403809, -3.888906240463257, -3.747509479522705, -3.606112480163574, -3.4647157192230225, -3.3233189582824707, -3.181922197341919, -3.040525436401367, -2.8991284370422363, -2.7577316761016846, -2.616334915161133, -2.474937915802002, -2.33354115486145, -2.1921443939208984, -2.0507476329803467, -1.9093507528305054, -1.767953872680664, -1.6265571117401123, -1.4851603507995605, -1.3437634706497192, -1.202366590499878, -1.0609698295593262, -0.9195730090141296, -0.7781761884689331, -0.6367793679237366, -0.49538254737854004, -0.3539857268333435, -0.21258890628814697, -0.07119208574295044, 0.0702052116394043, 0.21160203218460083, 0.35299885272979736, 0.4943956732749939, 0.6357924938201904, 0.777189314365387, 0.9185861349105835, 1.0599830150604248, 1.2013797760009766, 1.3427765369415283, 1.4841734170913696, 1.625570297241211, 1.7669670581817627, 1.9083638191223145, 2.0497608184814453, 2.191157579421997, 2.332554340362549, 2.4739511013031006, 2.6153478622436523, 2.756744861602783, 2.898141622543335, 3.0395383834838867, 3.1809353828430176, 3.3223321437835693, 3.463728904724121, 3.605125665664673, 3.7465224266052246, 3.8879194259643555, 4.029315948486328, 4.170712947845459, 4.31210994720459, 4.4535064697265625, 4.594903469085693]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 10.0, 11.0, 18.0, 21.0, 35.0, 40.0, 70.0, 102.0, 138.0, 186.0, 285.0, 338.0, 487.0, 696.0, 1064.0, 1523.0, 2224.0, 3368.0, 5281.0, 7921.0, 12840.0, 21309.0, 35744.0, 62162.0, 110326.0, 193761.0, 236413.0, 147733.0, 82743.0, 47543.0, 27830.0, 16728.0, 10297.0, 6455.0, 4110.0, 2704.0, 1829.0, 1242.0, 865.0, 626.0, 448.0, 288.0, 222.0, 149.0, 110.0, 71.0, 51.0, 55.0, 28.0, 17.0, 16.0, 9.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0], "bins": [-6.4296875, -6.2303466796875, -6.031005859375, -5.8316650390625, -5.63232421875, -5.4329833984375, -5.233642578125, -5.0343017578125, -4.8349609375, -4.6356201171875, -4.436279296875, -4.2369384765625, -4.03759765625, -3.8382568359375, -3.638916015625, -3.4395751953125, -3.240234375, -3.0408935546875, -2.841552734375, -2.6422119140625, -2.44287109375, -2.2435302734375, -2.044189453125, -1.8448486328125, -1.6455078125, -1.4461669921875, -1.246826171875, -1.0474853515625, -0.84814453125, -0.6488037109375, -0.449462890625, -0.2501220703125, -0.05078125, 0.1485595703125, 0.347900390625, 0.5472412109375, 0.74658203125, 0.9459228515625, 1.145263671875, 1.3446044921875, 1.5439453125, 1.7432861328125, 1.942626953125, 2.1419677734375, 2.34130859375, 2.5406494140625, 2.739990234375, 2.9393310546875, 3.138671875, 3.3380126953125, 3.537353515625, 3.7366943359375, 3.93603515625, 4.1353759765625, 4.334716796875, 4.5340576171875, 4.7333984375, 4.9327392578125, 5.132080078125, 5.3314208984375, 5.53076171875, 5.7301025390625, 5.929443359375, 6.1287841796875, 6.328125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 6.0, 3.0, 7.0, 11.0, 20.0, 14.0, 19.0, 13.0, 32.0, 36.0, 36.0, 31.0, 36.0, 39.0, 40.0, 35.0, 45.0, 38.0, 51.0, 48.0, 43.0, 44.0, 31.0, 33.0, 33.0, 42.0, 30.0, 27.0, 25.0, 24.0, 23.0, 13.0, 11.0, 14.0, 13.0, 7.0, 5.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.623046875, -3.50872802734375, -3.3944091796875, -3.28009033203125, -3.165771484375, -3.05145263671875, -2.9371337890625, -2.82281494140625, -2.70849609375, -2.59417724609375, -2.4798583984375, -2.36553955078125, -2.251220703125, -2.13690185546875, -2.0225830078125, -1.90826416015625, -1.7939453125, -1.67962646484375, -1.5653076171875, -1.45098876953125, -1.336669921875, -1.22235107421875, -1.1080322265625, -0.99371337890625, -0.87939453125, -0.76507568359375, -0.6507568359375, -0.53643798828125, -0.422119140625, -0.30780029296875, -0.1934814453125, -0.07916259765625, 0.03515625, 0.14947509765625, 0.2637939453125, 0.37811279296875, 0.492431640625, 0.60675048828125, 0.7210693359375, 0.83538818359375, 0.94970703125, 1.06402587890625, 1.1783447265625, 1.29266357421875, 1.406982421875, 1.52130126953125, 1.6356201171875, 1.74993896484375, 1.8642578125, 1.97857666015625, 2.0928955078125, 2.20721435546875, 2.321533203125, 2.43585205078125, 2.5501708984375, 2.66448974609375, 2.77880859375, 2.89312744140625, 3.0074462890625, 3.12176513671875, 3.236083984375, 3.35040283203125, 3.4647216796875, 3.57904052734375, 3.693359375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 7.0, 15.0, 11.0, 22.0, 24.0, 39.0, 67.0, 106.0, 162.0, 242.0, 344.0, 638.0, 1008.0, 1735.0, 2844.0, 4880.0, 9472.0, 18117.0, 36485.0, 74783.0, 156770.0, 293212.0, 228252.0, 110668.0, 53043.0, 25977.0, 13076.0, 7111.0, 3759.0, 2229.0, 1262.0, 806.0, 516.0, 315.0, 199.0, 114.0, 70.0, 62.0, 30.0, 33.0, 17.0, 12.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.83984375, -7.593017578125, -7.34619140625, -7.099365234375, -6.8525390625, -6.605712890625, -6.35888671875, -6.112060546875, -5.865234375, -5.618408203125, -5.37158203125, -5.124755859375, -4.8779296875, -4.631103515625, -4.38427734375, -4.137451171875, -3.890625, -3.643798828125, -3.39697265625, -3.150146484375, -2.9033203125, -2.656494140625, -2.40966796875, -2.162841796875, -1.916015625, -1.669189453125, -1.42236328125, -1.175537109375, -0.9287109375, -0.681884765625, -0.43505859375, -0.188232421875, 0.05859375, 0.305419921875, 0.55224609375, 0.799072265625, 1.0458984375, 1.292724609375, 1.53955078125, 1.786376953125, 2.033203125, 2.280029296875, 2.52685546875, 2.773681640625, 3.0205078125, 3.267333984375, 3.51416015625, 3.760986328125, 4.0078125, 4.254638671875, 4.50146484375, 4.748291015625, 4.9951171875, 5.241943359375, 5.48876953125, 5.735595703125, 5.982421875, 6.229248046875, 6.47607421875, 6.722900390625, 6.9697265625, 7.216552734375, 7.46337890625, 7.710205078125, 7.95703125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 9.0, 8.0, 10.0, 7.0, 4.0, 15.0, 11.0, 17.0, 28.0, 18.0, 25.0, 22.0, 33.0, 23.0, 37.0, 28.0, 25.0, 45.0, 34.0, 27.0, 31.0, 39.0, 44.0, 34.0, 35.0, 34.0, 28.0, 22.0, 40.0, 25.0, 24.0, 27.0, 23.0, 27.0, 15.0, 15.0, 21.0, 12.0, 11.0, 10.0, 12.0, 8.0, 7.0, 2.0, 7.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.984375, -1.9246368408203125, -1.864898681640625, -1.8051605224609375, -1.74542236328125, -1.6856842041015625, -1.625946044921875, -1.5662078857421875, -1.5064697265625, -1.4467315673828125, -1.386993408203125, -1.3272552490234375, -1.26751708984375, -1.2077789306640625, -1.148040771484375, -1.0883026123046875, -1.028564453125, -0.9688262939453125, -0.909088134765625, -0.8493499755859375, -0.78961181640625, -0.7298736572265625, -0.670135498046875, -0.6103973388671875, -0.5506591796875, -0.4909210205078125, -0.431182861328125, -0.3714447021484375, -0.31170654296875, -0.2519683837890625, -0.192230224609375, -0.1324920654296875, -0.07275390625, -0.0130157470703125, 0.046722412109375, 0.1064605712890625, 0.16619873046875, 0.2259368896484375, 0.285675048828125, 0.3454132080078125, 0.4051513671875, 0.4648895263671875, 0.524627685546875, 0.5843658447265625, 0.64410400390625, 0.7038421630859375, 0.763580322265625, 0.8233184814453125, 0.883056640625, 0.9427947998046875, 1.002532958984375, 1.0622711181640625, 1.12200927734375, 1.1817474365234375, 1.241485595703125, 1.3012237548828125, 1.3609619140625, 1.4207000732421875, 1.480438232421875, 1.5401763916015625, 1.59991455078125, 1.6596527099609375, 1.719390869140625, 1.7791290283203125, 1.8388671875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 13.0, 4.0, 9.0, 10.0, 25.0, 35.0, 40.0, 74.0, 108.0, 163.0, 241.0, 369.0, 500.0, 785.0, 1189.0, 1860.0, 3053.0, 5174.0, 9029.0, 17356.0, 38469.0, 114845.0, 693228.0, 92203.0, 33394.0, 15606.0, 8213.0, 4717.0, 2729.0, 1798.0, 1119.0, 699.0, 468.0, 326.0, 209.0, 160.0, 107.0, 81.0, 58.0, 30.0, 20.0, 21.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.39739990234375, -4.2479248046875, -4.09844970703125, -3.948974609375, -3.79949951171875, -3.6500244140625, -3.50054931640625, -3.35107421875, -3.20159912109375, -3.0521240234375, -2.90264892578125, -2.753173828125, -2.60369873046875, -2.4542236328125, -2.30474853515625, -2.1552734375, -2.00579833984375, -1.8563232421875, -1.70684814453125, -1.557373046875, -1.40789794921875, -1.2584228515625, -1.10894775390625, -0.95947265625, -0.80999755859375, -0.6605224609375, -0.51104736328125, -0.361572265625, -0.21209716796875, -0.0626220703125, 0.08685302734375, 0.236328125, 0.38580322265625, 0.5352783203125, 0.68475341796875, 0.834228515625, 0.98370361328125, 1.1331787109375, 1.28265380859375, 1.43212890625, 1.58160400390625, 1.7310791015625, 1.88055419921875, 2.030029296875, 2.17950439453125, 2.3289794921875, 2.47845458984375, 2.6279296875, 2.77740478515625, 2.9268798828125, 3.07635498046875, 3.225830078125, 3.37530517578125, 3.5247802734375, 3.67425537109375, 3.82373046875, 3.97320556640625, 4.1226806640625, 4.27215576171875, 4.421630859375, 4.57110595703125, 4.7205810546875, 4.87005615234375, 5.01953125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 4.0, 8.0, 11.0, 20.0, 34.0, 29.0, 46.0, 87.0, 266.0, 218.0, 84.0, 45.0, 33.0, 29.0, 14.0, 11.0, 12.0, 6.0, 5.0, 7.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001983642578125, -0.00019127130508422852, -0.00018417835235595703, -0.00017708539962768555, -0.00016999244689941406, -0.00016289949417114258, -0.0001558065414428711, -0.0001487135887145996, -0.00014162063598632812, -0.00013452768325805664, -0.00012743473052978516, -0.00012034177780151367, -0.00011324882507324219, -0.0001061558723449707, -9.906291961669922e-05, -9.196996688842773e-05, -8.487701416015625e-05, -7.778406143188477e-05, -7.069110870361328e-05, -6.35981559753418e-05, -5.650520324707031e-05, -4.941225051879883e-05, -4.2319297790527344e-05, -3.522634506225586e-05, -2.8133392333984375e-05, -2.104043960571289e-05, -1.3947486877441406e-05, -6.854534149169922e-06, 2.384185791015625e-07, 7.331371307373047e-06, 1.4424324035644531e-05, 2.1517276763916016e-05, 2.86102294921875e-05, 3.5703182220458984e-05, 4.279613494873047e-05, 4.988908767700195e-05, 5.698204040527344e-05, 6.407499313354492e-05, 7.11679458618164e-05, 7.826089859008789e-05, 8.535385131835938e-05, 9.244680404663086e-05, 9.953975677490234e-05, 0.00010663270950317383, 0.00011372566223144531, 0.0001208186149597168, 0.00012791156768798828, 0.00013500452041625977, 0.00014209747314453125, 0.00014919042587280273, 0.00015628337860107422, 0.0001633763313293457, 0.0001704692840576172, 0.00017756223678588867, 0.00018465518951416016, 0.00019174814224243164, 0.00019884109497070312, 0.0002059340476989746, 0.0002130270004272461, 0.00022011995315551758, 0.00022721290588378906, 0.00023430585861206055, 0.00024139881134033203, 0.0002484917640686035, 0.000255584716796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 12.0, 13.0, 14.0, 27.0, 34.0, 41.0, 69.0, 95.0, 153.0, 255.0, 343.0, 530.0, 896.0, 1308.0, 2295.0, 3899.0, 7527.0, 15444.0, 38945.0, 161610.0, 711501.0, 60093.0, 21402.0, 9619.0, 5047.0, 2856.0, 1673.0, 956.0, 650.0, 395.0, 295.0, 199.0, 97.0, 75.0, 56.0, 41.0, 27.0, 18.0, 17.0, 9.0, 9.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.8203125, -5.64495849609375, -5.4696044921875, -5.29425048828125, -5.118896484375, -4.94354248046875, -4.7681884765625, -4.59283447265625, -4.41748046875, -4.24212646484375, -4.0667724609375, -3.89141845703125, -3.716064453125, -3.54071044921875, -3.3653564453125, -3.19000244140625, -3.0146484375, -2.83929443359375, -2.6639404296875, -2.48858642578125, -2.313232421875, -2.13787841796875, -1.9625244140625, -1.78717041015625, -1.61181640625, -1.43646240234375, -1.2611083984375, -1.08575439453125, -0.910400390625, -0.73504638671875, -0.5596923828125, -0.38433837890625, -0.208984375, -0.03363037109375, 0.1417236328125, 0.31707763671875, 0.492431640625, 0.66778564453125, 0.8431396484375, 1.01849365234375, 1.19384765625, 1.36920166015625, 1.5445556640625, 1.71990966796875, 1.895263671875, 2.07061767578125, 2.2459716796875, 2.42132568359375, 2.5966796875, 2.77203369140625, 2.9473876953125, 3.12274169921875, 3.298095703125, 3.47344970703125, 3.6488037109375, 3.82415771484375, 3.99951171875, 4.17486572265625, 4.3502197265625, 4.52557373046875, 4.700927734375, 4.87628173828125, 5.0516357421875, 5.22698974609375, 5.40234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 12.0, 13.0, 14.0, 16.0, 18.0, 25.0, 38.0, 42.0, 53.0, 246.0, 243.0, 54.0, 49.0, 27.0, 30.0, 23.0, 19.0, 10.0, 8.0, 7.0, 6.0, 6.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.0654754638671875, -1.024505615234375, -0.9835357666015625, -0.94256591796875, -0.9015960693359375, -0.860626220703125, -0.8196563720703125, -0.7786865234375, -0.7377166748046875, -0.696746826171875, -0.6557769775390625, -0.61480712890625, -0.5738372802734375, -0.532867431640625, -0.4918975830078125, -0.450927734375, -0.4099578857421875, -0.368988037109375, -0.3280181884765625, -0.28704833984375, -0.2460784912109375, -0.205108642578125, -0.1641387939453125, -0.1231689453125, -0.0821990966796875, -0.041229248046875, -0.0002593994140625, 0.04071044921875, 0.0816802978515625, 0.122650146484375, 0.1636199951171875, 0.20458984375, 0.2455596923828125, 0.286529541015625, 0.3274993896484375, 0.36846923828125, 0.4094390869140625, 0.450408935546875, 0.4913787841796875, 0.5323486328125, 0.5733184814453125, 0.614288330078125, 0.6552581787109375, 0.69622802734375, 0.7371978759765625, 0.778167724609375, 0.8191375732421875, 0.860107421875, 0.9010772705078125, 0.942047119140625, 0.9830169677734375, 1.02398681640625, 1.0649566650390625, 1.105926513671875, 1.1468963623046875, 1.1878662109375, 1.2288360595703125, 1.269805908203125, 1.3107757568359375, 1.35174560546875, 1.3927154541015625, 1.433685302734375, 1.4746551513671875, 1.515625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 4.0, 7.0, 4.0, 3.0, 7.0, 9.0, 26.0, 27.0, 32.0, 47.0, 69.0, 88.0, 105.0, 117.0, 94.0, 69.0, 59.0, 44.0, 43.0, 30.0, 22.0, 12.0, 16.0, 15.0, 8.0, 9.0, 1.0, 6.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.172679901123047, -6.003029823303223, -5.83337926864624, -5.663728713989258, -5.494078636169434, -5.324428558349609, -5.154778003692627, -4.9851274490356445, -4.81547737121582, -4.645827293395996, -4.476176738739014, -4.306526184082031, -4.136876106262207, -3.9672257900238037, -3.7975754737854004, -3.627925157546997, -3.4582748413085938, -3.2886245250701904, -3.118974208831787, -2.949323892593384, -2.7796735763549805, -2.610023260116577, -2.440372943878174, -2.2707226276397705, -2.101072311401367, -1.9314219951629639, -1.7617716789245605, -1.5921213626861572, -1.422471046447754, -1.2528207302093506, -1.0831704139709473, -0.913520097732544, -0.7438693046569824, -0.5742189884185791, -0.4045686721801758, -0.23491835594177246, -0.06526803970336914, 0.10438227653503418, 0.2740325927734375, 0.4436829090118408, 0.6133332252502441, 0.7829835414886475, 0.9526338577270508, 1.122284173965454, 1.2919344902038574, 1.4615848064422607, 1.631235122680664, 1.8008854389190674, 1.9705357551574707, 2.140186071395874, 2.3098363876342773, 2.4794867038726807, 2.649137020111084, 2.8187873363494873, 2.9884376525878906, 3.158087968826294, 3.3277382850646973, 3.4973886013031006, 3.667038917541504, 3.8366892337799072, 4.0063395500183105, 4.175990104675293, 4.345640182495117, 4.515290260314941, 4.684940814971924]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 13.0, 9.0, 15.0, 15.0, 14.0, 16.0, 9.0, 34.0, 24.0, 34.0, 29.0, 26.0, 42.0, 37.0, 44.0, 41.0, 35.0, 39.0, 42.0, 40.0, 49.0, 39.0, 30.0, 28.0, 28.0, 28.0, 22.0, 31.0, 30.0, 25.0, 21.0, 6.0, 16.0, 6.0, 14.0, 12.0, 7.0, 7.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.4337317943573, -3.326493263244629, -3.219254732131958, -3.112016201019287, -3.004777669906616, -2.8975391387939453, -2.7903008460998535, -2.6830620765686035, -2.5758237838745117, -2.468585252761841, -2.36134672164917, -2.254108190536499, -2.146869659423828, -2.0396311283111572, -1.9323927164077759, -1.825154185295105, -1.7179155349731445, -1.6106770038604736, -1.5034384727478027, -1.3961999416351318, -1.288961410522461, -1.18172287940979, -1.0744844675064087, -0.9672459363937378, -0.8600074052810669, -0.752768874168396, -0.6455303430557251, -0.538291871547699, -0.4310533404350281, -0.3238148093223572, -0.21657633781433105, -0.10933780670166016, -0.0020995140075683594, 0.10513900220394135, 0.21237751841545105, 0.31961601972579956, 0.42685455083847046, 0.5340930819511414, 0.6413315534591675, 0.7485700845718384, 0.8558086156845093, 0.9630471467971802, 1.070285677909851, 1.1775240898132324, 1.2847626209259033, 1.3920011520385742, 1.4992396831512451, 1.606478214263916, 1.713716745376587, 1.8209552764892578, 1.9281938076019287, 2.0354323387145996, 2.1426708698272705, 2.2499094009399414, 2.357147693634033, 2.464386463165283, 2.571624755859375, 2.678863286972046, 2.786101818084717, 2.8933403491973877, 3.0005788803100586, 3.1078174114227295, 3.2150559425354004, 3.322294235229492, 3.429533004760742]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 12.0, 18.0, 31.0, 31.0, 55.0, 61.0, 67.0, 117.0, 125.0, 173.0, 246.0, 339.0, 472.0, 605.0, 853.0, 1133.0, 1552.0, 2173.0, 3137.0, 4374.0, 6350.0, 9265.0, 14482.0, 22518.0, 37074.0, 64063.0, 121377.0, 282150.0, 912688.0, 1674629.0, 594929.0, 197877.0, 93896.0, 52122.0, 30811.0, 19662.0, 12905.0, 8665.0, 6323.0, 4502.0, 3158.0, 2355.0, 1745.0, 1340.0, 969.0, 712.0, 534.0, 435.0, 316.0, 214.0, 168.0, 129.0, 104.0, 74.0, 58.0, 41.0, 31.0, 27.0, 13.0, 7.0, 3.0, 2.0], "bins": [-4.51171875, -4.36773681640625, -4.2237548828125, -4.07977294921875, -3.935791015625, -3.79180908203125, -3.6478271484375, -3.50384521484375, -3.35986328125, -3.21588134765625, -3.0718994140625, -2.92791748046875, -2.783935546875, -2.63995361328125, -2.4959716796875, -2.35198974609375, -2.2080078125, -2.06402587890625, -1.9200439453125, -1.77606201171875, -1.632080078125, -1.48809814453125, -1.3441162109375, -1.20013427734375, -1.05615234375, -0.91217041015625, -0.7681884765625, -0.62420654296875, -0.480224609375, -0.33624267578125, -0.1922607421875, -0.04827880859375, 0.095703125, 0.23968505859375, 0.3836669921875, 0.52764892578125, 0.671630859375, 0.81561279296875, 0.9595947265625, 1.10357666015625, 1.24755859375, 1.39154052734375, 1.5355224609375, 1.67950439453125, 1.823486328125, 1.96746826171875, 2.1114501953125, 2.25543212890625, 2.3994140625, 2.54339599609375, 2.6873779296875, 2.83135986328125, 2.975341796875, 3.11932373046875, 3.2633056640625, 3.40728759765625, 3.55126953125, 3.69525146484375, 3.8392333984375, 3.98321533203125, 4.127197265625, 4.27117919921875, 4.4151611328125, 4.55914306640625, 4.703125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 4.0, 12.0, 12.0, 9.0, 15.0, 15.0, 17.0, 20.0, 35.0, 28.0, 29.0, 31.0, 43.0, 35.0, 45.0, 40.0, 40.0, 34.0, 41.0, 36.0, 44.0, 44.0, 34.0, 35.0, 24.0, 35.0, 27.0, 20.0, 24.0, 26.0, 24.0, 13.0, 14.0, 13.0, 9.0, 9.0, 12.0, 11.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.296875, -2.228118896484375, -2.15936279296875, -2.090606689453125, -2.0218505859375, -1.953094482421875, -1.88433837890625, -1.815582275390625, -1.746826171875, -1.678070068359375, -1.60931396484375, -1.540557861328125, -1.4718017578125, -1.403045654296875, -1.33428955078125, -1.265533447265625, -1.19677734375, -1.128021240234375, -1.05926513671875, -0.990509033203125, -0.9217529296875, -0.852996826171875, -0.78424072265625, -0.715484619140625, -0.646728515625, -0.577972412109375, -0.50921630859375, -0.440460205078125, -0.3717041015625, -0.302947998046875, -0.23419189453125, -0.165435791015625, -0.0966796875, -0.027923583984375, 0.04083251953125, 0.109588623046875, 0.1783447265625, 0.247100830078125, 0.31585693359375, 0.384613037109375, 0.453369140625, 0.522125244140625, 0.59088134765625, 0.659637451171875, 0.7283935546875, 0.797149658203125, 0.86590576171875, 0.934661865234375, 1.00341796875, 1.072174072265625, 1.14093017578125, 1.209686279296875, 1.2784423828125, 1.347198486328125, 1.41595458984375, 1.484710693359375, 1.553466796875, 1.622222900390625, 1.69097900390625, 1.759735107421875, 1.8284912109375, 1.897247314453125, 1.96600341796875, 2.034759521484375, 2.103515625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 8.0, 4.0, 8.0, 9.0, 9.0, 25.0, 38.0, 44.0, 62.0, 71.0, 116.0, 200.0, 277.0, 379.0, 577.0, 905.0, 1342.0, 2228.0, 3555.0, 5676.0, 9702.0, 17008.0, 31077.0, 60004.0, 126267.0, 298833.0, 896770.0, 1732232.0, 586804.0, 216676.0, 95990.0, 47136.0, 24824.0, 14049.0, 8075.0, 4881.0, 3001.0, 1901.0, 1248.0, 774.0, 456.0, 340.0, 213.0, 156.0, 109.0, 84.0, 39.0, 31.0, 29.0, 16.0, 7.0, 9.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0], "bins": [-4.875, -4.72418212890625, -4.5733642578125, -4.42254638671875, -4.271728515625, -4.12091064453125, -3.9700927734375, -3.81927490234375, -3.66845703125, -3.51763916015625, -3.3668212890625, -3.21600341796875, -3.065185546875, -2.91436767578125, -2.7635498046875, -2.61273193359375, -2.4619140625, -2.31109619140625, -2.1602783203125, -2.00946044921875, -1.858642578125, -1.70782470703125, -1.5570068359375, -1.40618896484375, -1.25537109375, -1.10455322265625, -0.9537353515625, -0.80291748046875, -0.652099609375, -0.50128173828125, -0.3504638671875, -0.19964599609375, -0.048828125, 0.10198974609375, 0.2528076171875, 0.40362548828125, 0.554443359375, 0.70526123046875, 0.8560791015625, 1.00689697265625, 1.15771484375, 1.30853271484375, 1.4593505859375, 1.61016845703125, 1.760986328125, 1.91180419921875, 2.0626220703125, 2.21343994140625, 2.3642578125, 2.51507568359375, 2.6658935546875, 2.81671142578125, 2.967529296875, 3.11834716796875, 3.2691650390625, 3.41998291015625, 3.57080078125, 3.72161865234375, 3.8724365234375, 4.02325439453125, 4.174072265625, 4.32489013671875, 4.4757080078125, 4.62652587890625, 4.77734375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 6.0, 10.0, 14.0, 25.0, 27.0, 24.0, 37.0, 43.0, 52.0, 62.0, 80.0, 107.0, 131.0, 145.0, 201.0, 225.0, 281.0, 322.0, 346.0, 336.0, 306.0, 225.0, 197.0, 176.0, 133.0, 102.0, 90.0, 68.0, 75.0, 41.0, 43.0, 36.0, 18.0, 16.0, 9.0, 10.0, 4.0, 6.0, 15.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.361328125, -1.31982421875, -1.2783203125, -1.23681640625, -1.1953125, -1.15380859375, -1.1123046875, -1.07080078125, -1.029296875, -0.98779296875, -0.9462890625, -0.90478515625, -0.86328125, -0.82177734375, -0.7802734375, -0.73876953125, -0.697265625, -0.65576171875, -0.6142578125, -0.57275390625, -0.53125, -0.48974609375, -0.4482421875, -0.40673828125, -0.365234375, -0.32373046875, -0.2822265625, -0.24072265625, -0.19921875, -0.15771484375, -0.1162109375, -0.07470703125, -0.033203125, 0.00830078125, 0.0498046875, 0.09130859375, 0.1328125, 0.17431640625, 0.2158203125, 0.25732421875, 0.298828125, 0.34033203125, 0.3818359375, 0.42333984375, 0.46484375, 0.50634765625, 0.5478515625, 0.58935546875, 0.630859375, 0.67236328125, 0.7138671875, 0.75537109375, 0.796875, 0.83837890625, 0.8798828125, 0.92138671875, 0.962890625, 1.00439453125, 1.0458984375, 1.08740234375, 1.12890625, 1.17041015625, 1.2119140625, 1.25341796875, 1.294921875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 8.0, 20.0, 24.0, 17.0, 29.0, 54.0, 79.0, 108.0, 140.0, 125.0, 94.0, 81.0, 53.0, 38.0, 23.0, 23.0, 19.0, 10.0, 3.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58712100982666, -5.431973934173584, -5.276827335357666, -5.12168025970459, -4.966533184051514, -4.8113861083984375, -4.6562395095825195, -4.501092433929443, -4.345945358276367, -4.190798282623291, -4.035651683807373, -3.880504608154297, -3.7253575325012207, -3.5702106952667236, -3.4150638580322266, -3.2599167823791504, -3.1047701835632324, -2.9496233463287354, -2.794476270675659, -2.639329433441162, -2.484182357788086, -2.329035520553589, -2.173888683319092, -2.0187416076660156, -1.8635947704315186, -1.708447813987732, -1.5533008575439453, -1.3981540203094482, -1.2430070638656616, -1.087860107421875, -0.9327132105827332, -0.7775663137435913, -0.6224188804626465, -0.46727195382118225, -0.312125027179718, -0.15697810053825378, -0.0018311738967895508, 0.15331578254699707, 0.3084626793861389, 0.46360957622528076, 0.6187565326690674, 0.773903489112854, 0.9290503859519958, 1.0841972827911377, 1.2393442392349243, 1.394491195678711, 1.549638032913208, 1.7047849893569946, 1.8599319458007812, 2.0150787830352783, 2.1702258586883545, 2.3253726959228516, 2.4805197715759277, 2.635666608810425, 2.790813446044922, 2.945960521697998, 3.101107358932495, 3.256254196166992, 3.4114012718200684, 3.5665481090545654, 3.7216949462890625, 3.8768420219421387, 4.031989097595215, 4.187135696411133, 4.342282772064209]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 10.0, 5.0, 7.0, 5.0, 7.0, 7.0, 11.0, 17.0, 10.0, 16.0, 15.0, 22.0, 22.0, 24.0, 23.0, 32.0, 30.0, 53.0, 32.0, 28.0, 31.0, 28.0, 40.0, 37.0, 55.0, 24.0, 31.0, 40.0, 46.0, 29.0, 32.0, 37.0, 38.0, 18.0, 17.0, 18.0, 16.0, 12.0, 11.0, 10.0, 9.0, 8.0, 14.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.541909694671631, -2.4657373428344727, -2.3895652294158936, -2.3133928775787354, -2.237220525741577, -2.161048412322998, -2.08487606048584, -2.0087037086486816, -1.9325315952301025, -1.8563593626022339, -1.7801870107650757, -1.704014778137207, -1.6278425455093384, -1.5516703128814697, -1.4754979610443115, -1.3993257284164429, -1.3231533765792847, -1.246981143951416, -1.1708087921142578, -1.0946365594863892, -1.0184643268585205, -0.9422920346260071, -0.8661197423934937, -0.789947509765625, -0.7137752175331116, -0.6376029253005981, -0.5614306926727295, -0.48525840044021606, -0.409086138010025, -0.332913875579834, -0.25674158334732056, -0.1805693507194519, -0.10439705848693848, -0.02822478860616684, 0.0479474812746048, 0.12411975860595703, 0.20029202103614807, 0.2764642834663391, 0.35263657569885254, 0.4288088083267212, 0.5049811005592346, 0.581153392791748, 0.6573256254196167, 0.7334979176521301, 0.8096702098846436, 0.8858424425125122, 0.9620147347450256, 1.038187026977539, 1.1143592596054077, 1.1905314922332764, 1.2667038440704346, 1.3428760766983032, 1.4190483093261719, 1.49522066116333, 1.5713928937911987, 1.6475651264190674, 1.7237374782562256, 1.7999097108840942, 1.8760820627212524, 1.952254295349121, 2.0284266471862793, 2.1045987606048584, 2.1807711124420166, 2.2569432258605957, 2.333115577697754]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 13.0, 12.0, 12.0, 15.0, 25.0, 40.0, 57.0, 97.0, 127.0, 176.0, 279.0, 384.0, 675.0, 964.0, 1506.0, 2413.0, 4000.0, 6566.0, 11059.0, 20009.0, 36848.0, 73141.0, 157496.0, 314532.0, 213402.0, 97509.0, 47362.0, 24858.0, 13975.0, 8095.0, 4791.0, 2977.0, 1805.0, 1175.0, 743.0, 479.0, 291.0, 201.0, 133.0, 101.0, 68.0, 41.0, 42.0, 22.0, 17.0, 7.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9560546875, -1.8979949951171875, -1.839935302734375, -1.7818756103515625, -1.72381591796875, -1.6657562255859375, -1.607696533203125, -1.5496368408203125, -1.4915771484375, -1.4335174560546875, -1.375457763671875, -1.3173980712890625, -1.25933837890625, -1.2012786865234375, -1.143218994140625, -1.0851593017578125, -1.027099609375, -0.9690399169921875, -0.910980224609375, -0.8529205322265625, -0.79486083984375, -0.7368011474609375, -0.678741455078125, -0.6206817626953125, -0.5626220703125, -0.5045623779296875, -0.446502685546875, -0.3884429931640625, -0.33038330078125, -0.2723236083984375, -0.214263916015625, -0.1562042236328125, -0.09814453125, -0.0400848388671875, 0.017974853515625, 0.0760345458984375, 0.13409423828125, 0.1921539306640625, 0.250213623046875, 0.3082733154296875, 0.3663330078125, 0.4243927001953125, 0.482452392578125, 0.5405120849609375, 0.59857177734375, 0.6566314697265625, 0.714691162109375, 0.7727508544921875, 0.830810546875, 0.8888702392578125, 0.946929931640625, 1.0049896240234375, 1.06304931640625, 1.1211090087890625, 1.179168701171875, 1.2372283935546875, 1.2952880859375, 1.3533477783203125, 1.411407470703125, 1.4694671630859375, 1.52752685546875, 1.5855865478515625, 1.643646240234375, 1.7017059326171875, 1.759765625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 6.0, 6.0, 10.0, 10.0, 12.0, 8.0, 22.0, 13.0, 20.0, 21.0, 24.0, 29.0, 29.0, 36.0, 41.0, 29.0, 31.0, 39.0, 36.0, 31.0, 37.0, 41.0, 45.0, 41.0, 35.0, 40.0, 36.0, 38.0, 34.0, 29.0, 19.0, 21.0, 17.0, 13.0, 19.0, 10.0, 9.0, 7.0, 6.0, 6.0, 12.0, 4.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.572265625, -2.493072509765625, -2.41387939453125, -2.334686279296875, -2.2554931640625, -2.176300048828125, -2.09710693359375, -2.017913818359375, -1.938720703125, -1.859527587890625, -1.78033447265625, -1.701141357421875, -1.6219482421875, -1.542755126953125, -1.46356201171875, -1.384368896484375, -1.30517578125, -1.225982666015625, -1.14678955078125, -1.067596435546875, -0.9884033203125, -0.909210205078125, -0.83001708984375, -0.750823974609375, -0.671630859375, -0.592437744140625, -0.51324462890625, -0.434051513671875, -0.3548583984375, -0.275665283203125, -0.19647216796875, -0.117279052734375, -0.0380859375, 0.041107177734375, 0.12030029296875, 0.199493408203125, 0.2786865234375, 0.357879638671875, 0.43707275390625, 0.516265869140625, 0.595458984375, 0.674652099609375, 0.75384521484375, 0.833038330078125, 0.9122314453125, 0.991424560546875, 1.07061767578125, 1.149810791015625, 1.22900390625, 1.308197021484375, 1.38739013671875, 1.466583251953125, 1.5457763671875, 1.624969482421875, 1.70416259765625, 1.783355712890625, 1.862548828125, 1.941741943359375, 2.02093505859375, 2.100128173828125, 2.1793212890625, 2.258514404296875, 2.33770751953125, 2.416900634765625, 2.49609375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 13.0, 5.0, 9.0, 26.0, 21.0, 33.0, 45.0, 99.0, 102.0, 176.0, 225.0, 343.0, 482.0, 638.0, 1022.0, 1457.0, 2204.0, 3321.0, 5402.0, 10022.0, 20976.0, 57246.0, 262757.0, 529102.0, 91990.0, 29270.0, 12865.0, 6819.0, 4012.0, 2625.0, 1686.0, 1065.0, 702.0, 508.0, 357.0, 259.0, 190.0, 113.0, 100.0, 78.0, 54.0, 35.0, 23.0, 27.0, 17.0, 14.0, 7.0, 7.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.96484375, -2.87811279296875, -2.7913818359375, -2.70465087890625, -2.617919921875, -2.53118896484375, -2.4444580078125, -2.35772705078125, -2.27099609375, -2.18426513671875, -2.0975341796875, -2.01080322265625, -1.924072265625, -1.83734130859375, -1.7506103515625, -1.66387939453125, -1.5771484375, -1.49041748046875, -1.4036865234375, -1.31695556640625, -1.230224609375, -1.14349365234375, -1.0567626953125, -0.97003173828125, -0.88330078125, -0.79656982421875, -0.7098388671875, -0.62310791015625, -0.536376953125, -0.44964599609375, -0.3629150390625, -0.27618408203125, -0.189453125, -0.10272216796875, -0.0159912109375, 0.07073974609375, 0.157470703125, 0.24420166015625, 0.3309326171875, 0.41766357421875, 0.50439453125, 0.59112548828125, 0.6778564453125, 0.76458740234375, 0.851318359375, 0.93804931640625, 1.0247802734375, 1.11151123046875, 1.1982421875, 1.28497314453125, 1.3717041015625, 1.45843505859375, 1.545166015625, 1.63189697265625, 1.7186279296875, 1.80535888671875, 1.89208984375, 1.97882080078125, 2.0655517578125, 2.15228271484375, 2.239013671875, 2.32574462890625, 2.4124755859375, 2.49920654296875, 2.5859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 8.0, 18.0, 14.0, 16.0, 15.0, 19.0, 27.0, 20.0, 24.0, 24.0, 27.0, 41.0, 30.0, 35.0, 34.0, 37.0, 49.0, 48.0, 45.0, 41.0, 49.0, 44.0, 37.0, 29.0, 41.0, 27.0, 24.0, 20.0, 23.0, 19.0, 14.0, 12.0, 11.0, 16.0, 10.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6865234375, -1.6344451904296875, -1.582366943359375, -1.5302886962890625, -1.47821044921875, -1.4261322021484375, -1.374053955078125, -1.3219757080078125, -1.2698974609375, -1.2178192138671875, -1.165740966796875, -1.1136627197265625, -1.06158447265625, -1.0095062255859375, -0.957427978515625, -0.9053497314453125, -0.853271484375, -0.8011932373046875, -0.749114990234375, -0.6970367431640625, -0.64495849609375, -0.5928802490234375, -0.540802001953125, -0.4887237548828125, -0.4366455078125, -0.3845672607421875, -0.332489013671875, -0.2804107666015625, -0.22833251953125, -0.1762542724609375, -0.124176025390625, -0.0720977783203125, -0.02001953125, 0.0320587158203125, 0.084136962890625, 0.1362152099609375, 0.18829345703125, 0.2403717041015625, 0.292449951171875, 0.3445281982421875, 0.3966064453125, 0.4486846923828125, 0.500762939453125, 0.5528411865234375, 0.60491943359375, 0.6569976806640625, 0.709075927734375, 0.7611541748046875, 0.813232421875, 0.8653106689453125, 0.917388916015625, 0.9694671630859375, 1.02154541015625, 1.0736236572265625, 1.125701904296875, 1.1777801513671875, 1.2298583984375, 1.2819366455078125, 1.334014892578125, 1.3860931396484375, 1.43817138671875, 1.4902496337890625, 1.542327880859375, 1.5944061279296875, 1.646484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 1.0, 11.0, 11.0, 14.0, 13.0, 31.0, 38.0, 42.0, 56.0, 90.0, 137.0, 171.0, 270.0, 337.0, 512.0, 700.0, 1083.0, 1555.0, 2760.0, 4777.0, 9779.0, 23228.0, 71947.0, 611475.0, 240049.0, 44899.0, 16352.0, 7348.0, 3976.0, 2320.0, 1430.0, 1000.0, 662.0, 445.0, 300.0, 202.0, 145.0, 109.0, 93.0, 42.0, 46.0, 26.0, 21.0, 11.0, 15.0, 5.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.245361328125, -0.23713302612304688, -0.22890472412109375, -0.22067642211914062, -0.2124481201171875, -0.20421981811523438, -0.19599151611328125, -0.18776321411132812, -0.179534912109375, -0.17130661010742188, -0.16307830810546875, -0.15485000610351562, -0.1466217041015625, -0.13839340209960938, -0.13016510009765625, -0.12193679809570312, -0.11370849609375, -0.10548019409179688, -0.09725189208984375, -0.08902359008789062, -0.0807952880859375, -0.07256698608398438, -0.06433868408203125, -0.056110382080078125, -0.047882080078125, -0.039653778076171875, -0.03142547607421875, -0.023197174072265625, -0.0149688720703125, -0.006740570068359375, 0.00148773193359375, 0.009716033935546875, 0.0179443359375, 0.026172637939453125, 0.03440093994140625, 0.042629241943359375, 0.0508575439453125, 0.059085845947265625, 0.06731414794921875, 0.07554244995117188, 0.083770751953125, 0.09199905395507812, 0.10022735595703125, 0.10845565795898438, 0.1166839599609375, 0.12491226196289062, 0.13314056396484375, 0.14136886596679688, 0.14959716796875, 0.15782546997070312, 0.16605377197265625, 0.17428207397460938, 0.1825103759765625, 0.19073867797851562, 0.19896697998046875, 0.20719528198242188, 0.215423583984375, 0.22365188598632812, 0.23188018798828125, 0.24010848999023438, 0.2483367919921875, 0.2565650939941406, 0.26479339599609375, 0.2730216979980469, 0.28125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 8.0, 13.0, 10.0, 17.0, 21.0, 22.0, 26.0, 46.0, 66.0, 70.0, 90.0, 138.0, 163.0, 77.0, 66.0, 41.0, 36.0, 25.0, 23.0, 13.0, 6.0, 3.0, 4.0, 3.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.436471939086914e-05, -1.3600103557109833e-05, -1.2835487723350525e-05, -1.2070871889591217e-05, -1.130625605583191e-05, -1.0541640222072601e-05, -9.777024388313293e-06, -9.012408554553986e-06, -8.247792720794678e-06, -7.48317688703537e-06, -6.718561053276062e-06, -5.953945219516754e-06, -5.189329385757446e-06, -4.4247135519981384e-06, -3.6600977182388306e-06, -2.8954818844795227e-06, -2.130866050720215e-06, -1.366250216960907e-06, -6.016343832015991e-07, 1.6298145055770874e-07, 9.275972843170166e-07, 1.6922131180763245e-06, 2.4568289518356323e-06, 3.22144478559494e-06, 3.986060619354248e-06, 4.750676453113556e-06, 5.515292286872864e-06, 6.279908120632172e-06, 7.0445239543914795e-06, 7.809139788150787e-06, 8.573755621910095e-06, 9.338371455669403e-06, 1.0102987289428711e-05, 1.0867603123188019e-05, 1.1632218956947327e-05, 1.2396834790706635e-05, 1.3161450624465942e-05, 1.392606645822525e-05, 1.4690682291984558e-05, 1.5455298125743866e-05, 1.6219913959503174e-05, 1.698452979326248e-05, 1.774914562702179e-05, 1.8513761460781097e-05, 1.9278377294540405e-05, 2.0042993128299713e-05, 2.080760896205902e-05, 2.157222479581833e-05, 2.2336840629577637e-05, 2.3101456463336945e-05, 2.3866072297096252e-05, 2.463068813085556e-05, 2.5395303964614868e-05, 2.6159919798374176e-05, 2.6924535632133484e-05, 2.7689151465892792e-05, 2.84537672996521e-05, 2.9218383133411407e-05, 2.9982998967170715e-05, 3.074761480093002e-05, 3.151223063468933e-05, 3.227684646844864e-05, 3.304146230220795e-05, 3.3806078135967255e-05, 3.457069396972656e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 20.0, 19.0, 30.0, 24.0, 48.0, 68.0, 90.0, 132.0, 161.0, 239.0, 306.0, 441.0, 670.0, 934.0, 1381.0, 2082.0, 3041.0, 4787.0, 8089.0, 13786.0, 26028.0, 53544.0, 141936.0, 456558.0, 195190.0, 66866.0, 30488.0, 15965.0, 9458.0, 5543.0, 3395.0, 2327.0, 1450.0, 1015.0, 664.0, 474.0, 340.0, 244.0, 175.0, 130.0, 96.0, 88.0, 47.0, 51.0, 33.0, 26.0, 25.0, 13.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0], "bins": [-0.19189453125, -0.18582725524902344, -0.17975997924804688, -0.1736927032470703, -0.16762542724609375, -0.1615581512451172, -0.15549087524414062, -0.14942359924316406, -0.1433563232421875, -0.13728904724121094, -0.13122177124023438, -0.1251544952392578, -0.11908721923828125, -0.11301994323730469, -0.10695266723632812, -0.10088539123535156, -0.094818115234375, -0.08875083923339844, -0.08268356323242188, -0.07661628723144531, -0.07054901123046875, -0.06448173522949219, -0.058414459228515625, -0.05234718322753906, -0.0462799072265625, -0.04021263122558594, -0.034145355224609375, -0.028078079223632812, -0.02201080322265625, -0.015943527221679688, -0.009876251220703125, -0.0038089752197265625, 0.00225830078125, 0.008325576782226562, 0.014392852783203125, 0.020460128784179688, 0.02652740478515625, 0.03259468078613281, 0.038661956787109375, 0.04472923278808594, 0.0507965087890625, 0.05686378479003906, 0.06293106079101562, 0.06899833679199219, 0.07506561279296875, 0.08113288879394531, 0.08720016479492188, 0.09326744079589844, 0.099334716796875, 0.10540199279785156, 0.11146926879882812, 0.11753654479980469, 0.12360382080078125, 0.1296710968017578, 0.13573837280273438, 0.14180564880371094, 0.1478729248046875, 0.15394020080566406, 0.16000747680664062, 0.1660747528076172, 0.17214202880859375, 0.1782093048095703, 0.18427658081054688, 0.19034385681152344, 0.1964111328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 0.0, 7.0, 7.0, 10.0, 6.0, 12.0, 9.0, 18.0, 14.0, 26.0, 35.0, 28.0, 37.0, 47.0, 53.0, 61.0, 86.0, 80.0, 63.0, 76.0, 57.0, 46.0, 33.0, 40.0, 23.0, 19.0, 18.0, 15.0, 13.0, 13.0, 12.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.047882080078125, -0.04639387130737305, -0.044905662536621094, -0.04341745376586914, -0.04192924499511719, -0.040441036224365234, -0.03895282745361328, -0.03746461868286133, -0.035976409912109375, -0.03448820114135742, -0.03299999237060547, -0.031511783599853516, -0.030023574829101562, -0.02853536605834961, -0.027047157287597656, -0.025558948516845703, -0.02407073974609375, -0.022582530975341797, -0.021094322204589844, -0.01960611343383789, -0.018117904663085938, -0.016629695892333984, -0.015141487121582031, -0.013653278350830078, -0.012165069580078125, -0.010676860809326172, -0.009188652038574219, -0.007700443267822266, -0.0062122344970703125, -0.004724025726318359, -0.0032358169555664062, -0.0017476081848144531, -0.0002593994140625, 0.0012288093566894531, 0.0027170181274414062, 0.004205226898193359, 0.0056934356689453125, 0.007181644439697266, 0.008669853210449219, 0.010158061981201172, 0.011646270751953125, 0.013134479522705078, 0.014622688293457031, 0.016110897064208984, 0.017599105834960938, 0.01908731460571289, 0.020575523376464844, 0.022063732147216797, 0.02355194091796875, 0.025040149688720703, 0.026528358459472656, 0.02801656723022461, 0.029504776000976562, 0.030992984771728516, 0.03248119354248047, 0.03396940231323242, 0.035457611083984375, 0.03694581985473633, 0.03843402862548828, 0.039922237396240234, 0.04141044616699219, 0.04289865493774414, 0.044386863708496094, 0.04587507247924805, 0.04736328125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 6.0, 6.0, 5.0, 8.0, 13.0, 24.0, 19.0, 19.0, 30.0, 44.0, 86.0, 118.0, 145.0, 115.0, 88.0, 67.0, 56.0, 39.0, 30.0, 18.0, 21.0, 9.0, 7.0, 4.0, 5.0, 8.0, 6.0, 0.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.326508522033691, -5.178043365478516, -5.02957820892334, -4.881113052368164, -4.732647895812988, -4.5841827392578125, -4.435717582702637, -4.287252426147461, -4.138787269592285, -3.9903221130371094, -3.8418569564819336, -3.693391799926758, -3.544926643371582, -3.3964614868164062, -3.2479963302612305, -3.0995311737060547, -2.951066255569458, -2.8026010990142822, -2.6541359424591064, -2.5056707859039307, -2.357205629348755, -2.208740472793579, -2.0602755546569824, -1.911810278892517, -1.7633451223373413, -1.6148799657821655, -1.4664148092269897, -1.3179497718811035, -1.1694846153259277, -1.021019458770752, -0.8725543022155762, -0.7240891456604004, -0.5756239891052246, -0.42715883255004883, -0.27869370579719543, -0.13022857904434204, 0.01823657751083374, 0.16670173406600952, 0.3151668310165405, 0.4636319875717163, 0.6120971441268921, 0.7605623006820679, 0.9090274572372437, 1.0574924945831299, 1.2059576511383057, 1.3544228076934814, 1.5028879642486572, 1.651353120803833, 1.7998182773590088, 1.9482834339141846, 2.0967485904693604, 2.245213747024536, 2.393678903579712, 2.5421440601348877, 2.6906089782714844, 2.83907413482666, 2.987539291381836, 3.1360044479370117, 3.2844696044921875, 3.4329347610473633, 3.581399917602539, 3.729865074157715, 3.8783302307128906, 4.026795387268066, 4.175260543823242]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 9.0, 6.0, 8.0, 5.0, 9.0, 4.0, 11.0, 14.0, 13.0, 19.0, 15.0, 17.0, 25.0, 24.0, 24.0, 32.0, 31.0, 47.0, 34.0, 34.0, 25.0, 29.0, 40.0, 39.0, 52.0, 29.0, 31.0, 38.0, 41.0, 34.0, 32.0, 37.0, 36.0, 18.0, 18.0, 20.0, 14.0, 11.0, 13.0, 8.0, 8.0, 10.0, 11.0, 10.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.490424156188965, -2.4156510829925537, -2.3408777713775635, -2.2661046981811523, -2.191331624984741, -2.11655855178833, -2.04178524017334, -1.9670121669769287, -1.8922390937805176, -1.817465901374817, -1.7426928281784058, -1.667919635772705, -1.593146562576294, -1.5183733701705933, -1.4436001777648926, -1.3688271045684814, -1.2940539121627808, -1.21928071975708, -1.144507646560669, -1.0697344541549683, -0.9949613809585571, -0.9201881885528564, -0.8454150557518005, -0.7706419229507446, -0.6958687901496887, -0.6210956573486328, -0.5463225245475769, -0.4715493619441986, -0.3967762291431427, -0.3220030963420868, -0.2472299337387085, -0.1724568009376526, -0.09768366813659668, -0.022910527884960175, 0.05186261236667633, 0.12663576006889343, 0.20140889286994934, 0.27618202567100525, 0.35095518827438354, 0.42572832107543945, 0.5005014538764954, 0.5752745866775513, 0.6500477194786072, 0.7248208522796631, 0.7995940446853638, 0.8743671178817749, 0.9491403102874756, 1.0239133834838867, 1.0986865758895874, 1.173459768295288, 1.2482328414916992, 1.3230060338974, 1.397779107093811, 1.4725522994995117, 1.5473253726959229, 1.6220985651016235, 1.6968717575073242, 1.771644949913025, 1.846418023109436, 1.9211912155151367, 1.9959642887115479, 2.070737361907959, 2.145510673522949, 2.2202837467193604, 2.2950568199157715]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 9.0, 13.0, 19.0, 24.0, 40.0, 55.0, 80.0, 121.0, 143.0, 207.0, 280.0, 406.0, 679.0, 996.0, 1508.0, 2380.0, 3678.0, 6048.0, 9804.0, 16382.0, 28677.0, 50931.0, 92691.0, 169435.0, 248467.0, 182328.0, 100920.0, 55225.0, 31054.0, 17646.0, 10580.0, 6409.0, 3949.0, 2498.0, 1600.0, 1000.0, 737.0, 474.0, 336.0, 197.0, 167.0, 102.0, 73.0, 46.0, 38.0, 43.0, 21.0, 15.0, 9.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-4.15234375, -4.02081298828125, -3.8892822265625, -3.75775146484375, -3.626220703125, -3.49468994140625, -3.3631591796875, -3.23162841796875, -3.10009765625, -2.96856689453125, -2.8370361328125, -2.70550537109375, -2.573974609375, -2.44244384765625, -2.3109130859375, -2.17938232421875, -2.0478515625, -1.91632080078125, -1.7847900390625, -1.65325927734375, -1.521728515625, -1.39019775390625, -1.2586669921875, -1.12713623046875, -0.99560546875, -0.86407470703125, -0.7325439453125, -0.60101318359375, -0.469482421875, -0.33795166015625, -0.2064208984375, -0.07489013671875, 0.056640625, 0.18817138671875, 0.3197021484375, 0.45123291015625, 0.582763671875, 0.71429443359375, 0.8458251953125, 0.97735595703125, 1.10888671875, 1.24041748046875, 1.3719482421875, 1.50347900390625, 1.635009765625, 1.76654052734375, 1.8980712890625, 2.02960205078125, 2.1611328125, 2.29266357421875, 2.4241943359375, 2.55572509765625, 2.687255859375, 2.81878662109375, 2.9503173828125, 3.08184814453125, 3.21337890625, 3.34490966796875, 3.4764404296875, 3.60797119140625, 3.739501953125, 3.87103271484375, 4.0025634765625, 4.13409423828125, 4.265625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3.0, 5.0, 4.0, 10.0, 9.0, 12.0, 9.0, 18.0, 23.0, 14.0, 22.0, 18.0, 22.0, 43.0, 18.0, 28.0, 40.0, 36.0, 35.0, 32.0, 49.0, 35.0, 37.0, 38.0, 40.0, 41.0, 40.0, 34.0, 39.0, 39.0, 27.0, 27.0, 21.0, 22.0, 16.0, 13.0, 11.0, 13.0, 10.0, 5.0, 7.0, 9.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0], "bins": [-2.35546875, -2.286041259765625, -2.21661376953125, -2.147186279296875, -2.0777587890625, -2.008331298828125, -1.93890380859375, -1.869476318359375, -1.800048828125, -1.730621337890625, -1.66119384765625, -1.591766357421875, -1.5223388671875, -1.452911376953125, -1.38348388671875, -1.314056396484375, -1.24462890625, -1.175201416015625, -1.10577392578125, -1.036346435546875, -0.9669189453125, -0.897491455078125, -0.82806396484375, -0.758636474609375, -0.689208984375, -0.619781494140625, -0.55035400390625, -0.480926513671875, -0.4114990234375, -0.342071533203125, -0.27264404296875, -0.203216552734375, -0.1337890625, -0.064361572265625, 0.00506591796875, 0.074493408203125, 0.1439208984375, 0.213348388671875, 0.28277587890625, 0.352203369140625, 0.421630859375, 0.491058349609375, 0.56048583984375, 0.629913330078125, 0.6993408203125, 0.768768310546875, 0.83819580078125, 0.907623291015625, 0.97705078125, 1.046478271484375, 1.11590576171875, 1.185333251953125, 1.2547607421875, 1.324188232421875, 1.39361572265625, 1.463043212890625, 1.532470703125, 1.601898193359375, 1.67132568359375, 1.740753173828125, 1.8101806640625, 1.879608154296875, 1.94903564453125, 2.018463134765625, 2.087890625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 9.0, 16.0, 20.0, 27.0, 43.0, 63.0, 83.0, 140.0, 183.0, 293.0, 451.0, 758.0, 1306.0, 2140.0, 3873.0, 6656.0, 12636.0, 23786.0, 46019.0, 91712.0, 187222.0, 298235.0, 185044.0, 90545.0, 45288.0, 23446.0, 12407.0, 6679.0, 3903.0, 2135.0, 1283.0, 764.0, 497.0, 300.0, 189.0, 117.0, 71.0, 63.0, 42.0, 33.0, 21.0, 17.0, 11.0, 3.0, 3.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.71484375, -4.56512451171875, -4.4154052734375, -4.26568603515625, -4.115966796875, -3.96624755859375, -3.8165283203125, -3.66680908203125, -3.51708984375, -3.36737060546875, -3.2176513671875, -3.06793212890625, -2.918212890625, -2.76849365234375, -2.6187744140625, -2.46905517578125, -2.3193359375, -2.16961669921875, -2.0198974609375, -1.87017822265625, -1.720458984375, -1.57073974609375, -1.4210205078125, -1.27130126953125, -1.12158203125, -0.97186279296875, -0.8221435546875, -0.67242431640625, -0.522705078125, -0.37298583984375, -0.2232666015625, -0.07354736328125, 0.076171875, 0.22589111328125, 0.3756103515625, 0.52532958984375, 0.675048828125, 0.82476806640625, 0.9744873046875, 1.12420654296875, 1.27392578125, 1.42364501953125, 1.5733642578125, 1.72308349609375, 1.872802734375, 2.02252197265625, 2.1722412109375, 2.32196044921875, 2.4716796875, 2.62139892578125, 2.7711181640625, 2.92083740234375, 3.070556640625, 3.22027587890625, 3.3699951171875, 3.51971435546875, 3.66943359375, 3.81915283203125, 3.9688720703125, 4.11859130859375, 4.268310546875, 4.41802978515625, 4.5677490234375, 4.71746826171875, 4.8671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 12.0, 10.0, 7.0, 12.0, 7.0, 12.0, 21.0, 19.0, 10.0, 20.0, 27.0, 20.0, 31.0, 21.0, 21.0, 34.0, 33.0, 29.0, 36.0, 55.0, 28.0, 29.0, 33.0, 44.0, 30.0, 34.0, 39.0, 35.0, 37.0, 34.0, 35.0, 23.0, 14.0, 24.0, 13.0, 14.0, 16.0, 14.0, 14.0, 11.0, 8.0, 7.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0], "bins": [-1.5771484375, -1.533599853515625, -1.49005126953125, -1.446502685546875, -1.4029541015625, -1.359405517578125, -1.31585693359375, -1.272308349609375, -1.228759765625, -1.185211181640625, -1.14166259765625, -1.098114013671875, -1.0545654296875, -1.011016845703125, -0.96746826171875, -0.923919677734375, -0.88037109375, -0.836822509765625, -0.79327392578125, -0.749725341796875, -0.7061767578125, -0.662628173828125, -0.61907958984375, -0.575531005859375, -0.531982421875, -0.488433837890625, -0.44488525390625, -0.401336669921875, -0.3577880859375, -0.314239501953125, -0.27069091796875, -0.227142333984375, -0.18359375, -0.140045166015625, -0.09649658203125, -0.052947998046875, -0.0093994140625, 0.034149169921875, 0.07769775390625, 0.121246337890625, 0.164794921875, 0.208343505859375, 0.25189208984375, 0.295440673828125, 0.3389892578125, 0.382537841796875, 0.42608642578125, 0.469635009765625, 0.51318359375, 0.556732177734375, 0.60028076171875, 0.643829345703125, 0.6873779296875, 0.730926513671875, 0.77447509765625, 0.818023681640625, 0.861572265625, 0.905120849609375, 0.94866943359375, 0.992218017578125, 1.0357666015625, 1.079315185546875, 1.12286376953125, 1.166412353515625, 1.2099609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 12.0, 19.0, 16.0, 29.0, 37.0, 48.0, 65.0, 109.0, 157.0, 224.0, 327.0, 437.0, 720.0, 1191.0, 1791.0, 3067.0, 5360.0, 10342.0, 21455.0, 57541.0, 309100.0, 524408.0, 63566.0, 23365.0, 10751.0, 5854.0, 3094.0, 1880.0, 1214.0, 776.0, 502.0, 358.0, 221.0, 150.0, 98.0, 75.0, 54.0, 41.0, 32.0, 22.0, 13.0, 11.0, 2.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.15234375, -4.02276611328125, -3.8931884765625, -3.76361083984375, -3.634033203125, -3.50445556640625, -3.3748779296875, -3.24530029296875, -3.11572265625, -2.98614501953125, -2.8565673828125, -2.72698974609375, -2.597412109375, -2.46783447265625, -2.3382568359375, -2.20867919921875, -2.0791015625, -1.94952392578125, -1.8199462890625, -1.69036865234375, -1.560791015625, -1.43121337890625, -1.3016357421875, -1.17205810546875, -1.04248046875, -0.91290283203125, -0.7833251953125, -0.65374755859375, -0.524169921875, -0.39459228515625, -0.2650146484375, -0.13543701171875, -0.005859375, 0.12371826171875, 0.2532958984375, 0.38287353515625, 0.512451171875, 0.64202880859375, 0.7716064453125, 0.90118408203125, 1.03076171875, 1.16033935546875, 1.2899169921875, 1.41949462890625, 1.549072265625, 1.67864990234375, 1.8082275390625, 1.93780517578125, 2.0673828125, 2.19696044921875, 2.3265380859375, 2.45611572265625, 2.585693359375, 2.71527099609375, 2.8448486328125, 2.97442626953125, 3.10400390625, 3.23358154296875, 3.3631591796875, 3.49273681640625, 3.622314453125, 3.75189208984375, 3.8814697265625, 4.01104736328125, 4.140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 8.0, 11.0, 11.0, 14.0, 39.0, 48.0, 59.0, 115.0, 250.0, 167.0, 84.0, 57.0, 30.0, 35.0, 19.0, 13.0, 14.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013208389282226562, -0.00012674182653427124, -0.00012139976024627686, -0.00011605769395828247, -0.00011071562767028809, -0.0001053735613822937, -0.00010003149509429932, -9.468942880630493e-05, -8.934736251831055e-05, -8.400529623031616e-05, -7.866322994232178e-05, -7.332116365432739e-05, -6.797909736633301e-05, -6.263703107833862e-05, -5.729496479034424e-05, -5.1952898502349854e-05, -4.661083221435547e-05, -4.1268765926361084e-05, -3.59266996383667e-05, -3.0584633350372314e-05, -2.524256706237793e-05, -1.9900500774383545e-05, -1.455843448638916e-05, -9.216368198394775e-06, -3.874301910400391e-06, 1.4677643775939941e-06, 6.809830665588379e-06, 1.2151896953582764e-05, 1.749396324157715e-05, 2.2836029529571533e-05, 2.8178095817565918e-05, 3.35201621055603e-05, 3.886222839355469e-05, 4.420429468154907e-05, 4.954636096954346e-05, 5.488842725753784e-05, 6.0230493545532227e-05, 6.557255983352661e-05, 7.0914626121521e-05, 7.625669240951538e-05, 8.159875869750977e-05, 8.694082498550415e-05, 9.228289127349854e-05, 9.762495756149292e-05, 0.0001029670238494873, 0.00010830909013748169, 0.00011365115642547607, 0.00011899322271347046, 0.00012433528900146484, 0.00012967735528945923, 0.0001350194215774536, 0.000140361487865448, 0.00014570355415344238, 0.00015104562044143677, 0.00015638768672943115, 0.00016172975301742554, 0.00016707181930541992, 0.0001724138855934143, 0.0001777559518814087, 0.00018309801816940308, 0.00018844008445739746, 0.00019378215074539185, 0.00019912421703338623, 0.00020446628332138062, 0.000209808349609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 15.0, 26.0, 27.0, 39.0, 56.0, 66.0, 98.0, 150.0, 186.0, 309.0, 440.0, 653.0, 1023.0, 1562.0, 2601.0, 4631.0, 8516.0, 18518.0, 48610.0, 253502.0, 600625.0, 61986.0, 21907.0, 9759.0, 5254.0, 2847.0, 1785.0, 1092.0, 708.0, 491.0, 318.0, 213.0, 153.0, 106.0, 70.0, 49.0, 43.0, 36.0, 21.0, 13.0, 8.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.98480224609375, -3.8524169921875, -3.72003173828125, -3.587646484375, -3.45526123046875, -3.3228759765625, -3.19049072265625, -3.05810546875, -2.92572021484375, -2.7933349609375, -2.66094970703125, -2.528564453125, -2.39617919921875, -2.2637939453125, -2.13140869140625, -1.9990234375, -1.86663818359375, -1.7342529296875, -1.60186767578125, -1.469482421875, -1.33709716796875, -1.2047119140625, -1.07232666015625, -0.93994140625, -0.80755615234375, -0.6751708984375, -0.54278564453125, -0.410400390625, -0.27801513671875, -0.1456298828125, -0.01324462890625, 0.119140625, 0.25152587890625, 0.3839111328125, 0.51629638671875, 0.648681640625, 0.78106689453125, 0.9134521484375, 1.04583740234375, 1.17822265625, 1.31060791015625, 1.4429931640625, 1.57537841796875, 1.707763671875, 1.84014892578125, 1.9725341796875, 2.10491943359375, 2.2373046875, 2.36968994140625, 2.5020751953125, 2.63446044921875, 2.766845703125, 2.89923095703125, 3.0316162109375, 3.16400146484375, 3.29638671875, 3.42877197265625, 3.5611572265625, 3.69354248046875, 3.825927734375, 3.95831298828125, 4.0906982421875, 4.22308349609375, 4.35546875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 12.0, 9.0, 12.0, 19.0, 26.0, 31.0, 30.0, 70.0, 96.0, 269.0, 124.0, 70.0, 55.0, 34.0, 29.0, 31.0, 17.0, 9.0, 10.0, 2.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.17425537109375, -1.1395263671875, -1.10479736328125, -1.070068359375, -1.03533935546875, -1.0006103515625, -0.96588134765625, -0.93115234375, -0.89642333984375, -0.8616943359375, -0.82696533203125, -0.792236328125, -0.75750732421875, -0.7227783203125, -0.68804931640625, -0.6533203125, -0.61859130859375, -0.5838623046875, -0.54913330078125, -0.514404296875, -0.47967529296875, -0.4449462890625, -0.41021728515625, -0.37548828125, -0.34075927734375, -0.3060302734375, -0.27130126953125, -0.236572265625, -0.20184326171875, -0.1671142578125, -0.13238525390625, -0.09765625, -0.06292724609375, -0.0281982421875, 0.00653076171875, 0.041259765625, 0.07598876953125, 0.1107177734375, 0.14544677734375, 0.18017578125, 0.21490478515625, 0.2496337890625, 0.28436279296875, 0.319091796875, 0.35382080078125, 0.3885498046875, 0.42327880859375, 0.4580078125, 0.49273681640625, 0.5274658203125, 0.56219482421875, 0.596923828125, 0.63165283203125, 0.6663818359375, 0.70111083984375, 0.73583984375, 0.77056884765625, 0.8052978515625, 0.84002685546875, 0.874755859375, 0.90948486328125, 0.9442138671875, 0.97894287109375, 1.013671875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 11.0, 10.0, 5.0, 8.0, 15.0, 29.0, 29.0, 43.0, 73.0, 86.0, 111.0, 124.0, 100.0, 81.0, 63.0, 41.0, 37.0, 30.0, 17.0, 20.0, 18.0, 6.0, 5.0, 9.0, 4.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1635384559631348, -3.0378291606903076, -2.9121196269989014, -2.786410331726074, -2.660700798034668, -2.534991502761841, -2.4092822074890137, -2.2835726737976074, -2.1578633785247803, -2.032154083251953, -1.9064445495605469, -1.7807352542877197, -1.655025839805603, -1.5293164253234863, -1.4036071300506592, -1.2778977155685425, -1.1521883010864258, -1.026478886604309, -0.9007695317268372, -0.7750601768493652, -0.6493507623672485, -0.5236413478851318, -0.3979319930076599, -0.272222638130188, -0.1465132236480713, -0.020803838968276978, 0.10490554571151733, 0.23061493039131165, 0.35632431507110596, 0.48203372955322266, 0.6077430844306946, 0.7334524393081665, 0.859161376953125, 0.9848707914352417, 1.1105802059173584, 1.2362895011901855, 1.3619989156723022, 1.487708330154419, 1.613417625427246, 1.7391270399093628, 1.8648364543914795, 1.9905458688735962, 2.116255283355713, 2.24196457862854, 2.367673873901367, 2.4933834075927734, 2.6190927028656006, 2.7448019981384277, 2.870511531829834, 2.996220827102661, 3.1219303607940674, 3.2476396560668945, 3.373349189758301, 3.499058485031128, 3.624767780303955, 3.7504773139953613, 3.8761866092681885, 4.001895904541016, 4.127605438232422, 4.253314971923828, 4.379024028778076, 4.504733562469482, 4.630443096160889, 4.756152153015137, 4.881861686706543]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 7.0, 11.0, 9.0, 11.0, 11.0, 13.0, 14.0, 8.0, 21.0, 17.0, 20.0, 22.0, 23.0, 24.0, 41.0, 33.0, 32.0, 28.0, 37.0, 28.0, 36.0, 45.0, 33.0, 47.0, 36.0, 27.0, 31.0, 39.0, 35.0, 25.0, 26.0, 29.0, 28.0, 23.0, 22.0, 16.0, 10.0, 13.0, 11.0, 9.0, 12.0, 6.0, 5.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0], "bins": [-2.2608718872070312, -2.189943790435791, -2.119015693664551, -2.0480875968933105, -1.9771595001220703, -1.90623140335083, -1.8353033065795898, -1.7643752098083496, -1.6934471130371094, -1.6225190162658691, -1.551590919494629, -1.4806628227233887, -1.4097347259521484, -1.3388066291809082, -1.267878532409668, -1.1969504356384277, -1.126022458076477, -1.0550943613052368, -0.9841662645339966, -0.9132381677627563, -0.8423100709915161, -0.7713819742202759, -0.7004539370536804, -0.6295258402824402, -0.5585977435112, -0.4876696467399597, -0.4167415499687195, -0.34581348299980164, -0.2748853862285614, -0.20395728945732117, -0.13302922248840332, -0.062101125717163086, 0.008826971054077148, 0.07975506037473679, 0.15068314969539642, 0.22161123156547546, 0.2925393283367157, 0.36346742510795593, 0.4343954920768738, 0.505323588848114, 0.5762516856193542, 0.6471797823905945, 0.7181078791618347, 0.7890359163284302, 0.8599640130996704, 0.9308921098709106, 1.0018202066421509, 1.0727483034133911, 1.1436764001846313, 1.2146044969558716, 1.2855325937271118, 1.356460690498352, 1.4273887872695923, 1.4983168840408325, 1.5692448616027832, 1.6401729583740234, 1.7111010551452637, 1.782029151916504, 1.8529572486877441, 1.9238853454589844, 1.9948134422302246, 2.065741539001465, 2.136669635772705, 2.2075977325439453, 2.2785258293151855]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 16.0, 27.0, 25.0, 48.0, 67.0, 112.0, 162.0, 210.0, 351.0, 499.0, 742.0, 1095.0, 1545.0, 2317.0, 3464.0, 5210.0, 7751.0, 11901.0, 19137.0, 31851.0, 56262.0, 110166.0, 255584.0, 865289.0, 1796762.0, 605181.0, 201033.0, 93453.0, 49388.0, 28342.0, 16766.0, 10235.0, 6706.0, 4063.0, 2802.0, 1722.0, 1282.0, 825.0, 594.0, 387.0, 298.0, 173.0, 126.0, 113.0, 55.0, 51.0, 21.0, 24.0, 19.0, 10.0, 10.0, 8.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.064453125, -2.956451416015625, -2.84844970703125, -2.740447998046875, -2.6324462890625, -2.524444580078125, -2.41644287109375, -2.308441162109375, -2.200439453125, -2.092437744140625, -1.98443603515625, -1.876434326171875, -1.7684326171875, -1.660430908203125, -1.55242919921875, -1.444427490234375, -1.33642578125, -1.228424072265625, -1.12042236328125, -1.012420654296875, -0.9044189453125, -0.796417236328125, -0.68841552734375, -0.580413818359375, -0.472412109375, -0.364410400390625, -0.25640869140625, -0.148406982421875, -0.0404052734375, 0.067596435546875, 0.17559814453125, 0.283599853515625, 0.3916015625, 0.499603271484375, 0.60760498046875, 0.715606689453125, 0.8236083984375, 0.931610107421875, 1.03961181640625, 1.147613525390625, 1.255615234375, 1.363616943359375, 1.47161865234375, 1.579620361328125, 1.6876220703125, 1.795623779296875, 1.90362548828125, 2.011627197265625, 2.11962890625, 2.227630615234375, 2.33563232421875, 2.443634033203125, 2.5516357421875, 2.659637451171875, 2.76763916015625, 2.875640869140625, 2.983642578125, 3.091644287109375, 3.19964599609375, 3.307647705078125, 3.4156494140625, 3.523651123046875, 3.63165283203125, 3.739654541015625, 3.84765625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 8.0, 10.0, 11.0, 9.0, 16.0, 11.0, 14.0, 18.0, 27.0, 20.0, 21.0, 21.0, 25.0, 30.0, 32.0, 32.0, 34.0, 41.0, 42.0, 36.0, 34.0, 37.0, 41.0, 28.0, 35.0, 31.0, 30.0, 31.0, 32.0, 30.0, 29.0, 21.0, 16.0, 20.0, 18.0, 14.0, 16.0, 6.0, 9.0, 7.0, 12.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.3310546875, -1.28753662109375, -1.2440185546875, -1.20050048828125, -1.156982421875, -1.11346435546875, -1.0699462890625, -1.02642822265625, -0.98291015625, -0.93939208984375, -0.8958740234375, -0.85235595703125, -0.808837890625, -0.76531982421875, -0.7218017578125, -0.67828369140625, -0.634765625, -0.59124755859375, -0.5477294921875, -0.50421142578125, -0.460693359375, -0.41717529296875, -0.3736572265625, -0.33013916015625, -0.28662109375, -0.24310302734375, -0.1995849609375, -0.15606689453125, -0.112548828125, -0.06903076171875, -0.0255126953125, 0.01800537109375, 0.0615234375, 0.10504150390625, 0.1485595703125, 0.19207763671875, 0.235595703125, 0.27911376953125, 0.3226318359375, 0.36614990234375, 0.40966796875, 0.45318603515625, 0.4967041015625, 0.54022216796875, 0.583740234375, 0.62725830078125, 0.6707763671875, 0.71429443359375, 0.7578125, 0.80133056640625, 0.8448486328125, 0.88836669921875, 0.931884765625, 0.97540283203125, 1.0189208984375, 1.06243896484375, 1.10595703125, 1.14947509765625, 1.1929931640625, 1.23651123046875, 1.280029296875, 1.32354736328125, 1.3670654296875, 1.41058349609375, 1.4541015625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 7.0, 6.0, 13.0, 20.0, 26.0, 36.0, 65.0, 110.0, 155.0, 233.0, 384.0, 619.0, 1020.0, 1837.0, 2884.0, 4968.0, 9085.0, 16777.0, 31621.0, 63733.0, 140715.0, 362481.0, 1265720.0, 1549768.0, 432836.0, 161091.0, 71324.0, 34823.0, 18228.0, 10089.0, 5627.0, 3248.0, 1830.0, 1042.0, 666.0, 449.0, 277.0, 165.0, 86.0, 71.0, 50.0, 39.0, 29.0, 10.0, 7.0, 5.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.525390625, -3.411956787109375, -3.29852294921875, -3.185089111328125, -3.0716552734375, -2.958221435546875, -2.84478759765625, -2.731353759765625, -2.617919921875, -2.504486083984375, -2.39105224609375, -2.277618408203125, -2.1641845703125, -2.050750732421875, -1.93731689453125, -1.823883056640625, -1.71044921875, -1.597015380859375, -1.48358154296875, -1.370147705078125, -1.2567138671875, -1.143280029296875, -1.02984619140625, -0.916412353515625, -0.802978515625, -0.689544677734375, -0.57611083984375, -0.462677001953125, -0.3492431640625, -0.235809326171875, -0.12237548828125, -0.008941650390625, 0.1044921875, 0.217926025390625, 0.33135986328125, 0.444793701171875, 0.5582275390625, 0.671661376953125, 0.78509521484375, 0.898529052734375, 1.011962890625, 1.125396728515625, 1.23883056640625, 1.352264404296875, 1.4656982421875, 1.579132080078125, 1.69256591796875, 1.805999755859375, 1.91943359375, 2.032867431640625, 2.14630126953125, 2.259735107421875, 2.3731689453125, 2.486602783203125, 2.60003662109375, 2.713470458984375, 2.826904296875, 2.940338134765625, 3.05377197265625, 3.167205810546875, 3.2806396484375, 3.394073486328125, 3.50750732421875, 3.620941162109375, 3.734375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 11.0, 13.0, 20.0, 22.0, 19.0, 42.0, 60.0, 46.0, 92.0, 109.0, 121.0, 154.0, 210.0, 223.0, 280.0, 288.0, 343.0, 303.0, 294.0, 251.0, 244.0, 183.0, 144.0, 121.0, 99.0, 59.0, 75.0, 48.0, 48.0, 33.0, 28.0, 16.0, 13.0, 12.0, 12.0, 10.0, 11.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9580078125, -0.9275054931640625, -0.897003173828125, -0.8665008544921875, -0.83599853515625, -0.8054962158203125, -0.774993896484375, -0.7444915771484375, -0.7139892578125, -0.6834869384765625, -0.652984619140625, -0.6224822998046875, -0.59197998046875, -0.5614776611328125, -0.530975341796875, -0.5004730224609375, -0.469970703125, -0.4394683837890625, -0.408966064453125, -0.3784637451171875, -0.34796142578125, -0.3174591064453125, -0.286956787109375, -0.2564544677734375, -0.2259521484375, -0.1954498291015625, -0.164947509765625, -0.1344451904296875, -0.10394287109375, -0.0734405517578125, -0.042938232421875, -0.0124359130859375, 0.01806640625, 0.0485687255859375, 0.079071044921875, 0.1095733642578125, 0.14007568359375, 0.1705780029296875, 0.201080322265625, 0.2315826416015625, 0.2620849609375, 0.2925872802734375, 0.323089599609375, 0.3535919189453125, 0.38409423828125, 0.4145965576171875, 0.445098876953125, 0.4756011962890625, 0.506103515625, 0.5366058349609375, 0.567108154296875, 0.5976104736328125, 0.62811279296875, 0.6586151123046875, 0.689117431640625, 0.7196197509765625, 0.7501220703125, 0.7806243896484375, 0.811126708984375, 0.8416290283203125, 0.87213134765625, 0.9026336669921875, 0.933135986328125, 0.9636383056640625, 0.994140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 12.0, 27.0, 21.0, 32.0, 42.0, 49.0, 70.0, 81.0, 108.0, 117.0, 87.0, 78.0, 44.0, 46.0, 26.0, 28.0, 21.0, 19.0, 16.0, 8.0, 10.0, 3.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8087220191955566, -2.724217414855957, -2.6397128105163574, -2.555208206176758, -2.470703601837158, -2.3861989974975586, -2.301694393157959, -2.2171897888183594, -2.1326851844787598, -2.04818058013916, -1.9636759757995605, -1.879171371459961, -1.7946667671203613, -1.7101621627807617, -1.625657558441162, -1.5411529541015625, -1.456648349761963, -1.3721437454223633, -1.2876391410827637, -1.203134536743164, -1.1186299324035645, -1.0341253280639648, -0.9496207237243652, -0.8651161193847656, -0.780611515045166, -0.6961069107055664, -0.6116023063659668, -0.5270977020263672, -0.4425930976867676, -0.35808849334716797, -0.27358388900756836, -0.18907928466796875, -0.10457468032836914, -0.02007007598876953, 0.06443452835083008, 0.1489391326904297, 0.2334437370300293, 0.3179483413696289, 0.4024529457092285, 0.4869575500488281, 0.5714621543884277, 0.6559667587280273, 0.740471363067627, 0.8249759674072266, 0.9094805717468262, 0.9939851760864258, 1.0784897804260254, 1.162994384765625, 1.2474989891052246, 1.3320035934448242, 1.4165081977844238, 1.5010128021240234, 1.585517406463623, 1.6700220108032227, 1.7545266151428223, 1.8390312194824219, 1.9235358238220215, 2.008040428161621, 2.0925450325012207, 2.1770496368408203, 2.26155424118042, 2.3460588455200195, 2.430563449859619, 2.5150680541992188, 2.5995726585388184]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 4.0, 8.0, 14.0, 7.0, 13.0, 28.0, 21.0, 22.0, 26.0, 37.0, 34.0, 30.0, 41.0, 39.0, 38.0, 34.0, 36.0, 39.0, 49.0, 45.0, 34.0, 44.0, 53.0, 36.0, 43.0, 32.0, 28.0, 22.0, 25.0, 16.0, 12.0, 9.0, 18.0, 4.0, 6.0, 12.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7918034791946411, -1.73191499710083, -1.672026515007019, -1.612138032913208, -1.5522496700286865, -1.4923611879348755, -1.4324727058410645, -1.3725842237472534, -1.3126957416534424, -1.2528072595596313, -1.1929187774658203, -1.1330304145812988, -1.0731419324874878, -1.0132534503936768, -0.9533649682998657, -0.8934764862060547, -0.8335881233215332, -0.7736996412277222, -0.7138112187385559, -0.6539227366447449, -0.5940343141555786, -0.5341458320617676, -0.47425734996795654, -0.4143688976764679, -0.35448044538497925, -0.2945919930934906, -0.23470352590084076, -0.17481505870819092, -0.11492660641670227, -0.05503815412521362, 0.004850327968597412, 0.06473878026008606, 0.12462735176086426, 0.1845158040523529, 0.24440427124500275, 0.3042927384376526, 0.36418119072914124, 0.4240696430206299, 0.4839581251144409, 0.543846607208252, 0.6037350296974182, 0.6636235117912292, 0.7235119342803955, 0.7834004163742065, 0.8432888984680176, 0.9031773209571838, 0.9630658030509949, 1.0229542255401611, 1.0828427076339722, 1.1427311897277832, 1.2026196718215942, 1.2625081539154053, 1.3223965167999268, 1.3822849988937378, 1.4421734809875488, 1.5020619630813599, 1.561950445175171, 1.621838927268982, 1.681727409362793, 1.7416157722473145, 1.8015042543411255, 1.8613927364349365, 1.9212812185287476, 1.9811697006225586, 2.04105806350708]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 8.0, 12.0, 22.0, 27.0, 34.0, 61.0, 79.0, 109.0, 155.0, 206.0, 295.0, 388.0, 609.0, 838.0, 1264.0, 1757.0, 2707.0, 3820.0, 5879.0, 8940.0, 13800.0, 21847.0, 35173.0, 58661.0, 100384.0, 181124.0, 245591.0, 148030.0, 83172.0, 49317.0, 29747.0, 18776.0, 11894.0, 7794.0, 5072.0, 3365.0, 2350.0, 1586.0, 1046.0, 768.0, 580.0, 370.0, 251.0, 179.0, 126.0, 97.0, 73.0, 57.0, 38.0, 29.0, 14.0, 15.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.80908203125, -0.7840576171875, -0.759033203125, -0.7340087890625, -0.708984375, -0.6839599609375, -0.658935546875, -0.6339111328125, -0.60888671875, -0.5838623046875, -0.558837890625, -0.5338134765625, -0.5087890625, -0.4837646484375, -0.458740234375, -0.4337158203125, -0.40869140625, -0.3836669921875, -0.358642578125, -0.3336181640625, -0.30859375, -0.2835693359375, -0.258544921875, -0.2335205078125, -0.20849609375, -0.1834716796875, -0.158447265625, -0.1334228515625, -0.1083984375, -0.0833740234375, -0.058349609375, -0.0333251953125, -0.00830078125, 0.0167236328125, 0.041748046875, 0.0667724609375, 0.091796875, 0.1168212890625, 0.141845703125, 0.1668701171875, 0.19189453125, 0.2169189453125, 0.241943359375, 0.2669677734375, 0.2919921875, 0.3170166015625, 0.342041015625, 0.3670654296875, 0.39208984375, 0.4171142578125, 0.442138671875, 0.4671630859375, 0.4921875, 0.5172119140625, 0.542236328125, 0.5672607421875, 0.59228515625, 0.6173095703125, 0.642333984375, 0.6673583984375, 0.6923828125, 0.7174072265625, 0.742431640625, 0.7674560546875, 0.79248046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 6.0, 3.0, 7.0, 10.0, 10.0, 10.0, 10.0, 16.0, 17.0, 16.0, 21.0, 23.0, 27.0, 38.0, 33.0, 35.0, 36.0, 25.0, 40.0, 37.0, 37.0, 37.0, 44.0, 27.0, 45.0, 47.0, 34.0, 46.0, 47.0, 23.0, 29.0, 24.0, 17.0, 16.0, 12.0, 12.0, 16.0, 9.0, 17.0, 6.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0], "bins": [-1.873046875, -1.8178253173828125, -1.762603759765625, -1.7073822021484375, -1.65216064453125, -1.5969390869140625, -1.541717529296875, -1.4864959716796875, -1.4312744140625, -1.3760528564453125, -1.320831298828125, -1.2656097412109375, -1.21038818359375, -1.1551666259765625, -1.099945068359375, -1.0447235107421875, -0.989501953125, -0.9342803955078125, -0.879058837890625, -0.8238372802734375, -0.76861572265625, -0.7133941650390625, -0.658172607421875, -0.6029510498046875, -0.5477294921875, -0.4925079345703125, -0.437286376953125, -0.3820648193359375, -0.32684326171875, -0.2716217041015625, -0.216400146484375, -0.1611785888671875, -0.10595703125, -0.0507354736328125, 0.004486083984375, 0.0597076416015625, 0.11492919921875, 0.1701507568359375, 0.225372314453125, 0.2805938720703125, 0.3358154296875, 0.3910369873046875, 0.446258544921875, 0.5014801025390625, 0.55670166015625, 0.6119232177734375, 0.667144775390625, 0.7223663330078125, 0.777587890625, 0.8328094482421875, 0.888031005859375, 0.9432525634765625, 0.99847412109375, 1.0536956787109375, 1.108917236328125, 1.1641387939453125, 1.2193603515625, 1.2745819091796875, 1.329803466796875, 1.3850250244140625, 1.44024658203125, 1.4954681396484375, 1.550689697265625, 1.6059112548828125, 1.6611328125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 10.0, 12.0, 23.0, 27.0, 46.0, 69.0, 78.0, 122.0, 182.0, 262.0, 353.0, 541.0, 850.0, 1310.0, 2119.0, 3470.0, 5953.0, 11482.0, 26031.0, 76192.0, 378353.0, 406557.0, 79973.0, 27141.0, 11738.0, 6020.0, 3492.0, 2145.0, 1376.0, 818.0, 567.0, 373.0, 273.0, 171.0, 124.0, 84.0, 63.0, 38.0, 35.0, 24.0, 12.0, 9.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6748046875, -1.62249755859375, -1.5701904296875, -1.51788330078125, -1.465576171875, -1.41326904296875, -1.3609619140625, -1.30865478515625, -1.25634765625, -1.20404052734375, -1.1517333984375, -1.09942626953125, -1.047119140625, -0.99481201171875, -0.9425048828125, -0.89019775390625, -0.837890625, -0.78558349609375, -0.7332763671875, -0.68096923828125, -0.628662109375, -0.57635498046875, -0.5240478515625, -0.47174072265625, -0.41943359375, -0.36712646484375, -0.3148193359375, -0.26251220703125, -0.210205078125, -0.15789794921875, -0.1055908203125, -0.05328369140625, -0.0009765625, 0.05133056640625, 0.1036376953125, 0.15594482421875, 0.208251953125, 0.26055908203125, 0.3128662109375, 0.36517333984375, 0.41748046875, 0.46978759765625, 0.5220947265625, 0.57440185546875, 0.626708984375, 0.67901611328125, 0.7313232421875, 0.78363037109375, 0.8359375, 0.88824462890625, 0.9405517578125, 0.99285888671875, 1.045166015625, 1.09747314453125, 1.1497802734375, 1.20208740234375, 1.25439453125, 1.30670166015625, 1.3590087890625, 1.41131591796875, 1.463623046875, 1.51593017578125, 1.5682373046875, 1.62054443359375, 1.6728515625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 12.0, 6.0, 7.0, 12.0, 7.0, 9.0, 9.0, 16.0, 18.0, 13.0, 23.0, 21.0, 36.0, 40.0, 28.0, 42.0, 41.0, 34.0, 37.0, 39.0, 35.0, 59.0, 42.0, 44.0, 36.0, 34.0, 39.0, 24.0, 36.0, 22.0, 26.0, 30.0, 20.0, 25.0, 17.0, 16.0, 9.0, 8.0, 6.0, 5.0, 8.0, 2.0, 3.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 4.0], "bins": [-1.2421875, -1.206024169921875, -1.16986083984375, -1.133697509765625, -1.0975341796875, -1.061370849609375, -1.02520751953125, -0.989044189453125, -0.952880859375, -0.916717529296875, -0.88055419921875, -0.844390869140625, -0.8082275390625, -0.772064208984375, -0.73590087890625, -0.699737548828125, -0.66357421875, -0.627410888671875, -0.59124755859375, -0.555084228515625, -0.5189208984375, -0.482757568359375, -0.44659423828125, -0.410430908203125, -0.374267578125, -0.338104248046875, -0.30194091796875, -0.265777587890625, -0.2296142578125, -0.193450927734375, -0.15728759765625, -0.121124267578125, -0.0849609375, -0.048797607421875, -0.01263427734375, 0.023529052734375, 0.0596923828125, 0.095855712890625, 0.13201904296875, 0.168182373046875, 0.204345703125, 0.240509033203125, 0.27667236328125, 0.312835693359375, 0.3489990234375, 0.385162353515625, 0.42132568359375, 0.457489013671875, 0.49365234375, 0.529815673828125, 0.56597900390625, 0.602142333984375, 0.6383056640625, 0.674468994140625, 0.71063232421875, 0.746795654296875, 0.782958984375, 0.819122314453125, 0.85528564453125, 0.891448974609375, 0.9276123046875, 0.963775634765625, 0.99993896484375, 1.036102294921875, 1.072265625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 14.0, 19.0, 11.0, 29.0, 44.0, 65.0, 82.0, 106.0, 120.0, 177.0, 287.0, 311.0, 428.0, 668.0, 898.0, 1328.0, 1963.0, 3039.0, 5057.0, 8704.0, 16806.0, 36447.0, 111646.0, 598500.0, 168291.0, 46569.0, 20121.0, 10191.0, 5824.0, 3526.0, 2306.0, 1510.0, 1056.0, 651.0, 452.0, 381.0, 227.0, 181.0, 137.0, 95.0, 77.0, 41.0, 37.0, 31.0, 20.0, 21.0, 19.0, 5.0, 6.0, 8.0, 4.0, 7.0, 3.0, 4.0], "bins": [-0.109619140625, -0.10635948181152344, -0.10309982299804688, -0.09984016418457031, -0.09658050537109375, -0.09332084655761719, -0.09006118774414062, -0.08680152893066406, -0.0835418701171875, -0.08028221130371094, -0.07702255249023438, -0.07376289367675781, -0.07050323486328125, -0.06724357604980469, -0.06398391723632812, -0.06072425842285156, -0.057464599609375, -0.05420494079589844, -0.050945281982421875, -0.04768562316894531, -0.04442596435546875, -0.04116630554199219, -0.037906646728515625, -0.03464698791503906, -0.0313873291015625, -0.028127670288085938, -0.024868011474609375, -0.021608352661132812, -0.01834869384765625, -0.015089035034179688, -0.011829376220703125, -0.008569717407226562, -0.00531005859375, -0.0020503997802734375, 0.001209259033203125, 0.0044689178466796875, 0.00772857666015625, 0.010988235473632812, 0.014247894287109375, 0.017507553100585938, 0.0207672119140625, 0.024026870727539062, 0.027286529541015625, 0.030546188354492188, 0.03380584716796875, 0.03706550598144531, 0.040325164794921875, 0.04358482360839844, 0.046844482421875, 0.05010414123535156, 0.053363800048828125, 0.05662345886230469, 0.05988311767578125, 0.06314277648925781, 0.06640243530273438, 0.06966209411621094, 0.0729217529296875, 0.07618141174316406, 0.07944107055664062, 0.08270072937011719, 0.08596038818359375, 0.08922004699707031, 0.09247970581054688, 0.09573936462402344, 0.0989990234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 6.0, 9.0, 14.0, 19.0, 16.0, 19.0, 36.0, 39.0, 54.0, 75.0, 65.0, 89.0, 114.0, 95.0, 77.0, 46.0, 51.0, 32.0, 27.0, 27.0, 8.0, 6.0, 7.0, 12.0, 11.0, 8.0, 2.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.046627044677734e-06, -7.759779691696167e-06, -7.4729323387146e-06, -7.186084985733032e-06, -6.899237632751465e-06, -6.6123902797698975e-06, -6.32554292678833e-06, -6.038695573806763e-06, -5.751848220825195e-06, -5.465000867843628e-06, -5.1781535148620605e-06, -4.891306161880493e-06, -4.604458808898926e-06, -4.317611455917358e-06, -4.030764102935791e-06, -3.7439167499542236e-06, -3.4570693969726562e-06, -3.170222043991089e-06, -2.8833746910095215e-06, -2.596527338027954e-06, -2.3096799850463867e-06, -2.0228326320648193e-06, -1.735985279083252e-06, -1.4491379261016846e-06, -1.1622905731201172e-06, -8.754432201385498e-07, -5.885958671569824e-07, -3.0174851417541504e-07, -1.4901161193847656e-08, 2.7194619178771973e-07, 5.587935447692871e-07, 8.456408977508545e-07, 1.1324882507324219e-06, 1.4193356037139893e-06, 1.7061829566955566e-06, 1.993030309677124e-06, 2.2798776626586914e-06, 2.566725015640259e-06, 2.853572368621826e-06, 3.1404197216033936e-06, 3.427267074584961e-06, 3.7141144275665283e-06, 4.000961780548096e-06, 4.287809133529663e-06, 4.5746564865112305e-06, 4.861503839492798e-06, 5.148351192474365e-06, 5.435198545455933e-06, 5.7220458984375e-06, 6.008893251419067e-06, 6.295740604400635e-06, 6.582587957382202e-06, 6.8694353103637695e-06, 7.156282663345337e-06, 7.443130016326904e-06, 7.729977369308472e-06, 8.016824722290039e-06, 8.303672075271606e-06, 8.590519428253174e-06, 8.877366781234741e-06, 9.164214134216309e-06, 9.451061487197876e-06, 9.737908840179443e-06, 1.002475619316101e-05, 1.0311603546142578e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 15.0, 14.0, 26.0, 34.0, 46.0, 66.0, 98.0, 139.0, 214.0, 320.0, 483.0, 762.0, 1261.0, 2163.0, 3771.0, 6982.0, 13392.0, 27614.0, 63152.0, 178512.0, 470400.0, 164821.0, 59399.0, 26208.0, 12893.0, 6597.0, 3597.0, 2110.0, 1306.0, 733.0, 435.0, 298.0, 223.0, 161.0, 79.0, 72.0, 51.0, 23.0, 13.0, 16.0, 11.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.12103271484375, -0.11730480194091797, -0.11357688903808594, -0.1098489761352539, -0.10612106323242188, -0.10239315032958984, -0.09866523742675781, -0.09493732452392578, -0.09120941162109375, -0.08748149871826172, -0.08375358581542969, -0.08002567291259766, -0.07629776000976562, -0.0725698471069336, -0.06884193420410156, -0.06511402130126953, -0.0613861083984375, -0.05765819549560547, -0.05393028259277344, -0.050202369689941406, -0.046474456787109375, -0.042746543884277344, -0.03901863098144531, -0.03529071807861328, -0.03156280517578125, -0.02783489227294922, -0.024106979370117188, -0.020379066467285156, -0.016651153564453125, -0.012923240661621094, -0.009195327758789062, -0.005467414855957031, -0.001739501953125, 0.0019884109497070312, 0.0057163238525390625, 0.009444236755371094, 0.013172149658203125, 0.016900062561035156, 0.020627975463867188, 0.02435588836669922, 0.02808380126953125, 0.03181171417236328, 0.03553962707519531, 0.039267539978027344, 0.042995452880859375, 0.046723365783691406, 0.05045127868652344, 0.05417919158935547, 0.0579071044921875, 0.06163501739501953, 0.06536293029785156, 0.0690908432006836, 0.07281875610351562, 0.07654666900634766, 0.08027458190917969, 0.08400249481201172, 0.08773040771484375, 0.09145832061767578, 0.09518623352050781, 0.09891414642333984, 0.10264205932617188, 0.1063699722290039, 0.11009788513183594, 0.11382579803466797, 0.1175537109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 5.0, 15.0, 14.0, 19.0, 19.0, 28.0, 39.0, 39.0, 49.0, 60.0, 84.0, 99.0, 75.0, 75.0, 71.0, 54.0, 51.0, 28.0, 36.0, 27.0, 24.0, 10.0, 11.0, 14.0, 8.0, 3.0, 7.0, 3.0, 1.0, 2.0, 7.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0283966064453125, -0.027353525161743164, -0.026310443878173828, -0.025267362594604492, -0.024224281311035156, -0.02318120002746582, -0.022138118743896484, -0.02109503746032715, -0.020051956176757812, -0.019008874893188477, -0.01796579360961914, -0.016922712326049805, -0.01587963104248047, -0.014836549758911133, -0.013793468475341797, -0.012750387191772461, -0.011707305908203125, -0.010664224624633789, -0.009621143341064453, -0.008578062057495117, -0.007534980773925781, -0.006491899490356445, -0.005448818206787109, -0.0044057369232177734, -0.0033626556396484375, -0.0023195743560791016, -0.0012764930725097656, -0.0002334117889404297, 0.0008096694946289062, 0.0018527507781982422, 0.002895832061767578, 0.003938913345336914, 0.00498199462890625, 0.006025075912475586, 0.007068157196044922, 0.008111238479614258, 0.009154319763183594, 0.01019740104675293, 0.011240482330322266, 0.012283563613891602, 0.013326644897460938, 0.014369726181030273, 0.01541280746459961, 0.016455888748168945, 0.01749897003173828, 0.018542051315307617, 0.019585132598876953, 0.02062821388244629, 0.021671295166015625, 0.02271437644958496, 0.023757457733154297, 0.024800539016723633, 0.02584362030029297, 0.026886701583862305, 0.02792978286743164, 0.028972864151000977, 0.030015945434570312, 0.03105902671813965, 0.032102108001708984, 0.03314518928527832, 0.034188270568847656, 0.03523135185241699, 0.03627443313598633, 0.037317514419555664, 0.038360595703125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 5.0, 6.0, 24.0, 26.0, 23.0, 37.0, 48.0, 63.0, 83.0, 104.0, 119.0, 105.0, 73.0, 57.0, 42.0, 39.0, 25.0, 13.0, 19.0, 24.0, 12.0, 7.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.78768253326416, -2.7016685009002686, -2.615654706954956, -2.5296406745910645, -2.443626642227173, -2.3576126098632812, -2.2715988159179688, -2.185584783554077, -2.0995707511901855, -2.013556718826294, -1.927542805671692, -1.8415288925170898, -1.7555148601531982, -1.6695009469985962, -1.5834870338439941, -1.4974730014801025, -1.4114590883255005, -1.3254451751708984, -1.2394311428070068, -1.1534172296524048, -1.0674031972885132, -0.9813892841339111, -0.8953753113746643, -0.8093613386154175, -0.7233473658561707, -0.6373333930969238, -0.551319420337677, -0.46530547738075256, -0.37929150462150574, -0.2932775318622589, -0.20726358890533447, -0.12124961614608765, -0.03523564338684082, 0.05077832192182541, 0.13679228723049164, 0.22280624508857727, 0.3088202178478241, 0.3948341906070709, 0.48084813356399536, 0.5668621063232422, 0.652876079082489, 0.7388900518417358, 0.8249040246009827, 0.9109179973602295, 0.9969319105148315, 1.0829459428787231, 1.1689598560333252, 1.2549738883972168, 1.3409878015518188, 1.427001714706421, 1.5130157470703125, 1.5990296602249146, 1.6850436925888062, 1.7710576057434082, 1.8570716381072998, 1.9430855512619019, 2.029099464416504, 2.1151134967803955, 2.201127290725708, 2.2871413230895996, 2.373155355453491, 2.459169387817383, 2.5451831817626953, 2.631197214126587, 2.7172112464904785]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 5.0, 4.0, 7.0, 16.0, 6.0, 15.0, 27.0, 20.0, 24.0, 28.0, 36.0, 32.0, 36.0, 40.0, 34.0, 39.0, 32.0, 38.0, 42.0, 48.0, 42.0, 36.0, 43.0, 53.0, 36.0, 44.0, 27.0, 32.0, 22.0, 23.0, 16.0, 13.0, 9.0, 17.0, 4.0, 7.0, 8.0, 12.0, 3.0, 7.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7687112092971802, -1.709715723991394, -1.6507203578948975, -1.5917248725891113, -1.5327293872833252, -1.473733901977539, -1.4147385358810425, -1.3557430505752563, -1.2967476844787598, -1.2377521991729736, -1.178756833076477, -1.119761347770691, -1.0607658624649048, -1.0017704963684082, -0.9427750110626221, -0.8837795257568359, -0.8247840404510498, -0.7657886147499084, -0.7067931294441223, -0.647797703742981, -0.5888022184371948, -0.5298067927360535, -0.4708113670349121, -0.41181591153144836, -0.3528204560279846, -0.2938250005245209, -0.23482955992221832, -0.17583411931991577, -0.11683866381645203, -0.05784320831298828, 0.0011522173881530762, 0.06014767289161682, 0.11914300918579102, 0.17813846468925476, 0.2371339052915573, 0.29612934589385986, 0.3551248013973236, 0.41412025690078735, 0.4731156826019287, 0.5321111679077148, 0.5911065936088562, 0.6501020193099976, 0.7090975046157837, 0.768092930316925, 0.8270883560180664, 0.8860838413238525, 0.9450792670249939, 1.0040746927261353, 1.0630701780319214, 1.1220656633377075, 1.181061029434204, 1.2400565147399902, 1.2990520000457764, 1.3580474853515625, 1.417042851448059, 1.4760383367538452, 1.5350337028503418, 1.594029188156128, 1.6530245542526245, 1.7120200395584106, 1.7710155248641968, 1.8300108909606934, 1.8890063762664795, 1.9480018615722656, 2.0069973468780518]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 9.0, 16.0, 18.0, 20.0, 38.0, 43.0, 59.0, 110.0, 138.0, 214.0, 267.0, 371.0, 595.0, 860.0, 1357.0, 2063.0, 3170.0, 5017.0, 7708.0, 12598.0, 21108.0, 36260.0, 66128.0, 128013.0, 246440.0, 239921.0, 123375.0, 63437.0, 35220.0, 20526.0, 12052.0, 7384.0, 4787.0, 3113.0, 1935.0, 1354.0, 927.0, 591.0, 417.0, 277.0, 181.0, 143.0, 95.0, 55.0, 52.0, 26.0, 34.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-3.140625, -3.042388916015625, -2.94415283203125, -2.845916748046875, -2.7476806640625, -2.649444580078125, -2.55120849609375, -2.452972412109375, -2.354736328125, -2.256500244140625, -2.15826416015625, -2.060028076171875, -1.9617919921875, -1.863555908203125, -1.76531982421875, -1.667083740234375, -1.56884765625, -1.470611572265625, -1.37237548828125, -1.274139404296875, -1.1759033203125, -1.077667236328125, -0.97943115234375, -0.881195068359375, -0.782958984375, -0.684722900390625, -0.58648681640625, -0.488250732421875, -0.3900146484375, -0.291778564453125, -0.19354248046875, -0.095306396484375, 0.0029296875, 0.101165771484375, 0.19940185546875, 0.297637939453125, 0.3958740234375, 0.494110107421875, 0.59234619140625, 0.690582275390625, 0.788818359375, 0.887054443359375, 0.98529052734375, 1.083526611328125, 1.1817626953125, 1.279998779296875, 1.37823486328125, 1.476470947265625, 1.57470703125, 1.672943115234375, 1.77117919921875, 1.869415283203125, 1.9676513671875, 2.065887451171875, 2.16412353515625, 2.262359619140625, 2.360595703125, 2.458831787109375, 2.55706787109375, 2.655303955078125, 2.7535400390625, 2.851776123046875, 2.95001220703125, 3.048248291015625, 3.146484375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 2.0, 5.0, 4.0, 9.0, 6.0, 10.0, 10.0, 19.0, 23.0, 23.0, 22.0, 32.0, 28.0, 23.0, 25.0, 36.0, 45.0, 35.0, 26.0, 38.0, 33.0, 50.0, 44.0, 44.0, 39.0, 48.0, 34.0, 45.0, 29.0, 29.0, 22.0, 30.0, 20.0, 21.0, 18.0, 6.0, 9.0, 8.0, 10.0, 8.0, 5.0, 10.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.7724609375, -1.722747802734375, -1.67303466796875, -1.623321533203125, -1.5736083984375, -1.523895263671875, -1.47418212890625, -1.424468994140625, -1.374755859375, -1.325042724609375, -1.27532958984375, -1.225616455078125, -1.1759033203125, -1.126190185546875, -1.07647705078125, -1.026763916015625, -0.97705078125, -0.927337646484375, -0.87762451171875, -0.827911376953125, -0.7781982421875, -0.728485107421875, -0.67877197265625, -0.629058837890625, -0.579345703125, -0.529632568359375, -0.47991943359375, -0.430206298828125, -0.3804931640625, -0.330780029296875, -0.28106689453125, -0.231353759765625, -0.181640625, -0.131927490234375, -0.08221435546875, -0.032501220703125, 0.0172119140625, 0.066925048828125, 0.11663818359375, 0.166351318359375, 0.216064453125, 0.265777587890625, 0.31549072265625, 0.365203857421875, 0.4149169921875, 0.464630126953125, 0.51434326171875, 0.564056396484375, 0.61376953125, 0.663482666015625, 0.71319580078125, 0.762908935546875, 0.8126220703125, 0.862335205078125, 0.91204833984375, 0.961761474609375, 1.011474609375, 1.061187744140625, 1.11090087890625, 1.160614013671875, 1.2103271484375, 1.260040283203125, 1.30975341796875, 1.359466552734375, 1.4091796875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 8.0, 5.0, 7.0, 13.0, 21.0, 29.0, 30.0, 59.0, 71.0, 118.0, 165.0, 250.0, 378.0, 551.0, 786.0, 1218.0, 1749.0, 2648.0, 4243.0, 6453.0, 10246.0, 17040.0, 28866.0, 49825.0, 90176.0, 171821.0, 265435.0, 176639.0, 92412.0, 50960.0, 29352.0, 17333.0, 10557.0, 6626.0, 4199.0, 2783.0, 1774.0, 1176.0, 828.0, 534.0, 375.0, 247.0, 176.0, 127.0, 88.0, 54.0, 32.0, 33.0, 19.0, 12.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.87109375, -2.782806396484375, -2.69451904296875, -2.606231689453125, -2.5179443359375, -2.429656982421875, -2.34136962890625, -2.253082275390625, -2.164794921875, -2.076507568359375, -1.98822021484375, -1.899932861328125, -1.8116455078125, -1.723358154296875, -1.63507080078125, -1.546783447265625, -1.45849609375, -1.370208740234375, -1.28192138671875, -1.193634033203125, -1.1053466796875, -1.017059326171875, -0.92877197265625, -0.840484619140625, -0.752197265625, -0.663909912109375, -0.57562255859375, -0.487335205078125, -0.3990478515625, -0.310760498046875, -0.22247314453125, -0.134185791015625, -0.0458984375, 0.042388916015625, 0.13067626953125, 0.218963623046875, 0.3072509765625, 0.395538330078125, 0.48382568359375, 0.572113037109375, 0.660400390625, 0.748687744140625, 0.83697509765625, 0.925262451171875, 1.0135498046875, 1.101837158203125, 1.19012451171875, 1.278411865234375, 1.36669921875, 1.454986572265625, 1.54327392578125, 1.631561279296875, 1.7198486328125, 1.808135986328125, 1.89642333984375, 1.984710693359375, 2.072998046875, 2.161285400390625, 2.24957275390625, 2.337860107421875, 2.4261474609375, 2.514434814453125, 2.60272216796875, 2.691009521484375, 2.779296875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 6.0, 13.0, 9.0, 13.0, 11.0, 20.0, 19.0, 19.0, 15.0, 28.0, 27.0, 14.0, 34.0, 29.0, 32.0, 33.0, 41.0, 40.0, 36.0, 33.0, 39.0, 38.0, 41.0, 41.0, 37.0, 28.0, 32.0, 30.0, 39.0, 20.0, 30.0, 21.0, 25.0, 12.0, 17.0, 6.0, 8.0, 15.0, 3.0, 8.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.96630859375, -0.936279296875, -0.90625, -0.876220703125, -0.84619140625, -0.816162109375, -0.7861328125, -0.756103515625, -0.72607421875, -0.696044921875, -0.666015625, -0.635986328125, -0.60595703125, -0.575927734375, -0.5458984375, -0.515869140625, -0.48583984375, -0.455810546875, -0.42578125, -0.395751953125, -0.36572265625, -0.335693359375, -0.3056640625, -0.275634765625, -0.24560546875, -0.215576171875, -0.185546875, -0.155517578125, -0.12548828125, -0.095458984375, -0.0654296875, -0.035400390625, -0.00537109375, 0.024658203125, 0.0546875, 0.084716796875, 0.11474609375, 0.144775390625, 0.1748046875, 0.204833984375, 0.23486328125, 0.264892578125, 0.294921875, 0.324951171875, 0.35498046875, 0.385009765625, 0.4150390625, 0.445068359375, 0.47509765625, 0.505126953125, 0.53515625, 0.565185546875, 0.59521484375, 0.625244140625, 0.6552734375, 0.685302734375, 0.71533203125, 0.745361328125, 0.775390625, 0.805419921875, 0.83544921875, 0.865478515625, 0.8955078125, 0.925537109375, 0.95556640625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 7.0, 14.0, 10.0, 15.0, 27.0, 43.0, 37.0, 71.0, 111.0, 126.0, 207.0, 314.0, 456.0, 719.0, 1111.0, 1728.0, 2849.0, 5066.0, 9421.0, 20218.0, 47957.0, 621266.0, 250689.0, 45259.0, 19261.0, 9171.0, 4812.0, 2749.0, 1680.0, 1058.0, 676.0, 445.0, 308.0, 201.0, 138.0, 95.0, 71.0, 49.0, 37.0, 19.0, 17.0, 21.0, 7.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.353515625, -3.251800537109375, -3.15008544921875, -3.048370361328125, -2.9466552734375, -2.844940185546875, -2.74322509765625, -2.641510009765625, -2.539794921875, -2.438079833984375, -2.33636474609375, -2.234649658203125, -2.1329345703125, -2.031219482421875, -1.92950439453125, -1.827789306640625, -1.72607421875, -1.624359130859375, -1.52264404296875, -1.420928955078125, -1.3192138671875, -1.217498779296875, -1.11578369140625, -1.014068603515625, -0.912353515625, -0.810638427734375, -0.70892333984375, -0.607208251953125, -0.5054931640625, -0.403778076171875, -0.30206298828125, -0.200347900390625, -0.0986328125, 0.003082275390625, 0.10479736328125, 0.206512451171875, 0.3082275390625, 0.409942626953125, 0.51165771484375, 0.613372802734375, 0.715087890625, 0.816802978515625, 0.91851806640625, 1.020233154296875, 1.1219482421875, 1.223663330078125, 1.32537841796875, 1.427093505859375, 1.52880859375, 1.630523681640625, 1.73223876953125, 1.833953857421875, 1.9356689453125, 2.037384033203125, 2.13909912109375, 2.240814208984375, 2.342529296875, 2.444244384765625, 2.54595947265625, 2.647674560546875, 2.7493896484375, 2.851104736328125, 2.95281982421875, 3.054534912109375, 3.15625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 13.0, 18.0, 31.0, 35.0, 65.0, 185.0, 394.0, 97.0, 49.0, 28.0, 16.0, 19.0, 14.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001544952392578125, -0.00015091896057128906, -0.00014734268188476562, -0.0001437664031982422, -0.00014019012451171875, -0.0001366138458251953, -0.00013303756713867188, -0.00012946128845214844, -0.000125885009765625, -0.00012230873107910156, -0.00011873245239257812, -0.00011515617370605469, -0.00011157989501953125, -0.00010800361633300781, -0.00010442733764648438, -0.00010085105895996094, -9.72747802734375e-05, -9.369850158691406e-05, -9.012222290039062e-05, -8.654594421386719e-05, -8.296966552734375e-05, -7.939338684082031e-05, -7.581710815429688e-05, -7.224082946777344e-05, -6.866455078125e-05, -6.508827209472656e-05, -6.151199340820312e-05, -5.793571472167969e-05, -5.435943603515625e-05, -5.078315734863281e-05, -4.7206878662109375e-05, -4.363059997558594e-05, -4.00543212890625e-05, -3.647804260253906e-05, -3.2901763916015625e-05, -2.9325485229492188e-05, -2.574920654296875e-05, -2.2172927856445312e-05, -1.8596649169921875e-05, -1.5020370483398438e-05, -1.1444091796875e-05, -7.867813110351562e-06, -4.291534423828125e-06, -7.152557373046875e-07, 2.86102294921875e-06, 6.4373016357421875e-06, 1.0013580322265625e-05, 1.3589859008789062e-05, 1.71661376953125e-05, 2.0742416381835938e-05, 2.4318695068359375e-05, 2.7894973754882812e-05, 3.147125244140625e-05, 3.504753112792969e-05, 3.8623809814453125e-05, 4.220008850097656e-05, 4.57763671875e-05, 4.935264587402344e-05, 5.2928924560546875e-05, 5.650520324707031e-05, 6.008148193359375e-05, 6.365776062011719e-05, 6.723403930664062e-05, 7.081031799316406e-05, 7.43865966796875e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 14.0, 16.0, 24.0, 38.0, 53.0, 65.0, 93.0, 148.0, 183.0, 323.0, 464.0, 719.0, 1106.0, 1788.0, 2785.0, 4862.0, 8642.0, 15706.0, 33023.0, 94103.0, 755684.0, 68609.0, 27330.0, 13703.0, 7661.0, 4327.0, 2559.0, 1623.0, 976.0, 636.0, 414.0, 284.0, 192.0, 129.0, 96.0, 58.0, 36.0, 22.0, 19.0, 14.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.43756103515625, -2.3516845703125, -2.26580810546875, -2.179931640625, -2.09405517578125, -2.0081787109375, -1.92230224609375, -1.83642578125, -1.75054931640625, -1.6646728515625, -1.57879638671875, -1.492919921875, -1.40704345703125, -1.3211669921875, -1.23529052734375, -1.1494140625, -1.06353759765625, -0.9776611328125, -0.89178466796875, -0.805908203125, -0.72003173828125, -0.6341552734375, -0.54827880859375, -0.46240234375, -0.37652587890625, -0.2906494140625, -0.20477294921875, -0.118896484375, -0.03302001953125, 0.0528564453125, 0.13873291015625, 0.224609375, 0.31048583984375, 0.3963623046875, 0.48223876953125, 0.568115234375, 0.65399169921875, 0.7398681640625, 0.82574462890625, 0.91162109375, 0.99749755859375, 1.0833740234375, 1.16925048828125, 1.255126953125, 1.34100341796875, 1.4268798828125, 1.51275634765625, 1.5986328125, 1.68450927734375, 1.7703857421875, 1.85626220703125, 1.942138671875, 2.02801513671875, 2.1138916015625, 2.19976806640625, 2.28564453125, 2.37152099609375, 2.4573974609375, 2.54327392578125, 2.629150390625, 2.71502685546875, 2.8009033203125, 2.88677978515625, 2.97265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 10.0, 6.0, 9.0, 6.0, 9.0, 13.0, 22.0, 20.0, 14.0, 17.0, 24.0, 46.0, 437.0, 121.0, 38.0, 26.0, 28.0, 23.0, 18.0, 12.0, 12.0, 11.0, 5.0, 11.0, 9.0, 11.0, 5.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.491912841796875, -0.47210693359375, -0.452301025390625, -0.4324951171875, -0.412689208984375, -0.39288330078125, -0.373077392578125, -0.353271484375, -0.333465576171875, -0.31365966796875, -0.293853759765625, -0.2740478515625, -0.254241943359375, -0.23443603515625, -0.214630126953125, -0.19482421875, -0.175018310546875, -0.15521240234375, -0.135406494140625, -0.1156005859375, -0.095794677734375, -0.07598876953125, -0.056182861328125, -0.036376953125, -0.016571044921875, 0.00323486328125, 0.023040771484375, 0.0428466796875, 0.062652587890625, 0.08245849609375, 0.102264404296875, 0.1220703125, 0.141876220703125, 0.16168212890625, 0.181488037109375, 0.2012939453125, 0.221099853515625, 0.24090576171875, 0.260711669921875, 0.280517578125, 0.300323486328125, 0.32012939453125, 0.339935302734375, 0.3597412109375, 0.379547119140625, 0.39935302734375, 0.419158935546875, 0.43896484375, 0.458770751953125, 0.47857666015625, 0.498382568359375, 0.5181884765625, 0.537994384765625, 0.55780029296875, 0.577606201171875, 0.597412109375, 0.617218017578125, 0.63702392578125, 0.656829833984375, 0.6766357421875, 0.696441650390625, 0.71624755859375, 0.736053466796875, 0.755859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 11.0, 10.0, 22.0, 26.0, 38.0, 52.0, 50.0, 111.0, 115.0, 133.0, 89.0, 70.0, 64.0, 52.0, 26.0, 26.0, 14.0, 23.0, 18.0, 6.0, 7.0, 11.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.905309796333313, -1.818785309791565, -1.732260823249817, -1.6457363367080688, -1.5592118501663208, -1.4726873636245728, -1.3861628770828247, -1.2996383905410767, -1.2131139039993286, -1.1265894174575806, -1.0400649309158325, -0.9535404443740845, -0.8670159578323364, -0.7804914712905884, -0.6939669847488403, -0.6074424982070923, -0.5209180116653442, -0.4343935251235962, -0.34786903858184814, -0.2613445520401001, -0.17482006549835205, -0.088295578956604, -0.001771092414855957, 0.08475339412689209, 0.17127788066864014, 0.2578023672103882, 0.34432685375213623, 0.4308513402938843, 0.5173758268356323, 0.6039003133773804, 0.6904247999191284, 0.7769492864608765, 0.8634738922119141, 0.9499983787536621, 1.0365228652954102, 1.1230473518371582, 1.2095718383789062, 1.2960963249206543, 1.3826208114624023, 1.4691452980041504, 1.5556697845458984, 1.6421942710876465, 1.7287187576293945, 1.8152432441711426, 1.9017677307128906, 1.9882922172546387, 2.0748167037963867, 2.1613411903381348, 2.247865676879883, 2.334390163421631, 2.420914649963379, 2.507439136505127, 2.593963623046875, 2.680488109588623, 2.767012596130371, 2.853537082672119, 2.940061569213867, 3.0265860557556152, 3.1131105422973633, 3.1996350288391113, 3.2861595153808594, 3.3726840019226074, 3.4592084884643555, 3.5457329750061035, 3.6322574615478516]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 8.0, 11.0, 2.0, 14.0, 10.0, 31.0, 27.0, 18.0, 22.0, 23.0, 31.0, 34.0, 33.0, 28.0, 29.0, 34.0, 34.0, 30.0, 39.0, 51.0, 33.0, 37.0, 42.0, 42.0, 33.0, 30.0, 36.0, 25.0, 24.0, 24.0, 27.0, 17.0, 15.0, 11.0, 8.0, 15.0, 17.0, 9.0, 6.0, 4.0, 7.0, 1.0, 2.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.5757516622543335, -1.5257141590118408, -1.4756765365600586, -1.4256389141082764, -1.3756014108657837, -1.325563907623291, -1.2755262851715088, -1.2254886627197266, -1.1754511594772339, -1.1254136562347412, -1.075376033782959, -1.0253384113311768, -0.9753009080886841, -0.9252633452415466, -0.8752257823944092, -0.8251882195472717, -0.7751506567001343, -0.7251130938529968, -0.6750755310058594, -0.6250379681587219, -0.5750004053115845, -0.524962842464447, -0.47492527961730957, -0.4248877167701721, -0.37485015392303467, -0.3248125910758972, -0.27477502822875977, -0.22473746538162231, -0.17469990253448486, -0.12466233968734741, -0.07462477684020996, -0.02458721399307251, 0.02545022964477539, 0.07548779249191284, 0.1255253553390503, 0.17556291818618774, 0.2256004810333252, 0.27563804388046265, 0.3256756067276001, 0.37571316957473755, 0.425750732421875, 0.47578829526901245, 0.5258258581161499, 0.5758634209632874, 0.6259009838104248, 0.6759385466575623, 0.7259761095046997, 0.7760136723518372, 0.8260512351989746, 0.8760887980461121, 0.9261263608932495, 0.976163923740387, 1.0262014865875244, 1.0762391090393066, 1.1262766122817993, 1.176314115524292, 1.2263517379760742, 1.2763893604278564, 1.3264268636703491, 1.3764643669128418, 1.426501989364624, 1.4765396118164062, 1.526577115058899, 1.5766146183013916, 1.6266522407531738]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 14.0, 19.0, 29.0, 37.0, 59.0, 72.0, 125.0, 175.0, 270.0, 448.0, 776.0, 1192.0, 1815.0, 2944.0, 4839.0, 8094.0, 13110.0, 22725.0, 39888.0, 75995.0, 164622.0, 490155.0, 1800223.0, 1054751.0, 268904.0, 111995.0, 55096.0, 29942.0, 17305.0, 10389.0, 6390.0, 4048.0, 2603.0, 1775.0, 1130.0, 744.0, 522.0, 344.0, 258.0, 144.0, 108.0, 69.0, 45.0, 26.0, 19.0, 13.0, 12.0, 6.0, 7.0, 2.0, 3.0, 2.0], "bins": [-2.759765625, -2.68035888671875, -2.6009521484375, -2.52154541015625, -2.442138671875, -2.36273193359375, -2.2833251953125, -2.20391845703125, -2.12451171875, -2.04510498046875, -1.9656982421875, -1.88629150390625, -1.806884765625, -1.72747802734375, -1.6480712890625, -1.56866455078125, -1.4892578125, -1.40985107421875, -1.3304443359375, -1.25103759765625, -1.171630859375, -1.09222412109375, -1.0128173828125, -0.93341064453125, -0.85400390625, -0.77459716796875, -0.6951904296875, -0.61578369140625, -0.536376953125, -0.45697021484375, -0.3775634765625, -0.29815673828125, -0.21875, -0.13934326171875, -0.0599365234375, 0.01947021484375, 0.098876953125, 0.17828369140625, 0.2576904296875, 0.33709716796875, 0.41650390625, 0.49591064453125, 0.5753173828125, 0.65472412109375, 0.734130859375, 0.81353759765625, 0.8929443359375, 0.97235107421875, 1.0517578125, 1.13116455078125, 1.2105712890625, 1.28997802734375, 1.369384765625, 1.44879150390625, 1.5281982421875, 1.60760498046875, 1.68701171875, 1.76641845703125, 1.8458251953125, 1.92523193359375, 2.004638671875, 2.08404541015625, 2.1634521484375, 2.24285888671875, 2.322265625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 2.0, 3.0, 7.0, 4.0, 14.0, 11.0, 19.0, 22.0, 15.0, 21.0, 25.0, 28.0, 35.0, 26.0, 40.0, 32.0, 45.0, 27.0, 38.0, 51.0, 33.0, 39.0, 39.0, 48.0, 26.0, 55.0, 38.0, 29.0, 23.0, 35.0, 23.0, 26.0, 17.0, 12.0, 11.0, 12.0, 11.0, 13.0, 11.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.091796875, -1.0585174560546875, -1.025238037109375, -0.9919586181640625, -0.95867919921875, -0.9253997802734375, -0.892120361328125, -0.8588409423828125, -0.8255615234375, -0.7922821044921875, -0.759002685546875, -0.7257232666015625, -0.69244384765625, -0.6591644287109375, -0.625885009765625, -0.5926055908203125, -0.559326171875, -0.5260467529296875, -0.492767333984375, -0.4594879150390625, -0.42620849609375, -0.3929290771484375, -0.359649658203125, -0.3263702392578125, -0.2930908203125, -0.2598114013671875, -0.226531982421875, -0.1932525634765625, -0.15997314453125, -0.1266937255859375, -0.093414306640625, -0.0601348876953125, -0.02685546875, 0.0064239501953125, 0.039703369140625, 0.0729827880859375, 0.10626220703125, 0.1395416259765625, 0.172821044921875, 0.2061004638671875, 0.2393798828125, 0.2726593017578125, 0.305938720703125, 0.3392181396484375, 0.37249755859375, 0.4057769775390625, 0.439056396484375, 0.4723358154296875, 0.505615234375, 0.5388946533203125, 0.572174072265625, 0.6054534912109375, 0.63873291015625, 0.6720123291015625, 0.705291748046875, 0.7385711669921875, 0.7718505859375, 0.8051300048828125, 0.838409423828125, 0.8716888427734375, 0.90496826171875, 0.9382476806640625, 0.971527099609375, 1.0048065185546875, 1.0380859375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 13.0, 15.0, 23.0, 35.0, 51.0, 67.0, 114.0, 164.0, 241.0, 394.0, 610.0, 847.0, 1461.0, 2148.0, 3515.0, 5823.0, 9683.0, 16854.0, 30375.0, 56722.0, 114065.0, 252700.0, 665728.0, 1692291.0, 785991.0, 286415.0, 126946.0, 62561.0, 32930.0, 18250.0, 10693.0, 6239.0, 3767.0, 2301.0, 1514.0, 911.0, 618.0, 437.0, 250.0, 178.0, 116.0, 81.0, 49.0, 26.0, 26.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9970703125, -1.9317474365234375, -1.866424560546875, -1.8011016845703125, -1.73577880859375, -1.6704559326171875, -1.605133056640625, -1.5398101806640625, -1.4744873046875, -1.4091644287109375, -1.343841552734375, -1.2785186767578125, -1.21319580078125, -1.1478729248046875, -1.082550048828125, -1.0172271728515625, -0.951904296875, -0.8865814208984375, -0.821258544921875, -0.7559356689453125, -0.69061279296875, -0.6252899169921875, -0.559967041015625, -0.4946441650390625, -0.4293212890625, -0.3639984130859375, -0.298675537109375, -0.2333526611328125, -0.16802978515625, -0.1027069091796875, -0.037384033203125, 0.0279388427734375, 0.09326171875, 0.1585845947265625, 0.223907470703125, 0.2892303466796875, 0.35455322265625, 0.4198760986328125, 0.485198974609375, 0.5505218505859375, 0.6158447265625, 0.6811676025390625, 0.746490478515625, 0.8118133544921875, 0.87713623046875, 0.9424591064453125, 1.007781982421875, 1.0731048583984375, 1.138427734375, 1.2037506103515625, 1.269073486328125, 1.3343963623046875, 1.39971923828125, 1.4650421142578125, 1.530364990234375, 1.5956878662109375, 1.6610107421875, 1.7263336181640625, 1.791656494140625, 1.8569793701171875, 1.92230224609375, 1.9876251220703125, 2.052947998046875, 2.1182708740234375, 2.18359375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 9.0, 3.0, 8.0, 11.0, 9.0, 12.0, 19.0, 21.0, 23.0, 36.0, 59.0, 68.0, 103.0, 97.0, 136.0, 159.0, 165.0, 192.0, 271.0, 285.0, 322.0, 310.0, 293.0, 247.0, 210.0, 187.0, 141.0, 123.0, 105.0, 97.0, 71.0, 57.0, 51.0, 35.0, 33.0, 16.0, 19.0, 15.0, 16.0, 8.0, 9.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5595703125, -0.5405120849609375, -0.521453857421875, -0.5023956298828125, -0.48333740234375, -0.4642791748046875, -0.445220947265625, -0.4261627197265625, -0.4071044921875, -0.3880462646484375, -0.368988037109375, -0.3499298095703125, -0.33087158203125, -0.3118133544921875, -0.292755126953125, -0.2736968994140625, -0.254638671875, -0.2355804443359375, -0.216522216796875, -0.1974639892578125, -0.17840576171875, -0.1593475341796875, -0.140289306640625, -0.1212310791015625, -0.1021728515625, -0.0831146240234375, -0.064056396484375, -0.0449981689453125, -0.02593994140625, -0.0068817138671875, 0.012176513671875, 0.0312347412109375, 0.05029296875, 0.0693511962890625, 0.088409423828125, 0.1074676513671875, 0.12652587890625, 0.1455841064453125, 0.164642333984375, 0.1837005615234375, 0.2027587890625, 0.2218170166015625, 0.240875244140625, 0.2599334716796875, 0.27899169921875, 0.2980499267578125, 0.317108154296875, 0.3361663818359375, 0.355224609375, 0.3742828369140625, 0.393341064453125, 0.4123992919921875, 0.43145751953125, 0.4505157470703125, 0.469573974609375, 0.4886322021484375, 0.5076904296875, 0.5267486572265625, 0.545806884765625, 0.5648651123046875, 0.58392333984375, 0.6029815673828125, 0.622039794921875, 0.6410980224609375, 0.66015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 5.0, 12.0, 21.0, 13.0, 20.0, 22.0, 31.0, 35.0, 41.0, 41.0, 45.0, 67.0, 71.0, 101.0, 77.0, 60.0, 51.0, 52.0, 34.0, 34.0, 21.0, 13.0, 20.0, 13.0, 12.0, 8.0, 14.0, 3.0, 11.0, 6.0, 5.0, 7.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2871257066726685, -1.244937539100647, -1.202749490737915, -1.1605613231658936, -1.1183732748031616, -1.0761851072311401, -1.0339970588684082, -0.9918088912963867, -0.94962078332901, -0.9074326753616333, -0.8652445673942566, -0.8230564594268799, -0.7808682918548584, -0.7386802434921265, -0.696492075920105, -0.6543039679527283, -0.6121158599853516, -0.5699277520179749, -0.5277396440505981, -0.48555150628089905, -0.44336339831352234, -0.40117529034614563, -0.35898715257644653, -0.3167990446090698, -0.2746109366416931, -0.2324228286743164, -0.1902347058057785, -0.1480465829372406, -0.10585847496986389, -0.06367036700248718, -0.021482229232788086, 0.020705878734588623, 0.06289398670196533, 0.10508210211992264, 0.14727021753787994, 0.18945834040641785, 0.23164644837379456, 0.27383455634117126, 0.31602269411087036, 0.35821080207824707, 0.4003989100456238, 0.4425870180130005, 0.4847751259803772, 0.5269632339477539, 0.5691514015197754, 0.6113394498825073, 0.6535276174545288, 0.6957157254219055, 0.7379038333892822, 0.7800919413566589, 0.8222800493240356, 0.8644682168960571, 0.9066562652587891, 0.9488444328308105, 0.9910325407981873, 1.033220648765564, 1.075408697128296, 1.1175968647003174, 1.1597849130630493, 1.2019730806350708, 1.2441611289978027, 1.2863492965698242, 1.3285374641418457, 1.3707255125045776, 1.4129136800765991]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 1.0, 7.0, 10.0, 13.0, 15.0, 26.0, 20.0, 21.0, 29.0, 27.0, 32.0, 32.0, 31.0, 38.0, 22.0, 40.0, 42.0, 38.0, 40.0, 38.0, 43.0, 45.0, 40.0, 41.0, 39.0, 46.0, 19.0, 24.0, 14.0, 30.0, 20.0, 18.0, 22.0, 12.0, 11.0, 12.0, 15.0, 5.0, 6.0, 1.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2873976230621338, -1.2483890056610107, -1.2093803882598877, -1.1703717708587646, -1.1313631534576416, -1.0923545360565186, -1.0533459186553955, -1.014337420463562, -0.975328803062439, -0.9363201856613159, -0.8973115682601929, -0.8583029508590698, -0.8192943930625916, -0.7802857756614685, -0.7412771582603455, -0.7022686004638672, -0.6632599234580994, -0.6242513060569763, -0.5852426886558533, -0.546234130859375, -0.507225513458252, -0.4682168960571289, -0.42920827865600586, -0.3901996910572052, -0.35119107365608215, -0.3121824562549591, -0.27317386865615845, -0.2341652512550354, -0.19515664875507355, -0.1561480462551117, -0.11713942885398865, -0.07813084125518799, -0.03912222385406494, -0.00011361762881278992, 0.03889498859643936, 0.07790359854698181, 0.11691220104694366, 0.15592080354690552, 0.19492942094802856, 0.23393800854682922, 0.27294662594795227, 0.3119552433490753, 0.350963830947876, 0.389972448348999, 0.42898106575012207, 0.46798965334892273, 0.5069983005523682, 0.5460068583488464, 0.5850154757499695, 0.6240240931510925, 0.6630327105522156, 0.7020412683486938, 0.7410498857498169, 0.7800585031509399, 0.819067120552063, 0.858075737953186, 0.8970843553543091, 0.9360929727554321, 0.9751015901565552, 1.0141102075576782, 1.0531188249588013, 1.0921273231506348, 1.1311359405517578, 1.1701445579528809, 1.209153175354004]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 17.0, 26.0, 68.0, 107.0, 165.0, 205.0, 297.0, 561.0, 858.0, 1400.0, 2129.0, 3460.0, 5946.0, 9826.0, 17681.0, 32545.0, 61569.0, 120515.0, 243458.0, 265005.0, 132705.0, 67832.0, 35693.0, 19254.0, 10870.0, 6240.0, 3786.0, 2428.0, 1474.0, 914.0, 586.0, 329.0, 196.0, 155.0, 74.0, 64.0, 36.0, 20.0, 23.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6348419189453125, -0.614410400390625, -0.5939788818359375, -0.57354736328125, -0.5531158447265625, -0.532684326171875, -0.5122528076171875, -0.4918212890625, -0.4713897705078125, -0.450958251953125, -0.4305267333984375, -0.41009521484375, -0.3896636962890625, -0.369232177734375, -0.3488006591796875, -0.328369140625, -0.3079376220703125, -0.287506103515625, -0.2670745849609375, -0.24664306640625, -0.2262115478515625, -0.205780029296875, -0.1853485107421875, -0.1649169921875, -0.1444854736328125, -0.124053955078125, -0.1036224365234375, -0.08319091796875, -0.0627593994140625, -0.042327880859375, -0.0218963623046875, -0.00146484375, 0.0189666748046875, 0.039398193359375, 0.0598297119140625, 0.08026123046875, 0.1006927490234375, 0.121124267578125, 0.1415557861328125, 0.1619873046875, 0.1824188232421875, 0.202850341796875, 0.2232818603515625, 0.24371337890625, 0.2641448974609375, 0.284576416015625, 0.3050079345703125, 0.325439453125, 0.3458709716796875, 0.366302490234375, 0.3867340087890625, 0.40716552734375, 0.4275970458984375, 0.448028564453125, 0.4684600830078125, 0.4888916015625, 0.5093231201171875, 0.529754638671875, 0.5501861572265625, 0.57061767578125, 0.5910491943359375, 0.611480712890625, 0.6319122314453125, 0.65234375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 5.0, 2.0, 11.0, 6.0, 16.0, 15.0, 20.0, 22.0, 24.0, 25.0, 35.0, 32.0, 28.0, 42.0, 33.0, 45.0, 40.0, 35.0, 29.0, 50.0, 42.0, 39.0, 35.0, 46.0, 48.0, 36.0, 33.0, 28.0, 21.0, 16.0, 25.0, 17.0, 18.0, 20.0, 17.0, 6.0, 13.0, 4.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.227264404296875, -1.18695068359375, -1.146636962890625, -1.1063232421875, -1.066009521484375, -1.02569580078125, -0.985382080078125, -0.945068359375, -0.904754638671875, -0.86444091796875, -0.824127197265625, -0.7838134765625, -0.743499755859375, -0.70318603515625, -0.662872314453125, -0.62255859375, -0.582244873046875, -0.54193115234375, -0.501617431640625, -0.4613037109375, -0.420989990234375, -0.38067626953125, -0.340362548828125, -0.300048828125, -0.259735107421875, -0.21942138671875, -0.179107666015625, -0.1387939453125, -0.098480224609375, -0.05816650390625, -0.017852783203125, 0.0224609375, 0.062774658203125, 0.10308837890625, 0.143402099609375, 0.1837158203125, 0.224029541015625, 0.26434326171875, 0.304656982421875, 0.344970703125, 0.385284423828125, 0.42559814453125, 0.465911865234375, 0.5062255859375, 0.546539306640625, 0.58685302734375, 0.627166748046875, 0.66748046875, 0.707794189453125, 0.74810791015625, 0.788421630859375, 0.8287353515625, 0.869049072265625, 0.90936279296875, 0.949676513671875, 0.989990234375, 1.030303955078125, 1.07061767578125, 1.110931396484375, 1.1512451171875, 1.191558837890625, 1.23187255859375, 1.272186279296875, 1.3125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 10.0, 4.0, 11.0, 11.0, 21.0, 31.0, 33.0, 49.0, 69.0, 97.0, 143.0, 289.0, 482.0, 799.0, 1434.0, 2678.0, 5251.0, 10642.0, 27671.0, 101100.0, 592024.0, 226691.0, 47610.0, 16137.0, 7177.0, 3585.0, 1867.0, 1052.0, 590.0, 385.0, 210.0, 138.0, 86.0, 60.0, 35.0, 26.0, 20.0, 11.0, 9.0, 4.0, 8.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.248046875, -1.2060699462890625, -1.164093017578125, -1.1221160888671875, -1.08013916015625, -1.0381622314453125, -0.996185302734375, -0.9542083740234375, -0.9122314453125, -0.8702545166015625, -0.828277587890625, -0.7863006591796875, -0.74432373046875, -0.7023468017578125, -0.660369873046875, -0.6183929443359375, -0.576416015625, -0.5344390869140625, -0.492462158203125, -0.4504852294921875, -0.40850830078125, -0.3665313720703125, -0.324554443359375, -0.2825775146484375, -0.2406005859375, -0.1986236572265625, -0.156646728515625, -0.1146697998046875, -0.07269287109375, -0.0307159423828125, 0.011260986328125, 0.0532379150390625, 0.09521484375, 0.1371917724609375, 0.179168701171875, 0.2211456298828125, 0.26312255859375, 0.3050994873046875, 0.347076416015625, 0.3890533447265625, 0.4310302734375, 0.4730072021484375, 0.514984130859375, 0.5569610595703125, 0.59893798828125, 0.6409149169921875, 0.682891845703125, 0.7248687744140625, 0.766845703125, 0.8088226318359375, 0.850799560546875, 0.8927764892578125, 0.93475341796875, 0.9767303466796875, 1.018707275390625, 1.0606842041015625, 1.1026611328125, 1.1446380615234375, 1.186614990234375, 1.2285919189453125, 1.27056884765625, 1.3125457763671875, 1.354522705078125, 1.3964996337890625, 1.4384765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 12.0, 7.0, 11.0, 14.0, 12.0, 10.0, 24.0, 18.0, 36.0, 21.0, 29.0, 37.0, 24.0, 35.0, 36.0, 31.0, 41.0, 43.0, 51.0, 38.0, 34.0, 41.0, 40.0, 29.0, 38.0, 36.0, 32.0, 32.0, 27.0, 13.0, 22.0, 19.0, 22.0, 13.0, 16.0, 4.0, 10.0, 5.0, 6.0, 7.0, 4.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.7978515625, -0.773406982421875, -0.74896240234375, -0.724517822265625, -0.7000732421875, -0.675628662109375, -0.65118408203125, -0.626739501953125, -0.602294921875, -0.577850341796875, -0.55340576171875, -0.528961181640625, -0.5045166015625, -0.480072021484375, -0.45562744140625, -0.431182861328125, -0.40673828125, -0.382293701171875, -0.35784912109375, -0.333404541015625, -0.3089599609375, -0.284515380859375, -0.26007080078125, -0.235626220703125, -0.211181640625, -0.186737060546875, -0.16229248046875, -0.137847900390625, -0.1134033203125, -0.088958740234375, -0.06451416015625, -0.040069580078125, -0.015625, 0.008819580078125, 0.03326416015625, 0.057708740234375, 0.0821533203125, 0.106597900390625, 0.13104248046875, 0.155487060546875, 0.179931640625, 0.204376220703125, 0.22882080078125, 0.253265380859375, 0.2777099609375, 0.302154541015625, 0.32659912109375, 0.351043701171875, 0.37548828125, 0.399932861328125, 0.42437744140625, 0.448822021484375, 0.4732666015625, 0.497711181640625, 0.52215576171875, 0.546600341796875, 0.571044921875, 0.595489501953125, 0.61993408203125, 0.644378662109375, 0.6688232421875, 0.693267822265625, 0.71771240234375, 0.742156982421875, 0.7666015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 14.0, 9.0, 11.0, 24.0, 26.0, 23.0, 49.0, 46.0, 70.0, 109.0, 134.0, 206.0, 301.0, 448.0, 689.0, 1165.0, 1814.0, 3006.0, 5333.0, 11173.0, 27505.0, 90041.0, 651191.0, 180208.0, 42174.0, 15947.0, 7047.0, 3785.0, 2115.0, 1376.0, 812.0, 541.0, 326.0, 206.0, 154.0, 137.0, 82.0, 67.0, 50.0, 40.0, 21.0, 28.0, 8.0, 13.0, 5.0, 7.0, 9.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.11962890625, -0.11607933044433594, -0.11252975463867188, -0.10898017883300781, -0.10543060302734375, -0.10188102722167969, -0.09833145141601562, -0.09478187561035156, -0.0912322998046875, -0.08768272399902344, -0.08413314819335938, -0.08058357238769531, -0.07703399658203125, -0.07348442077636719, -0.06993484497070312, -0.06638526916503906, -0.062835693359375, -0.05928611755371094, -0.055736541748046875, -0.05218696594238281, -0.04863739013671875, -0.04508781433105469, -0.041538238525390625, -0.03798866271972656, -0.0344390869140625, -0.030889511108398438, -0.027339935302734375, -0.023790359497070312, -0.02024078369140625, -0.016691207885742188, -0.013141632080078125, -0.009592056274414062, -0.00604248046875, -0.0024929046630859375, 0.001056671142578125, 0.0046062469482421875, 0.00815582275390625, 0.011705398559570312, 0.015254974365234375, 0.018804550170898438, 0.0223541259765625, 0.025903701782226562, 0.029453277587890625, 0.03300285339355469, 0.03655242919921875, 0.04010200500488281, 0.043651580810546875, 0.04720115661621094, 0.050750732421875, 0.05430030822753906, 0.057849884033203125, 0.06139945983886719, 0.06494903564453125, 0.06849861145019531, 0.07204818725585938, 0.07559776306152344, 0.0791473388671875, 0.08269691467285156, 0.08624649047851562, 0.08979606628417969, 0.09334564208984375, 0.09689521789550781, 0.10044479370117188, 0.10399436950683594, 0.1075439453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 6.0, 5.0, 5.0, 12.0, 5.0, 16.0, 8.0, 27.0, 19.0, 46.0, 34.0, 43.0, 60.0, 132.0, 95.0, 108.0, 76.0, 50.0, 67.0, 40.0, 35.0, 18.0, 23.0, 13.0, 7.0, 12.0, 9.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-06, -5.991198122501373e-06, -5.783513188362122e-06, -5.57582825422287e-06, -5.368143320083618e-06, -5.1604583859443665e-06, -4.952773451805115e-06, -4.745088517665863e-06, -4.537403583526611e-06, -4.32971864938736e-06, -4.122033715248108e-06, -3.914348781108856e-06, -3.7066638469696045e-06, -3.4989789128303528e-06, -3.291293978691101e-06, -3.0836090445518494e-06, -2.8759241104125977e-06, -2.668239176273346e-06, -2.4605542421340942e-06, -2.2528693079948425e-06, -2.045184373855591e-06, -1.8374994397163391e-06, -1.6298145055770874e-06, -1.4221295714378357e-06, -1.214444637298584e-06, -1.0067597031593323e-06, -7.990747690200806e-07, -5.913898348808289e-07, -3.8370490074157715e-07, -1.7601996660232544e-07, 3.166496753692627e-08, 2.39349901676178e-07, 4.470348358154297e-07, 6.547197699546814e-07, 8.624047040939331e-07, 1.0700896382331848e-06, 1.2777745723724365e-06, 1.4854595065116882e-06, 1.69314444065094e-06, 1.9008293747901917e-06, 2.1085143089294434e-06, 2.316199243068695e-06, 2.5238841772079468e-06, 2.7315691113471985e-06, 2.93925404548645e-06, 3.146938979625702e-06, 3.3546239137649536e-06, 3.5623088479042053e-06, 3.769993782043457e-06, 3.977678716182709e-06, 4.1853636503219604e-06, 4.393048584461212e-06, 4.600733518600464e-06, 4.8084184527397156e-06, 5.016103386878967e-06, 5.223788321018219e-06, 5.431473255157471e-06, 5.639158189296722e-06, 5.846843123435974e-06, 6.054528057575226e-06, 6.2622129917144775e-06, 6.469897925853729e-06, 6.677582859992981e-06, 6.885267794132233e-06, 7.092952728271484e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 7.0, 13.0, 16.0, 18.0, 41.0, 44.0, 62.0, 84.0, 120.0, 169.0, 270.0, 354.0, 618.0, 934.0, 1461.0, 2388.0, 4157.0, 6928.0, 12425.0, 22997.0, 44332.0, 95539.0, 309605.0, 342502.0, 101734.0, 46625.0, 23674.0, 13100.0, 7154.0, 4267.0, 2535.0, 1571.0, 958.0, 598.0, 415.0, 257.0, 186.0, 121.0, 77.0, 65.0, 42.0, 29.0, 15.0, 22.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.08099365234375, -0.07854175567626953, -0.07608985900878906, -0.0736379623413086, -0.07118606567382812, -0.06873416900634766, -0.06628227233886719, -0.06383037567138672, -0.06137847900390625, -0.05892658233642578, -0.05647468566894531, -0.054022789001464844, -0.051570892333984375, -0.049118995666503906, -0.04666709899902344, -0.04421520233154297, -0.0417633056640625, -0.03931140899658203, -0.03685951232910156, -0.034407615661621094, -0.031955718994140625, -0.029503822326660156, -0.027051925659179688, -0.02460002899169922, -0.02214813232421875, -0.01969623565673828, -0.017244338989257812, -0.014792442321777344, -0.012340545654296875, -0.009888648986816406, -0.0074367523193359375, -0.004984855651855469, -0.002532958984375, -8.106231689453125e-05, 0.0023708343505859375, 0.004822731018066406, 0.007274627685546875, 0.009726524353027344, 0.012178421020507812, 0.014630317687988281, 0.01708221435546875, 0.01953411102294922, 0.021986007690429688, 0.024437904357910156, 0.026889801025390625, 0.029341697692871094, 0.03179359436035156, 0.03424549102783203, 0.0366973876953125, 0.03914928436279297, 0.04160118103027344, 0.044053077697753906, 0.046504974365234375, 0.048956871032714844, 0.05140876770019531, 0.05386066436767578, 0.05631256103515625, 0.05876445770263672, 0.06121635437011719, 0.06366825103759766, 0.06612014770507812, 0.0685720443725586, 0.07102394104003906, 0.07347583770751953, 0.075927734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 14.0, 16.0, 11.0, 17.0, 25.0, 31.0, 38.0, 55.0, 69.0, 63.0, 90.0, 85.0, 67.0, 77.0, 68.0, 49.0, 36.0, 43.0, 14.0, 23.0, 23.0, 19.0, 8.0, 9.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0216522216796875, -0.020944833755493164, -0.020237445831298828, -0.019530057907104492, -0.018822669982910156, -0.01811528205871582, -0.017407894134521484, -0.01670050621032715, -0.015993118286132812, -0.015285730361938477, -0.01457834243774414, -0.013870954513549805, -0.013163566589355469, -0.012456178665161133, -0.011748790740966797, -0.011041402816772461, -0.010334014892578125, -0.009626626968383789, -0.008919239044189453, -0.008211851119995117, -0.007504463195800781, -0.006797075271606445, -0.006089687347412109, -0.0053822994232177734, -0.0046749114990234375, -0.0039675235748291016, -0.0032601356506347656, -0.0025527477264404297, -0.0018453598022460938, -0.0011379718780517578, -0.0004305839538574219, 0.00027680397033691406, 0.00098419189453125, 0.001691579818725586, 0.002398967742919922, 0.003106355667114258, 0.0038137435913085938, 0.00452113151550293, 0.005228519439697266, 0.0059359073638916016, 0.0066432952880859375, 0.0073506832122802734, 0.00805807113647461, 0.008765459060668945, 0.009472846984863281, 0.010180234909057617, 0.010887622833251953, 0.011595010757446289, 0.012302398681640625, 0.013009786605834961, 0.013717174530029297, 0.014424562454223633, 0.015131950378417969, 0.015839338302612305, 0.01654672622680664, 0.017254114151000977, 0.017961502075195312, 0.01866888999938965, 0.019376277923583984, 0.02008366584777832, 0.020791053771972656, 0.021498441696166992, 0.022205829620361328, 0.022913217544555664, 0.02362060546875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 8.0, 4.0, 4.0, 10.0, 10.0, 14.0, 17.0, 19.0, 17.0, 18.0, 39.0, 36.0, 33.0, 46.0, 44.0, 71.0, 79.0, 92.0, 76.0, 59.0, 53.0, 37.0, 36.0, 26.0, 28.0, 10.0, 23.0, 9.0, 19.0, 7.0, 10.0, 8.0, 12.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2287468910217285, -1.188111424446106, -1.1474759578704834, -1.1068404912948608, -1.0662050247192383, -1.0255695581436157, -0.9849341511726379, -0.9442986845970154, -0.9036632180213928, -0.8630277514457703, -0.8223922848701477, -0.7817568182945251, -0.7411214113235474, -0.7004859447479248, -0.6598504781723022, -0.6192150115966797, -0.5785795450210571, -0.5379440784454346, -0.497308611869812, -0.45667317509651184, -0.4160377085208893, -0.3754022419452667, -0.33476680517196655, -0.294131338596344, -0.25349587202072144, -0.21286040544509888, -0.1722249537706375, -0.13158950209617615, -0.09095403552055359, -0.05031856894493103, -0.009683117270469666, 0.0309523344039917, 0.07158792018890381, 0.11222337931394577, 0.15285883843898773, 0.1934942901134491, 0.23412975668907166, 0.2747652232646942, 0.3154006600379944, 0.35603612661361694, 0.3966715931892395, 0.43730705976486206, 0.4779425263404846, 0.5185779929161072, 0.559213399887085, 0.5998488664627075, 0.6404843330383301, 0.6811197996139526, 0.7217552661895752, 0.7623907327651978, 0.8030261993408203, 0.8436616659164429, 0.8842971324920654, 0.924932599067688, 0.9655680060386658, 1.0062034130096436, 1.0468389987945557, 1.0874744653701782, 1.1281099319458008, 1.1687453985214233, 1.209380865097046, 1.2500163316726685, 1.290651798248291, 1.331287145614624, 1.3719226121902466]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 8.0, 2.0, 1.0, 7.0, 12.0, 12.0, 15.0, 28.0, 18.0, 21.0, 29.0, 27.0, 31.0, 34.0, 31.0, 34.0, 29.0, 40.0, 37.0, 38.0, 42.0, 38.0, 38.0, 50.0, 38.0, 40.0, 35.0, 51.0, 19.0, 22.0, 18.0, 28.0, 21.0, 15.0, 23.0, 12.0, 11.0, 14.0, 13.0, 6.0, 6.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2606418132781982, -1.2223528623580933, -1.1840640306472778, -1.1457750797271729, -1.1074861288070679, -1.069197177886963, -1.0309083461761475, -0.9926193952560425, -0.9543305039405823, -0.9160416126251221, -0.8777526617050171, -0.8394637703895569, -0.8011748790740967, -0.7628859281539917, -0.7245970368385315, -0.6863081455230713, -0.6480191946029663, -0.6097303032875061, -0.5714413523674011, -0.5331524610519409, -0.4948635399341583, -0.45657461881637573, -0.4182857275009155, -0.37999680638313293, -0.34170788526535034, -0.30341896414756775, -0.26513004302978516, -0.22684115171432495, -0.18855223059654236, -0.15026330947875977, -0.11197440326213837, -0.07368549704551697, -0.035396456718444824, 0.0028924569487571716, 0.04118137061595917, 0.07947028428316116, 0.11775919795036316, 0.15604811906814575, 0.19433702528476715, 0.23262593150138855, 0.27091485261917114, 0.30920377373695374, 0.34749269485473633, 0.38578158617019653, 0.4240705072879791, 0.4623594284057617, 0.5006483197212219, 0.5389372110366821, 0.5772261619567871, 0.6155150532722473, 0.6538040041923523, 0.6920928955078125, 0.7303818464279175, 0.7686707377433777, 0.8069596290588379, 0.8452485799789429, 0.8835374712944031, 0.9218263626098633, 0.9601153135299683, 0.9984042048454285, 1.0366930961608887, 1.0749820470809937, 1.1132709980010986, 1.151559829711914, 1.189848780632019]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 9.0, 14.0, 22.0, 34.0, 63.0, 75.0, 127.0, 161.0, 244.0, 346.0, 506.0, 840.0, 1205.0, 1737.0, 2621.0, 3900.0, 5799.0, 8729.0, 13699.0, 21908.0, 36443.0, 63103.0, 118974.0, 231326.0, 241906.0, 125389.0, 66729.0, 38242.0, 22856.0, 13996.0, 9182.0, 6013.0, 4094.0, 2689.0, 1812.0, 1211.0, 820.0, 544.0, 376.0, 231.0, 195.0, 134.0, 99.0, 47.0, 40.0, 25.0, 18.0, 11.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91796875, -1.8541259765625, -1.790283203125, -1.7264404296875, -1.66259765625, -1.5987548828125, -1.534912109375, -1.4710693359375, -1.4072265625, -1.3433837890625, -1.279541015625, -1.2156982421875, -1.15185546875, -1.0880126953125, -1.024169921875, -0.9603271484375, -0.896484375, -0.8326416015625, -0.768798828125, -0.7049560546875, -0.64111328125, -0.5772705078125, -0.513427734375, -0.4495849609375, -0.3857421875, -0.3218994140625, -0.258056640625, -0.1942138671875, -0.13037109375, -0.0665283203125, -0.002685546875, 0.0611572265625, 0.125, 0.1888427734375, 0.252685546875, 0.3165283203125, 0.38037109375, 0.4442138671875, 0.508056640625, 0.5718994140625, 0.6357421875, 0.6995849609375, 0.763427734375, 0.8272705078125, 0.89111328125, 0.9549560546875, 1.018798828125, 1.0826416015625, 1.146484375, 1.2103271484375, 1.274169921875, 1.3380126953125, 1.40185546875, 1.4656982421875, 1.529541015625, 1.5933837890625, 1.6572265625, 1.7210693359375, 1.784912109375, 1.8487548828125, 1.91259765625, 1.9764404296875, 2.040283203125, 2.1041259765625, 2.16796875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 6.0, 12.0, 21.0, 20.0, 11.0, 24.0, 16.0, 25.0, 25.0, 35.0, 38.0, 27.0, 26.0, 29.0, 30.0, 25.0, 40.0, 46.0, 41.0, 40.0, 41.0, 50.0, 29.0, 35.0, 36.0, 35.0, 18.0, 23.0, 15.0, 23.0, 20.0, 16.0, 16.0, 12.0, 19.0, 16.0, 6.0, 4.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.078125, -1.04644775390625, -1.0147705078125, -0.98309326171875, -0.951416015625, -0.91973876953125, -0.8880615234375, -0.85638427734375, -0.82470703125, -0.79302978515625, -0.7613525390625, -0.72967529296875, -0.697998046875, -0.66632080078125, -0.6346435546875, -0.60296630859375, -0.5712890625, -0.53961181640625, -0.5079345703125, -0.47625732421875, -0.444580078125, -0.41290283203125, -0.3812255859375, -0.34954833984375, -0.31787109375, -0.28619384765625, -0.2545166015625, -0.22283935546875, -0.191162109375, -0.15948486328125, -0.1278076171875, -0.09613037109375, -0.064453125, -0.03277587890625, -0.0010986328125, 0.03057861328125, 0.062255859375, 0.09393310546875, 0.1256103515625, 0.15728759765625, 0.18896484375, 0.22064208984375, 0.2523193359375, 0.28399658203125, 0.315673828125, 0.34735107421875, 0.3790283203125, 0.41070556640625, 0.4423828125, 0.47406005859375, 0.5057373046875, 0.53741455078125, 0.569091796875, 0.60076904296875, 0.6324462890625, 0.66412353515625, 0.69580078125, 0.72747802734375, 0.7591552734375, 0.79083251953125, 0.822509765625, 0.85418701171875, 0.8858642578125, 0.91754150390625, 0.94921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 13.0, 20.0, 23.0, 35.0, 62.0, 74.0, 101.0, 173.0, 218.0, 360.0, 542.0, 748.0, 1196.0, 1768.0, 2594.0, 4133.0, 6525.0, 10277.0, 16996.0, 28676.0, 51182.0, 94091.0, 184636.0, 283327.0, 162826.0, 84216.0, 45796.0, 25846.0, 15538.0, 9361.0, 5952.0, 3756.0, 2554.0, 1691.0, 1027.0, 710.0, 467.0, 352.0, 227.0, 150.0, 105.0, 62.0, 35.0, 35.0, 25.0, 17.0, 10.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.072265625, -2.00628662109375, -1.9403076171875, -1.87432861328125, -1.808349609375, -1.74237060546875, -1.6763916015625, -1.61041259765625, -1.54443359375, -1.47845458984375, -1.4124755859375, -1.34649658203125, -1.280517578125, -1.21453857421875, -1.1485595703125, -1.08258056640625, -1.0166015625, -0.95062255859375, -0.8846435546875, -0.81866455078125, -0.752685546875, -0.68670654296875, -0.6207275390625, -0.55474853515625, -0.48876953125, -0.42279052734375, -0.3568115234375, -0.29083251953125, -0.224853515625, -0.15887451171875, -0.0928955078125, -0.02691650390625, 0.0390625, 0.10504150390625, 0.1710205078125, 0.23699951171875, 0.302978515625, 0.36895751953125, 0.4349365234375, 0.50091552734375, 0.56689453125, 0.63287353515625, 0.6988525390625, 0.76483154296875, 0.830810546875, 0.89678955078125, 0.9627685546875, 1.02874755859375, 1.0947265625, 1.16070556640625, 1.2266845703125, 1.29266357421875, 1.358642578125, 1.42462158203125, 1.4906005859375, 1.55657958984375, 1.62255859375, 1.68853759765625, 1.7545166015625, 1.82049560546875, 1.886474609375, 1.95245361328125, 2.0184326171875, 2.08441162109375, 2.150390625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 7.0, 14.0, 12.0, 22.0, 16.0, 17.0, 29.0, 17.0, 27.0, 27.0, 34.0, 32.0, 32.0, 41.0, 44.0, 38.0, 41.0, 31.0, 38.0, 31.0, 38.0, 18.0, 36.0, 43.0, 29.0, 22.0, 28.0, 29.0, 27.0, 24.0, 27.0, 13.0, 18.0, 13.0, 14.0, 9.0, 13.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.689453125, -0.6685791015625, -0.647705078125, -0.6268310546875, -0.60595703125, -0.5850830078125, -0.564208984375, -0.5433349609375, -0.5224609375, -0.5015869140625, -0.480712890625, -0.4598388671875, -0.43896484375, -0.4180908203125, -0.397216796875, -0.3763427734375, -0.35546875, -0.3345947265625, -0.313720703125, -0.2928466796875, -0.27197265625, -0.2510986328125, -0.230224609375, -0.2093505859375, -0.1884765625, -0.1676025390625, -0.146728515625, -0.1258544921875, -0.10498046875, -0.0841064453125, -0.063232421875, -0.0423583984375, -0.021484375, -0.0006103515625, 0.020263671875, 0.0411376953125, 0.06201171875, 0.0828857421875, 0.103759765625, 0.1246337890625, 0.1455078125, 0.1663818359375, 0.187255859375, 0.2081298828125, 0.22900390625, 0.2498779296875, 0.270751953125, 0.2916259765625, 0.3125, 0.3333740234375, 0.354248046875, 0.3751220703125, 0.39599609375, 0.4168701171875, 0.437744140625, 0.4586181640625, 0.4794921875, 0.5003662109375, 0.521240234375, 0.5421142578125, 0.56298828125, 0.5838623046875, 0.604736328125, 0.6256103515625, 0.646484375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 10.0, 16.0, 29.0, 37.0, 49.0, 82.0, 97.0, 129.0, 177.0, 243.0, 370.0, 475.0, 692.0, 946.0, 1392.0, 2001.0, 3112.0, 4613.0, 6941.0, 11103.0, 18237.0, 35061.0, 109659.0, 729890.0, 57001.0, 25277.0, 14188.0, 8940.0, 5782.0, 3710.0, 2392.0, 1770.0, 1206.0, 847.0, 573.0, 409.0, 313.0, 202.0, 162.0, 126.0, 80.0, 71.0, 39.0, 25.0, 24.0, 18.0, 9.0, 11.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-1.583984375, -1.5348968505859375, -1.485809326171875, -1.4367218017578125, -1.38763427734375, -1.3385467529296875, -1.289459228515625, -1.2403717041015625, -1.1912841796875, -1.1421966552734375, -1.093109130859375, -1.0440216064453125, -0.99493408203125, -0.9458465576171875, -0.896759033203125, -0.8476715087890625, -0.798583984375, -0.7494964599609375, -0.700408935546875, -0.6513214111328125, -0.60223388671875, -0.5531463623046875, -0.504058837890625, -0.4549713134765625, -0.4058837890625, -0.3567962646484375, -0.307708740234375, -0.2586212158203125, -0.20953369140625, -0.1604461669921875, -0.111358642578125, -0.0622711181640625, -0.01318359375, 0.0359039306640625, 0.084991455078125, 0.1340789794921875, 0.18316650390625, 0.2322540283203125, 0.281341552734375, 0.3304290771484375, 0.3795166015625, 0.4286041259765625, 0.477691650390625, 0.5267791748046875, 0.57586669921875, 0.6249542236328125, 0.674041748046875, 0.7231292724609375, 0.772216796875, 0.8213043212890625, 0.870391845703125, 0.9194793701171875, 0.96856689453125, 1.0176544189453125, 1.066741943359375, 1.1158294677734375, 1.1649169921875, 1.2140045166015625, 1.263092041015625, 1.3121795654296875, 1.36126708984375, 1.4103546142578125, 1.459442138671875, 1.5085296630859375, 1.5576171875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 15.0, 9.0, 10.0, 13.0, 25.0, 31.0, 64.0, 143.0, 444.0, 75.0, 36.0, 26.0, 16.0, 23.0, 9.0, 5.0, 5.0, 7.0, 8.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-05, -4.114210605621338e-05, -3.936886787414551e-05, -3.759562969207764e-05, -3.5822391510009766e-05, -3.4049153327941895e-05, -3.2275915145874023e-05, -3.0502676963806152e-05, -2.872943878173828e-05, -2.695620059967041e-05, -2.518296241760254e-05, -2.3409724235534668e-05, -2.1636486053466797e-05, -1.9863247871398926e-05, -1.8090009689331055e-05, -1.6316771507263184e-05, -1.4543533325195312e-05, -1.2770295143127441e-05, -1.099705696105957e-05, -9.2238187789917e-06, -7.450580596923828e-06, -5.677342414855957e-06, -3.904104232788086e-06, -2.130866050720215e-06, -3.5762786865234375e-07, 1.4156103134155273e-06, 3.1888484954833984e-06, 4.9620866775512695e-06, 6.735324859619141e-06, 8.508563041687012e-06, 1.0281801223754883e-05, 1.2055039405822754e-05, 1.3828277587890625e-05, 1.5601515769958496e-05, 1.7374753952026367e-05, 1.9147992134094238e-05, 2.092123031616211e-05, 2.269446849822998e-05, 2.446770668029785e-05, 2.6240944862365723e-05, 2.8014183044433594e-05, 2.9787421226501465e-05, 3.1560659408569336e-05, 3.333389759063721e-05, 3.510713577270508e-05, 3.688037395477295e-05, 3.865361213684082e-05, 4.042685031890869e-05, 4.220008850097656e-05, 4.3973326683044434e-05, 4.5746564865112305e-05, 4.7519803047180176e-05, 4.929304122924805e-05, 5.106627941131592e-05, 5.283951759338379e-05, 5.461275577545166e-05, 5.638599395751953e-05, 5.81592321395874e-05, 5.9932470321655273e-05, 6.170570850372314e-05, 6.347894668579102e-05, 6.525218486785889e-05, 6.702542304992676e-05, 6.879866123199463e-05, 7.05718994140625e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 10.0, 15.0, 15.0, 34.0, 48.0, 47.0, 80.0, 109.0, 168.0, 203.0, 313.0, 446.0, 721.0, 1176.0, 1881.0, 3104.0, 5138.0, 9555.0, 17767.0, 38770.0, 174591.0, 701161.0, 46813.0, 20634.0, 10844.0, 5793.0, 3337.0, 2057.0, 1287.0, 811.0, 480.0, 332.0, 226.0, 162.0, 133.0, 78.0, 57.0, 51.0, 38.0, 15.0, 10.0, 15.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.205078125, -2.138458251953125, -2.07183837890625, -2.005218505859375, -1.9385986328125, -1.871978759765625, -1.80535888671875, -1.738739013671875, -1.672119140625, -1.605499267578125, -1.53887939453125, -1.472259521484375, -1.4056396484375, -1.339019775390625, -1.27239990234375, -1.205780029296875, -1.13916015625, -1.072540283203125, -1.00592041015625, -0.939300537109375, -0.8726806640625, -0.806060791015625, -0.73944091796875, -0.672821044921875, -0.606201171875, -0.539581298828125, -0.47296142578125, -0.406341552734375, -0.3397216796875, -0.273101806640625, -0.20648193359375, -0.139862060546875, -0.0732421875, -0.006622314453125, 0.05999755859375, 0.126617431640625, 0.1932373046875, 0.259857177734375, 0.32647705078125, 0.393096923828125, 0.459716796875, 0.526336669921875, 0.59295654296875, 0.659576416015625, 0.7261962890625, 0.792816162109375, 0.85943603515625, 0.926055908203125, 0.99267578125, 1.059295654296875, 1.12591552734375, 1.192535400390625, 1.2591552734375, 1.325775146484375, 1.39239501953125, 1.459014892578125, 1.525634765625, 1.592254638671875, 1.65887451171875, 1.725494384765625, 1.7921142578125, 1.858734130859375, 1.92535400390625, 1.991973876953125, 2.05859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 4.0, 5.0, 6.0, 9.0, 8.0, 15.0, 19.0, 14.0, 31.0, 30.0, 129.0, 460.0, 61.0, 34.0, 23.0, 20.0, 18.0, 15.0, 24.0, 14.0, 6.0, 7.0, 8.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59619140625, -0.5782623291015625, -0.560333251953125, -0.5424041748046875, -0.52447509765625, -0.5065460205078125, -0.488616943359375, -0.4706878662109375, -0.4527587890625, -0.4348297119140625, -0.416900634765625, -0.3989715576171875, -0.38104248046875, -0.3631134033203125, -0.345184326171875, -0.3272552490234375, -0.309326171875, -0.2913970947265625, -0.273468017578125, -0.2555389404296875, -0.23760986328125, -0.2196807861328125, -0.201751708984375, -0.1838226318359375, -0.1658935546875, -0.1479644775390625, -0.130035400390625, -0.1121063232421875, -0.09417724609375, -0.0762481689453125, -0.058319091796875, -0.0403900146484375, -0.0224609375, -0.0045318603515625, 0.013397216796875, 0.0313262939453125, 0.04925537109375, 0.0671844482421875, 0.085113525390625, 0.1030426025390625, 0.1209716796875, 0.1389007568359375, 0.156829833984375, 0.1747589111328125, 0.19268798828125, 0.2106170654296875, 0.228546142578125, 0.2464752197265625, 0.264404296875, 0.2823333740234375, 0.300262451171875, 0.3181915283203125, 0.33612060546875, 0.3540496826171875, 0.371978759765625, 0.3899078369140625, 0.4078369140625, 0.4257659912109375, 0.443695068359375, 0.4616241455078125, 0.47955322265625, 0.4974822998046875, 0.515411376953125, 0.5333404541015625, 0.55126953125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 8.0, 8.0, 13.0, 15.0, 16.0, 18.0, 37.0, 46.0, 45.0, 73.0, 107.0, 85.0, 96.0, 90.0, 78.0, 43.0, 50.0, 18.0, 24.0, 17.0, 12.0, 18.0, 10.0, 10.0, 12.0, 7.0, 7.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3013391494750977, -1.2525334358215332, -1.2037277221679688, -1.1549220085144043, -1.1061162948608398, -1.0573105812072754, -1.008504867553711, -0.9596990942955017, -0.9108933806419373, -0.8620876669883728, -0.8132819533348083, -0.7644761800765991, -0.7156704664230347, -0.6668647527694702, -0.6180590391159058, -0.5692533254623413, -0.5204476118087769, -0.4716418981552124, -0.42283618450164795, -0.3740304410457611, -0.32522472739219666, -0.2764190137386322, -0.22761327028274536, -0.1788075566291809, -0.13000184297561646, -0.0811961218714714, -0.032390400767326355, 0.016415327787399292, 0.06522104144096375, 0.1140267550945282, 0.16283249855041504, 0.2116382122039795, 0.2604440450668335, 0.30924975872039795, 0.3580554723739624, 0.40686121582984924, 0.4556669294834137, 0.5044726133346558, 0.553278386592865, 0.6020841002464294, 0.6508898138999939, 0.6996955275535583, 0.7485012412071228, 0.797307014465332, 0.8461127281188965, 0.8949184417724609, 0.9437241554260254, 0.9925298690795898, 1.0413355827331543, 1.0901412963867188, 1.1389470100402832, 1.1877527236938477, 1.236558437347412, 1.2853641510009766, 1.334169864654541, 1.3829755783081055, 1.43178129196167, 1.4805870056152344, 1.5293927192687988, 1.5781984329223633, 1.6270041465759277, 1.6758098602294922, 1.7246155738830566, 1.773421287536621, 1.822227120399475]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 7.0, 13.0, 19.0, 24.0, 22.0, 18.0, 19.0, 34.0, 35.0, 29.0, 45.0, 31.0, 31.0, 41.0, 41.0, 44.0, 41.0, 38.0, 47.0, 35.0, 53.0, 31.0, 40.0, 27.0, 31.0, 23.0, 26.0, 19.0, 29.0, 10.0, 18.0, 12.0, 11.0, 11.0, 9.0, 12.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.186215877532959, -1.1497374773025513, -1.1132590770721436, -1.0767805576324463, -1.0403021574020386, -1.0038237571716309, -0.9673453569412231, -0.9308669567108154, -0.8943884968757629, -0.8579100966453552, -0.8214316368103027, -0.784953236579895, -0.7484748363494873, -0.7119963765144348, -0.6755179762840271, -0.6390395164489746, -0.6025611162185669, -0.5660827159881592, -0.5296042561531067, -0.493125855922699, -0.45664742588996887, -0.42016899585723877, -0.38369059562683105, -0.34721216559410095, -0.31073373556137085, -0.27425530552864075, -0.23777689039707184, -0.20129847526550293, -0.16482004523277283, -0.12834161520004272, -0.09186320006847382, -0.05538478493690491, -0.018906354904174805, 0.0175720676779747, 0.05405049026012421, 0.09052891284227371, 0.12700733542442322, 0.16348576545715332, 0.19996418058872223, 0.23644259572029114, 0.27292102575302124, 0.30939945578575134, 0.34587788581848145, 0.38235628604888916, 0.41883471608161926, 0.45531314611434937, 0.4917915463447571, 0.5282700061798096, 0.5647484064102173, 0.601226806640625, 0.6377052664756775, 0.6741836667060852, 0.7106621265411377, 0.7471405267715454, 0.7836189270019531, 0.8200973272323608, 0.8565757870674133, 0.893054187297821, 0.9295326471328735, 0.9660110473632812, 1.002489447593689, 1.0389678478240967, 1.075446367263794, 1.1119247674942017, 1.1484031677246094]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 9.0, 17.0, 27.0, 26.0, 43.0, 56.0, 85.0, 128.0, 192.0, 218.0, 288.0, 390.0, 609.0, 781.0, 1079.0, 1457.0, 2018.0, 2790.0, 3851.0, 5585.0, 7895.0, 11334.0, 16602.0, 24908.0, 38057.0, 62033.0, 103700.0, 190045.0, 437564.0, 1210844.0, 1169306.0, 428580.0, 194597.0, 104694.0, 61337.0, 37934.0, 24363.0, 16301.0, 10846.0, 7452.0, 4983.0, 3522.0, 2433.0, 1689.0, 1102.0, 876.0, 548.0, 415.0, 234.0, 160.0, 122.0, 59.0, 42.0, 25.0, 15.0, 8.0, 5.0, 4.0], "bins": [-1.3232421875, -1.286468505859375, -1.24969482421875, -1.212921142578125, -1.1761474609375, -1.139373779296875, -1.10260009765625, -1.065826416015625, -1.029052734375, -0.992279052734375, -0.95550537109375, -0.918731689453125, -0.8819580078125, -0.845184326171875, -0.80841064453125, -0.771636962890625, -0.73486328125, -0.698089599609375, -0.66131591796875, -0.624542236328125, -0.5877685546875, -0.550994873046875, -0.51422119140625, -0.477447509765625, -0.440673828125, -0.403900146484375, -0.36712646484375, -0.330352783203125, -0.2935791015625, -0.256805419921875, -0.22003173828125, -0.183258056640625, -0.146484375, -0.109710693359375, -0.07293701171875, -0.036163330078125, 0.0006103515625, 0.037384033203125, 0.07415771484375, 0.110931396484375, 0.147705078125, 0.184478759765625, 0.22125244140625, 0.258026123046875, 0.2947998046875, 0.331573486328125, 0.36834716796875, 0.405120849609375, 0.44189453125, 0.478668212890625, 0.51544189453125, 0.552215576171875, 0.5889892578125, 0.625762939453125, 0.66253662109375, 0.699310302734375, 0.736083984375, 0.772857666015625, 0.80963134765625, 0.846405029296875, 0.8831787109375, 0.919952392578125, 0.95672607421875, 0.993499755859375, 1.0302734375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 6.0, 19.0, 4.0, 17.0, 18.0, 18.0, 25.0, 25.0, 22.0, 35.0, 42.0, 41.0, 40.0, 27.0, 27.0, 39.0, 56.0, 33.0, 36.0, 35.0, 47.0, 38.0, 35.0, 37.0, 35.0, 36.0, 18.0, 20.0, 21.0, 19.0, 19.0, 17.0, 14.0, 10.0, 13.0, 9.0, 5.0, 5.0, 4.0, 5.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7368011474609375, -0.714813232421875, -0.6928253173828125, -0.67083740234375, -0.6488494873046875, -0.626861572265625, -0.6048736572265625, -0.5828857421875, -0.5608978271484375, -0.538909912109375, -0.5169219970703125, -0.49493408203125, -0.4729461669921875, -0.450958251953125, -0.4289703369140625, -0.406982421875, -0.3849945068359375, -0.363006591796875, -0.3410186767578125, -0.31903076171875, -0.2970428466796875, -0.275054931640625, -0.2530670166015625, -0.2310791015625, -0.2090911865234375, -0.187103271484375, -0.1651153564453125, -0.14312744140625, -0.1211395263671875, -0.099151611328125, -0.0771636962890625, -0.05517578125, -0.0331878662109375, -0.011199951171875, 0.0107879638671875, 0.03277587890625, 0.0547637939453125, 0.076751708984375, 0.0987396240234375, 0.1207275390625, 0.1427154541015625, 0.164703369140625, 0.1866912841796875, 0.20867919921875, 0.2306671142578125, 0.252655029296875, 0.2746429443359375, 0.296630859375, 0.3186187744140625, 0.340606689453125, 0.3625946044921875, 0.38458251953125, 0.4065704345703125, 0.428558349609375, 0.4505462646484375, 0.4725341796875, 0.4945220947265625, 0.516510009765625, 0.5384979248046875, 0.56048583984375, 0.5824737548828125, 0.604461669921875, 0.6264495849609375, 0.6484375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 9.0, 15.0, 17.0, 25.0, 39.0, 69.0, 75.0, 158.0, 244.0, 394.0, 606.0, 939.0, 1484.0, 2505.0, 4028.0, 6918.0, 12272.0, 21633.0, 39505.0, 76329.0, 157084.0, 369585.0, 1112948.0, 1504179.0, 486490.0, 196827.0, 92593.0, 47260.0, 25324.0, 14267.0, 8190.0, 4734.0, 2897.0, 1724.0, 1056.0, 697.0, 438.0, 243.0, 183.0, 111.0, 66.0, 38.0, 32.0, 16.0, 16.0, 11.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.48046875, -1.437103271484375, -1.39373779296875, -1.350372314453125, -1.3070068359375, -1.263641357421875, -1.22027587890625, -1.176910400390625, -1.133544921875, -1.090179443359375, -1.04681396484375, -1.003448486328125, -0.9600830078125, -0.916717529296875, -0.87335205078125, -0.829986572265625, -0.78662109375, -0.743255615234375, -0.69989013671875, -0.656524658203125, -0.6131591796875, -0.569793701171875, -0.52642822265625, -0.483062744140625, -0.439697265625, -0.396331787109375, -0.35296630859375, -0.309600830078125, -0.2662353515625, -0.222869873046875, -0.17950439453125, -0.136138916015625, -0.0927734375, -0.049407958984375, -0.00604248046875, 0.037322998046875, 0.0806884765625, 0.124053955078125, 0.16741943359375, 0.210784912109375, 0.254150390625, 0.297515869140625, 0.34088134765625, 0.384246826171875, 0.4276123046875, 0.470977783203125, 0.51434326171875, 0.557708740234375, 0.60107421875, 0.644439697265625, 0.68780517578125, 0.731170654296875, 0.7745361328125, 0.817901611328125, 0.86126708984375, 0.904632568359375, 0.947998046875, 0.991363525390625, 1.03472900390625, 1.078094482421875, 1.1214599609375, 1.164825439453125, 1.20819091796875, 1.251556396484375, 1.294921875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 7.0, 8.0, 16.0, 9.0, 16.0, 22.0, 45.0, 48.0, 75.0, 83.0, 97.0, 121.0, 151.0, 173.0, 189.0, 285.0, 299.0, 310.0, 298.0, 325.0, 276.0, 241.0, 188.0, 176.0, 145.0, 102.0, 79.0, 58.0, 60.0, 31.0, 38.0, 21.0, 20.0, 10.0, 18.0, 6.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40966796875, -0.3962364196777344, -0.38280487060546875, -0.3693733215332031, -0.3559417724609375, -0.3425102233886719, -0.32907867431640625, -0.3156471252441406, -0.302215576171875, -0.2887840270996094, -0.27535247802734375, -0.2619209289550781, -0.2484893798828125, -0.23505783081054688, -0.22162628173828125, -0.20819473266601562, -0.19476318359375, -0.18133163452148438, -0.16790008544921875, -0.15446853637695312, -0.1410369873046875, -0.12760543823242188, -0.11417388916015625, -0.10074234008789062, -0.087310791015625, -0.07387924194335938, -0.06044769287109375, -0.047016143798828125, -0.0335845947265625, -0.020153045654296875, -0.00672149658203125, 0.006710052490234375, 0.0201416015625, 0.033573150634765625, 0.04700469970703125, 0.060436248779296875, 0.0738677978515625, 0.08729934692382812, 0.10073089599609375, 0.11416244506835938, 0.127593994140625, 0.14102554321289062, 0.15445709228515625, 0.16788864135742188, 0.1813201904296875, 0.19475173950195312, 0.20818328857421875, 0.22161483764648438, 0.23504638671875, 0.24847793579101562, 0.26190948486328125, 0.2753410339355469, 0.2887725830078125, 0.3022041320800781, 0.31563568115234375, 0.3290672302246094, 0.342498779296875, 0.3559303283691406, 0.36936187744140625, 0.3827934265136719, 0.3962249755859375, 0.4096565246582031, 0.42308807373046875, 0.4365196228027344, 0.449951171875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 5.0, 8.0, 6.0, 7.0, 11.0, 13.0, 12.0, 23.0, 20.0, 28.0, 35.0, 40.0, 55.0, 80.0, 91.0, 86.0, 98.0, 77.0, 53.0, 54.0, 43.0, 30.0, 22.0, 16.0, 14.0, 9.0, 12.0, 6.0, 6.0, 8.0, 8.0, 6.0, 9.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.078287959098816, -1.046448826789856, -1.0146095752716064, -0.9827704429626465, -0.9509313106536865, -0.9190921783447266, -0.8872529864311218, -0.8554137945175171, -0.8235746622085571, -0.7917355298995972, -0.7598963379859924, -0.7280571460723877, -0.6962180137634277, -0.6643788814544678, -0.632539689540863, -0.6007004976272583, -0.5688613653182983, -0.5370222330093384, -0.5051830410957336, -0.4733438789844513, -0.44150471687316895, -0.4096655547618866, -0.37782639265060425, -0.3459872305393219, -0.31414806842803955, -0.2823089063167572, -0.25046974420547485, -0.2186305820941925, -0.18679141998291016, -0.1549522578716278, -0.12311309576034546, -0.09127393364906311, -0.05943489074707031, -0.027595728635787964, 0.004243433475494385, 0.03608259558677673, 0.06792175769805908, 0.09976091980934143, 0.13160008192062378, 0.16343924403190613, 0.19527840614318848, 0.22711756825447083, 0.2589567303657532, 0.2907958924770355, 0.32263505458831787, 0.3544742166996002, 0.38631337881088257, 0.4181525409221649, 0.44999170303344727, 0.4818308651447296, 0.513670027256012, 0.5455092191696167, 0.5773483514785767, 0.6091874837875366, 0.6410266757011414, 0.6728658676147461, 0.704704999923706, 0.736544132232666, 0.7683833241462708, 0.8002225160598755, 0.8320616483688354, 0.8639007806777954, 0.8957399725914001, 0.9275791645050049, 0.9594182968139648]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 3.0, 6.0, 8.0, 15.0, 11.0, 20.0, 22.0, 23.0, 26.0, 41.0, 29.0, 29.0, 35.0, 44.0, 35.0, 41.0, 36.0, 40.0, 44.0, 48.0, 34.0, 36.0, 50.0, 36.0, 27.0, 39.0, 28.0, 26.0, 25.0, 20.0, 23.0, 16.0, 16.0, 16.0, 10.0, 10.0, 5.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9402976036071777, -0.9146940112113953, -0.8890904188156128, -0.8634868264198303, -0.8378832340240479, -0.8122796416282654, -0.7866760492324829, -0.7610725164413452, -0.735468864440918, -0.7098652720451355, -0.684261679649353, -0.6586580872535706, -0.6330544948577881, -0.6074509024620056, -0.5818473100662231, -0.5562437772750854, -0.530640184879303, -0.5050365924835205, -0.47943300008773804, -0.45382940769195557, -0.4282258152961731, -0.4026222229003906, -0.37701866030693054, -0.35141506791114807, -0.3258114755153656, -0.30020788311958313, -0.27460429072380066, -0.24900071322917938, -0.2233971208333969, -0.19779352843761444, -0.17218995094299316, -0.1465863585472107, -0.12098276615142822, -0.09537917375564575, -0.06977558881044388, -0.044172003865242004, -0.018568411469459534, 0.007035180926322937, 0.032638758420944214, 0.058242350816726685, 0.08384594321250916, 0.10944953560829163, 0.1350531280040741, 0.16065670549869537, 0.18626029789447784, 0.21186389029026031, 0.2374674677848816, 0.26307106018066406, 0.28867465257644653, 0.314278244972229, 0.3398818373680115, 0.36548542976379395, 0.3910890221595764, 0.4166926145553589, 0.44229617714881897, 0.46789976954460144, 0.4935033619403839, 0.519106924533844, 0.5447105169296265, 0.5703141093254089, 0.5959177017211914, 0.6215212941169739, 0.6471248865127563, 0.6727284789085388, 0.6983320713043213]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 20.0, 27.0, 42.0, 61.0, 95.0, 139.0, 254.0, 338.0, 537.0, 841.0, 1258.0, 2025.0, 3057.0, 5201.0, 8356.0, 14347.0, 25263.0, 45040.0, 85287.0, 165151.0, 272909.0, 193972.0, 100681.0, 53320.0, 28593.0, 16337.0, 9769.0, 5758.0, 3556.0, 2265.0, 1441.0, 888.0, 631.0, 351.0, 246.0, 156.0, 116.0, 60.0, 43.0, 38.0, 24.0, 14.0, 12.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.419189453125, -0.4067230224609375, -0.394256591796875, -0.3817901611328125, -0.36932373046875, -0.3568572998046875, -0.344390869140625, -0.3319244384765625, -0.3194580078125, -0.3069915771484375, -0.294525146484375, -0.2820587158203125, -0.26959228515625, -0.2571258544921875, -0.244659423828125, -0.2321929931640625, -0.2197265625, -0.2072601318359375, -0.194793701171875, -0.1823272705078125, -0.16986083984375, -0.1573944091796875, -0.144927978515625, -0.1324615478515625, -0.1199951171875, -0.1075286865234375, -0.095062255859375, -0.0825958251953125, -0.07012939453125, -0.0576629638671875, -0.045196533203125, -0.0327301025390625, -0.020263671875, -0.0077972412109375, 0.004669189453125, 0.0171356201171875, 0.02960205078125, 0.0420684814453125, 0.054534912109375, 0.0670013427734375, 0.0794677734375, 0.0919342041015625, 0.104400634765625, 0.1168670654296875, 0.12933349609375, 0.1417999267578125, 0.154266357421875, 0.1667327880859375, 0.17919921875, 0.1916656494140625, 0.204132080078125, 0.2165985107421875, 0.22906494140625, 0.2415313720703125, 0.253997802734375, 0.2664642333984375, 0.2789306640625, 0.2913970947265625, 0.303863525390625, 0.3163299560546875, 0.32879638671875, 0.3412628173828125, 0.353729248046875, 0.3661956787109375, 0.378662109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 4.0, 9.0, 8.0, 7.0, 14.0, 18.0, 23.0, 29.0, 24.0, 34.0, 30.0, 25.0, 37.0, 45.0, 41.0, 45.0, 42.0, 41.0, 36.0, 47.0, 48.0, 32.0, 37.0, 39.0, 32.0, 33.0, 40.0, 29.0, 26.0, 17.0, 15.0, 12.0, 17.0, 15.0, 12.0, 7.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0], "bins": [-1.025390625, -0.9993057250976562, -0.9732208251953125, -0.9471359252929688, -0.921051025390625, -0.8949661254882812, -0.8688812255859375, -0.8427963256835938, -0.81671142578125, -0.7906265258789062, -0.7645416259765625, -0.7384567260742188, -0.712371826171875, -0.6862869262695312, -0.6602020263671875, -0.6341171264648438, -0.6080322265625, -0.5819473266601562, -0.5558624267578125, -0.5297775268554688, -0.503692626953125, -0.47760772705078125, -0.4515228271484375, -0.42543792724609375, -0.39935302734375, -0.37326812744140625, -0.3471832275390625, -0.32109832763671875, -0.295013427734375, -0.26892852783203125, -0.2428436279296875, -0.21675872802734375, -0.190673828125, -0.16458892822265625, -0.1385040283203125, -0.11241912841796875, -0.086334228515625, -0.06024932861328125, -0.0341644287109375, -0.00807952880859375, 0.01800537109375, 0.04409027099609375, 0.0701751708984375, 0.09626007080078125, 0.122344970703125, 0.14842987060546875, 0.1745147705078125, 0.20059967041015625, 0.2266845703125, 0.25276947021484375, 0.2788543701171875, 0.30493927001953125, 0.331024169921875, 0.35710906982421875, 0.3831939697265625, 0.40927886962890625, 0.43536376953125, 0.46144866943359375, 0.4875335693359375, 0.5136184692382812, 0.539703369140625, 0.5657882690429688, 0.5918731689453125, 0.6179580688476562, 0.64404296875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 11.0, 23.0, 29.0, 49.0, 76.0, 87.0, 140.0, 225.0, 307.0, 431.0, 646.0, 842.0, 1257.0, 1858.0, 2791.0, 4655.0, 7588.0, 14235.0, 29815.0, 77565.0, 296011.0, 431528.0, 101520.0, 36260.0, 16725.0, 8780.0, 5239.0, 3306.0, 2047.0, 1408.0, 935.0, 662.0, 474.0, 313.0, 209.0, 159.0, 99.0, 82.0, 43.0, 36.0, 19.0, 20.0, 12.0, 8.0, 10.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6484375, -0.6294326782226562, -0.6104278564453125, -0.5914230346679688, -0.572418212890625, -0.5534133911132812, -0.5344085693359375, -0.5154037475585938, -0.49639892578125, -0.47739410400390625, -0.4583892822265625, -0.43938446044921875, -0.420379638671875, -0.40137481689453125, -0.3823699951171875, -0.36336517333984375, -0.3443603515625, -0.32535552978515625, -0.3063507080078125, -0.28734588623046875, -0.268341064453125, -0.24933624267578125, -0.2303314208984375, -0.21132659912109375, -0.19232177734375, -0.17331695556640625, -0.1543121337890625, -0.13530731201171875, -0.116302490234375, -0.09729766845703125, -0.0782928466796875, -0.05928802490234375, -0.040283203125, -0.02127838134765625, -0.0022735595703125, 0.01673126220703125, 0.035736083984375, 0.05474090576171875, 0.0737457275390625, 0.09275054931640625, 0.11175537109375, 0.13076019287109375, 0.1497650146484375, 0.16876983642578125, 0.187774658203125, 0.20677947998046875, 0.2257843017578125, 0.24478912353515625, 0.2637939453125, 0.28279876708984375, 0.3018035888671875, 0.32080841064453125, 0.339813232421875, 0.35881805419921875, 0.3778228759765625, 0.39682769775390625, 0.41583251953125, 0.43483734130859375, 0.4538421630859375, 0.47284698486328125, 0.491851806640625, 0.5108566284179688, 0.5298614501953125, 0.5488662719726562, 0.56787109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 4.0, 12.0, 11.0, 9.0, 12.0, 16.0, 20.0, 27.0, 24.0, 28.0, 26.0, 26.0, 29.0, 32.0, 33.0, 42.0, 34.0, 51.0, 33.0, 29.0, 45.0, 39.0, 39.0, 46.0, 32.0, 24.0, 34.0, 30.0, 34.0, 25.0, 22.0, 17.0, 9.0, 19.0, 17.0, 8.0, 15.0, 7.0, 6.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50146484375, -0.4863929748535156, -0.47132110595703125, -0.4562492370605469, -0.4411773681640625, -0.4261054992675781, -0.41103363037109375, -0.3959617614746094, -0.380889892578125, -0.3658180236816406, -0.35074615478515625, -0.3356742858886719, -0.3206024169921875, -0.3055305480957031, -0.29045867919921875, -0.2753868103027344, -0.26031494140625, -0.24524307250976562, -0.23017120361328125, -0.21509933471679688, -0.2000274658203125, -0.18495559692382812, -0.16988372802734375, -0.15481185913085938, -0.139739990234375, -0.12466812133789062, -0.10959625244140625, -0.09452438354492188, -0.0794525146484375, -0.06438064575195312, -0.04930877685546875, -0.034236907958984375, -0.0191650390625, -0.004093170166015625, 0.01097869873046875, 0.026050567626953125, 0.0411224365234375, 0.056194305419921875, 0.07126617431640625, 0.08633804321289062, 0.101409912109375, 0.11648178100585938, 0.13155364990234375, 0.14662551879882812, 0.1616973876953125, 0.17676925659179688, 0.19184112548828125, 0.20691299438476562, 0.22198486328125, 0.23705673217773438, 0.25212860107421875, 0.2672004699707031, 0.2822723388671875, 0.2973442077636719, 0.31241607666015625, 0.3274879455566406, 0.342559814453125, 0.3576316833496094, 0.37270355224609375, 0.3877754211425781, 0.4028472900390625, 0.4179191589355469, 0.43299102783203125, 0.4480628967285156, 0.463134765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 8.0, 11.0, 3.0, 20.0, 23.0, 24.0, 34.0, 50.0, 72.0, 106.0, 145.0, 194.0, 366.0, 476.0, 656.0, 1144.0, 1745.0, 3000.0, 5324.0, 10702.0, 24810.0, 75538.0, 581688.0, 254324.0, 49450.0, 18811.0, 8577.0, 4497.0, 2456.0, 1465.0, 944.0, 644.0, 350.0, 237.0, 190.0, 121.0, 71.0, 69.0, 61.0, 36.0, 37.0, 11.0, 22.0, 10.0, 6.0, 8.0, 5.0, 0.0, 1.0, 8.0, 3.0, 0.0, 2.0], "bins": [-0.058746337890625, -0.05701017379760742, -0.055274009704589844, -0.053537845611572266, -0.05180168151855469, -0.05006551742553711, -0.04832935333251953, -0.04659318923950195, -0.044857025146484375, -0.0431208610534668, -0.04138469696044922, -0.03964853286743164, -0.03791236877441406, -0.036176204681396484, -0.034440040588378906, -0.03270387649536133, -0.03096771240234375, -0.029231548309326172, -0.027495384216308594, -0.025759220123291016, -0.024023056030273438, -0.02228689193725586, -0.02055072784423828, -0.018814563751220703, -0.017078399658203125, -0.015342235565185547, -0.013606071472167969, -0.01186990737915039, -0.010133743286132812, -0.008397579193115234, -0.006661415100097656, -0.004925251007080078, -0.0031890869140625, -0.0014529228210449219, 0.00028324127197265625, 0.0020194053649902344, 0.0037555694580078125, 0.005491733551025391, 0.007227897644042969, 0.008964061737060547, 0.010700225830078125, 0.012436389923095703, 0.014172554016113281, 0.01590871810913086, 0.017644882202148438, 0.019381046295166016, 0.021117210388183594, 0.022853374481201172, 0.02458953857421875, 0.026325702667236328, 0.028061866760253906, 0.029798030853271484, 0.03153419494628906, 0.03327035903930664, 0.03500652313232422, 0.0367426872253418, 0.038478851318359375, 0.04021501541137695, 0.04195117950439453, 0.04368734359741211, 0.04542350769042969, 0.047159671783447266, 0.048895835876464844, 0.05063199996948242, 0.0523681640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 1.0, 6.0, 13.0, 10.0, 15.0, 19.0, 25.0, 38.0, 35.0, 43.0, 51.0, 107.0, 98.0, 88.0, 104.0, 68.0, 83.0, 38.0, 23.0, 27.0, 35.0, 10.0, 14.0, 7.0, 6.0, 9.0, 4.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.066394805908203e-06, -4.934147000312805e-06, -4.801899194717407e-06, -4.669651389122009e-06, -4.537403583526611e-06, -4.405155777931213e-06, -4.2729079723358154e-06, -4.1406601667404175e-06, -4.0084123611450195e-06, -3.876164555549622e-06, -3.7439167499542236e-06, -3.6116689443588257e-06, -3.4794211387634277e-06, -3.3471733331680298e-06, -3.214925527572632e-06, -3.082677721977234e-06, -2.950429916381836e-06, -2.818182110786438e-06, -2.68593430519104e-06, -2.553686499595642e-06, -2.421438694000244e-06, -2.289190888404846e-06, -2.1569430828094482e-06, -2.0246952772140503e-06, -1.8924474716186523e-06, -1.7601996660232544e-06, -1.6279518604278564e-06, -1.4957040548324585e-06, -1.3634562492370605e-06, -1.2312084436416626e-06, -1.0989606380462646e-06, -9.667128324508667e-07, -8.344650268554688e-07, -7.022172212600708e-07, -5.699694156646729e-07, -4.377216100692749e-07, -3.0547380447387695e-07, -1.73225998878479e-07, -4.0978193283081055e-08, 9.12696123123169e-08, 2.2351741790771484e-07, 3.557652235031128e-07, 4.880130290985107e-07, 6.202608346939087e-07, 7.525086402893066e-07, 8.847564458847046e-07, 1.0170042514801025e-06, 1.1492520570755005e-06, 1.2814998626708984e-06, 1.4137476682662964e-06, 1.5459954738616943e-06, 1.6782432794570923e-06, 1.8104910850524902e-06, 1.942738890647888e-06, 2.074986696243286e-06, 2.207234501838684e-06, 2.339482307434082e-06, 2.47173011302948e-06, 2.603977918624878e-06, 2.736225724220276e-06, 2.868473529815674e-06, 3.0007213354110718e-06, 3.1329691410064697e-06, 3.2652169466018677e-06, 3.3974647521972656e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 7.0, 15.0, 19.0, 28.0, 46.0, 63.0, 87.0, 96.0, 163.0, 220.0, 326.0, 479.0, 702.0, 1014.0, 1582.0, 2438.0, 3886.0, 6390.0, 10827.0, 19547.0, 37826.0, 86642.0, 253736.0, 387887.0, 124790.0, 50779.0, 24612.0, 13348.0, 7739.0, 4611.0, 2974.0, 1841.0, 1242.0, 794.0, 558.0, 355.0, 265.0, 195.0, 107.0, 104.0, 61.0, 45.0, 32.0, 25.0, 11.0, 8.0, 11.0, 5.0, 6.0, 5.0, 1.0], "bins": [-0.04522705078125, -0.04397726058959961, -0.04272747039794922, -0.04147768020629883, -0.04022789001464844, -0.03897809982299805, -0.037728309631347656, -0.036478519439697266, -0.035228729248046875, -0.033978939056396484, -0.032729148864746094, -0.0314793586730957, -0.030229568481445312, -0.028979778289794922, -0.02772998809814453, -0.02648019790649414, -0.02523040771484375, -0.02398061752319336, -0.02273082733154297, -0.021481037139892578, -0.020231246948242188, -0.018981456756591797, -0.017731666564941406, -0.016481876373291016, -0.015232086181640625, -0.013982295989990234, -0.012732505798339844, -0.011482715606689453, -0.010232925415039062, -0.008983135223388672, -0.007733345031738281, -0.006483554840087891, -0.0052337646484375, -0.003983974456787109, -0.0027341842651367188, -0.0014843940734863281, -0.0002346038818359375, 0.0010151863098144531, 0.0022649765014648438, 0.0035147666931152344, 0.004764556884765625, 0.006014347076416016, 0.007264137268066406, 0.008513927459716797, 0.009763717651367188, 0.011013507843017578, 0.012263298034667969, 0.01351308822631836, 0.01476287841796875, 0.01601266860961914, 0.01726245880126953, 0.018512248992919922, 0.019762039184570312, 0.021011829376220703, 0.022261619567871094, 0.023511409759521484, 0.024761199951171875, 0.026010990142822266, 0.027260780334472656, 0.028510570526123047, 0.029760360717773438, 0.031010150909423828, 0.03225994110107422, 0.03350973129272461, 0.034759521484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 12.0, 6.0, 22.0, 23.0, 36.0, 41.0, 76.0, 98.0, 102.0, 115.0, 105.0, 92.0, 81.0, 55.0, 39.0, 24.0, 28.0, 15.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225372314453125, -0.021826982498168945, -0.02111673355102539, -0.020406484603881836, -0.01969623565673828, -0.018985986709594727, -0.018275737762451172, -0.017565488815307617, -0.016855239868164062, -0.016144990921020508, -0.015434741973876953, -0.014724493026733398, -0.014014244079589844, -0.013303995132446289, -0.012593746185302734, -0.01188349723815918, -0.011173248291015625, -0.01046299934387207, -0.009752750396728516, -0.009042501449584961, -0.008332252502441406, -0.0076220035552978516, -0.006911754608154297, -0.006201505661010742, -0.0054912567138671875, -0.004781007766723633, -0.004070758819580078, -0.0033605098724365234, -0.0026502609252929688, -0.001940011978149414, -0.0012297630310058594, -0.0005195140838623047, 0.00019073486328125, 0.0009009838104248047, 0.0016112327575683594, 0.002321481704711914, 0.0030317306518554688, 0.0037419795989990234, 0.004452228546142578, 0.005162477493286133, 0.0058727264404296875, 0.006582975387573242, 0.007293224334716797, 0.008003473281860352, 0.008713722229003906, 0.009423971176147461, 0.010134220123291016, 0.01084446907043457, 0.011554718017578125, 0.01226496696472168, 0.012975215911865234, 0.013685464859008789, 0.014395713806152344, 0.015105962753295898, 0.015816211700439453, 0.016526460647583008, 0.017236709594726562, 0.017946958541870117, 0.018657207489013672, 0.019367456436157227, 0.02007770538330078, 0.020787954330444336, 0.02149820327758789, 0.022208452224731445, 0.022918701171875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 9.0, 5.0, 15.0, 12.0, 19.0, 15.0, 27.0, 23.0, 29.0, 53.0, 55.0, 61.0, 92.0, 92.0, 98.0, 79.0, 56.0, 51.0, 42.0, 33.0, 24.0, 15.0, 11.0, 10.0, 10.0, 10.0, 5.0, 6.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.0635896921157837, -1.0320584774017334, -1.000527262687683, -0.968995988368988, -0.9374647736549377, -0.9059335589408875, -0.8744022846221924, -0.8428710699081421, -0.8113398551940918, -0.7798086404800415, -0.7482774257659912, -0.7167461514472961, -0.6852149367332458, -0.6536837220191956, -0.6221524477005005, -0.5906212329864502, -0.5590900182723999, -0.5275588035583496, -0.49602755904197693, -0.46449631452560425, -0.43296509981155396, -0.40143388509750366, -0.369902640581131, -0.3383713960647583, -0.306840181350708, -0.2753089666366577, -0.24377772212028503, -0.21224649250507355, -0.18071526288986206, -0.14918403327465057, -0.11765280365943909, -0.0861215740442276, -0.05459022521972656, -0.023058995604515076, 0.008472234010696411, 0.0400034636259079, 0.07153469324111938, 0.10306592285633087, 0.13459715247154236, 0.16612838208675385, 0.19765961170196533, 0.22919084131717682, 0.2607220709323883, 0.292253315448761, 0.3237845301628113, 0.3553157448768616, 0.38684698939323425, 0.41837823390960693, 0.4499094486236572, 0.4814406633377075, 0.5129718780517578, 0.5445031523704529, 0.5760343670845032, 0.6075655817985535, 0.6390968561172485, 0.6706280708312988, 0.7021592855453491, 0.7336905002593994, 0.7652217149734497, 0.7967529892921448, 0.8282842040061951, 0.8598154187202454, 0.8913466930389404, 0.9228779077529907, 0.954409122467041]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 3.0, 3.0, 6.0, 8.0, 14.0, 12.0, 21.0, 21.0, 21.0, 28.0, 39.0, 28.0, 32.0, 35.0, 43.0, 36.0, 41.0, 38.0, 41.0, 40.0, 48.0, 33.0, 41.0, 49.0, 36.0, 24.0, 40.0, 31.0, 22.0, 24.0, 24.0, 19.0, 18.0, 16.0, 17.0, 9.0, 9.0, 6.0, 6.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9225988388061523, -0.897320032119751, -0.8720412254333496, -0.8467624187469482, -0.8214836120605469, -0.7962048053741455, -0.7709259390830994, -0.745647132396698, -0.7203683257102966, -0.6950895190238953, -0.6698107123374939, -0.6445319056510925, -0.6192530393600464, -0.593974232673645, -0.5686954259872437, -0.5434166193008423, -0.5181378126144409, -0.49285900592803955, -0.4675801992416382, -0.44230136275291443, -0.41702255606651306, -0.3917437493801117, -0.36646491289138794, -0.3411861062049866, -0.3159072995185852, -0.29062849283218384, -0.26534968614578247, -0.24007084965705872, -0.21479204297065735, -0.18951323628425598, -0.16423441469669342, -0.13895559310913086, -0.11367684602737427, -0.0883980318903923, -0.06311921775341034, -0.037840403616428375, -0.012561589479446411, 0.012717217206954956, 0.03799603879451752, 0.06327486038208008, 0.08855366706848145, 0.11383248120546341, 0.13911129534244537, 0.16439011693000793, 0.1896689236164093, 0.21494773030281067, 0.24022655189037323, 0.2655053734779358, 0.29078418016433716, 0.3160629868507385, 0.3413417935371399, 0.36662063002586365, 0.391899436712265, 0.4171782433986664, 0.44245707988739014, 0.4677358865737915, 0.49301469326019287, 0.5182934999465942, 0.5435723066329956, 0.568851113319397, 0.5941299200057983, 0.6194087266921997, 0.6446875929832458, 0.6699663996696472, 0.6952452063560486]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 14.0, 13.0, 24.0, 63.0, 55.0, 73.0, 108.0, 180.0, 286.0, 371.0, 552.0, 791.0, 1196.0, 1737.0, 2573.0, 3696.0, 5716.0, 8909.0, 13727.0, 22111.0, 35671.0, 59920.0, 105410.0, 191320.0, 243213.0, 145339.0, 79932.0, 46630.0, 28234.0, 17768.0, 11184.0, 7261.0, 4764.0, 3158.0, 2087.0, 1417.0, 938.0, 666.0, 434.0, 345.0, 201.0, 136.0, 101.0, 82.0, 51.0, 27.0, 25.0, 20.0, 9.0, 4.0, 1.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2041015625, -1.16558837890625, -1.1270751953125, -1.08856201171875, -1.050048828125, -1.01153564453125, -0.9730224609375, -0.93450927734375, -0.89599609375, -0.85748291015625, -0.8189697265625, -0.78045654296875, -0.741943359375, -0.70343017578125, -0.6649169921875, -0.62640380859375, -0.587890625, -0.54937744140625, -0.5108642578125, -0.47235107421875, -0.433837890625, -0.39532470703125, -0.3568115234375, -0.31829833984375, -0.27978515625, -0.24127197265625, -0.2027587890625, -0.16424560546875, -0.125732421875, -0.08721923828125, -0.0487060546875, -0.01019287109375, 0.0283203125, 0.06683349609375, 0.1053466796875, 0.14385986328125, 0.182373046875, 0.22088623046875, 0.2593994140625, 0.29791259765625, 0.33642578125, 0.37493896484375, 0.4134521484375, 0.45196533203125, 0.490478515625, 0.52899169921875, 0.5675048828125, 0.60601806640625, 0.64453125, 0.68304443359375, 0.7215576171875, 0.76007080078125, 0.798583984375, 0.83709716796875, 0.8756103515625, 0.91412353515625, 0.95263671875, 0.99114990234375, 1.0296630859375, 1.06817626953125, 1.106689453125, 1.14520263671875, 1.1837158203125, 1.22222900390625, 1.2607421875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 1.0, 3.0, 6.0, 3.0, 3.0, 8.0, 6.0, 18.0, 19.0, 24.0, 25.0, 23.0, 38.0, 26.0, 30.0, 40.0, 49.0, 26.0, 38.0, 39.0, 39.0, 40.0, 46.0, 51.0, 40.0, 38.0, 37.0, 35.0, 35.0, 32.0, 21.0, 28.0, 19.0, 20.0, 15.0, 15.0, 12.0, 15.0, 12.0, 7.0, 8.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.7285308837890625, -0.705596923828125, -0.6826629638671875, -0.65972900390625, -0.6367950439453125, -0.613861083984375, -0.5909271240234375, -0.5679931640625, -0.5450592041015625, -0.522125244140625, -0.4991912841796875, -0.47625732421875, -0.4533233642578125, -0.430389404296875, -0.4074554443359375, -0.384521484375, -0.3615875244140625, -0.338653564453125, -0.3157196044921875, -0.29278564453125, -0.2698516845703125, -0.246917724609375, -0.2239837646484375, -0.2010498046875, -0.1781158447265625, -0.155181884765625, -0.1322479248046875, -0.10931396484375, -0.0863800048828125, -0.063446044921875, -0.0405120849609375, -0.017578125, 0.0053558349609375, 0.028289794921875, 0.0512237548828125, 0.07415771484375, 0.0970916748046875, 0.120025634765625, 0.1429595947265625, 0.1658935546875, 0.1888275146484375, 0.211761474609375, 0.2346954345703125, 0.25762939453125, 0.2805633544921875, 0.303497314453125, 0.3264312744140625, 0.349365234375, 0.3722991943359375, 0.395233154296875, 0.4181671142578125, 0.44110107421875, 0.4640350341796875, 0.486968994140625, 0.5099029541015625, 0.5328369140625, 0.5557708740234375, 0.578704833984375, 0.6016387939453125, 0.62457275390625, 0.6475067138671875, 0.670440673828125, 0.6933746337890625, 0.71630859375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 8.0, 13.0, 19.0, 24.0, 25.0, 30.0, 38.0, 69.0, 114.0, 131.0, 207.0, 327.0, 430.0, 613.0, 948.0, 1375.0, 2211.0, 3398.0, 5252.0, 8542.0, 14078.0, 23943.0, 41604.0, 78313.0, 161332.0, 308289.0, 191351.0, 89839.0, 47796.0, 26495.0, 15534.0, 9366.0, 5856.0, 3713.0, 2428.0, 1574.0, 1062.0, 665.0, 499.0, 319.0, 192.0, 160.0, 114.0, 71.0, 53.0, 40.0, 26.0, 21.0, 9.0, 14.0, 7.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0], "bins": [-1.4228515625, -1.37921142578125, -1.3355712890625, -1.29193115234375, -1.248291015625, -1.20465087890625, -1.1610107421875, -1.11737060546875, -1.07373046875, -1.03009033203125, -0.9864501953125, -0.94281005859375, -0.899169921875, -0.85552978515625, -0.8118896484375, -0.76824951171875, -0.724609375, -0.68096923828125, -0.6373291015625, -0.59368896484375, -0.550048828125, -0.50640869140625, -0.4627685546875, -0.41912841796875, -0.37548828125, -0.33184814453125, -0.2882080078125, -0.24456787109375, -0.200927734375, -0.15728759765625, -0.1136474609375, -0.07000732421875, -0.0263671875, 0.01727294921875, 0.0609130859375, 0.10455322265625, 0.148193359375, 0.19183349609375, 0.2354736328125, 0.27911376953125, 0.32275390625, 0.36639404296875, 0.4100341796875, 0.45367431640625, 0.497314453125, 0.54095458984375, 0.5845947265625, 0.62823486328125, 0.671875, 0.71551513671875, 0.7591552734375, 0.80279541015625, 0.846435546875, 0.89007568359375, 0.9337158203125, 0.97735595703125, 1.02099609375, 1.06463623046875, 1.1082763671875, 1.15191650390625, 1.195556640625, 1.23919677734375, 1.2828369140625, 1.32647705078125, 1.3701171875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 6.0, 9.0, 10.0, 20.0, 13.0, 20.0, 30.0, 23.0, 28.0, 32.0, 29.0, 27.0, 36.0, 36.0, 26.0, 34.0, 37.0, 37.0, 32.0, 50.0, 34.0, 34.0, 26.0, 33.0, 50.0, 41.0, 26.0, 31.0, 27.0, 22.0, 15.0, 15.0, 20.0, 11.0, 9.0, 13.0, 7.0, 5.0, 8.0, 3.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.427734375, -0.4144783020019531, -0.40122222900390625, -0.3879661560058594, -0.3747100830078125, -0.3614540100097656, -0.34819793701171875, -0.3349418640136719, -0.321685791015625, -0.3084297180175781, -0.29517364501953125, -0.2819175720214844, -0.2686614990234375, -0.2554054260253906, -0.24214935302734375, -0.22889328002929688, -0.21563720703125, -0.20238113403320312, -0.18912506103515625, -0.17586898803710938, -0.1626129150390625, -0.14935684204101562, -0.13610076904296875, -0.12284469604492188, -0.109588623046875, -0.09633255004882812, -0.08307647705078125, -0.06982040405273438, -0.0565643310546875, -0.043308258056640625, -0.03005218505859375, -0.016796112060546875, -0.0035400390625, 0.009716033935546875, 0.02297210693359375, 0.036228179931640625, 0.0494842529296875, 0.06274032592773438, 0.07599639892578125, 0.08925247192382812, 0.102508544921875, 0.11576461791992188, 0.12902069091796875, 0.14227676391601562, 0.1555328369140625, 0.16878890991210938, 0.18204498291015625, 0.19530105590820312, 0.20855712890625, 0.22181320190429688, 0.23506927490234375, 0.24832534790039062, 0.2615814208984375, 0.2748374938964844, 0.28809356689453125, 0.3013496398925781, 0.314605712890625, 0.3278617858886719, 0.34111785888671875, 0.3543739318847656, 0.3676300048828125, 0.3808860778808594, 0.39414215087890625, 0.4073982238769531, 0.420654296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 7.0, 15.0, 11.0, 15.0, 21.0, 24.0, 43.0, 45.0, 94.0, 145.0, 177.0, 260.0, 437.0, 694.0, 1150.0, 1849.0, 3110.0, 5162.0, 9357.0, 16799.0, 33983.0, 89317.0, 702104.0, 104428.0, 37148.0, 18136.0, 9872.0, 5582.0, 3308.0, 1964.0, 1174.0, 687.0, 485.0, 292.0, 213.0, 133.0, 85.0, 71.0, 50.0, 26.0, 30.0, 19.0, 13.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.184326171875, -1.14794921875, -1.111572265625, -1.0751953125, -1.038818359375, -1.00244140625, -0.966064453125, -0.9296875, -0.893310546875, -0.85693359375, -0.820556640625, -0.7841796875, -0.747802734375, -0.71142578125, -0.675048828125, -0.638671875, -0.602294921875, -0.56591796875, -0.529541015625, -0.4931640625, -0.456787109375, -0.42041015625, -0.384033203125, -0.34765625, -0.311279296875, -0.27490234375, -0.238525390625, -0.2021484375, -0.165771484375, -0.12939453125, -0.093017578125, -0.056640625, -0.020263671875, 0.01611328125, 0.052490234375, 0.0888671875, 0.125244140625, 0.16162109375, 0.197998046875, 0.234375, 0.270751953125, 0.30712890625, 0.343505859375, 0.3798828125, 0.416259765625, 0.45263671875, 0.489013671875, 0.525390625, 0.561767578125, 0.59814453125, 0.634521484375, 0.6708984375, 0.707275390625, 0.74365234375, 0.780029296875, 0.81640625, 0.852783203125, 0.88916015625, 0.925537109375, 0.9619140625, 0.998291015625, 1.03466796875, 1.071044921875, 1.107421875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 4.0, 9.0, 10.0, 7.0, 13.0, 22.0, 20.0, 31.0, 31.0, 54.0, 75.0, 245.0, 165.0, 63.0, 49.0, 44.0, 31.0, 15.0, 16.0, 13.0, 6.0, 9.0, 8.0, 6.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.2649765014648438e-05, -2.1938234567642212e-05, -2.1226704120635986e-05, -2.051517367362976e-05, -1.9803643226623535e-05, -1.909211277961731e-05, -1.8380582332611084e-05, -1.766905188560486e-05, -1.6957521438598633e-05, -1.6245990991592407e-05, -1.553446054458618e-05, -1.4822930097579956e-05, -1.411139965057373e-05, -1.3399869203567505e-05, -1.268833875656128e-05, -1.1976808309555054e-05, -1.1265277862548828e-05, -1.0553747415542603e-05, -9.842216968536377e-06, -9.130686521530151e-06, -8.419156074523926e-06, -7.7076256275177e-06, -6.996095180511475e-06, -6.284564733505249e-06, -5.5730342864990234e-06, -4.861503839492798e-06, -4.149973392486572e-06, -3.4384429454803467e-06, -2.726912498474121e-06, -2.0153820514678955e-06, -1.30385160446167e-06, -5.923211574554443e-07, 1.1920928955078125e-07, 8.307397365570068e-07, 1.5422701835632324e-06, 2.253800630569458e-06, 2.9653310775756836e-06, 3.676861524581909e-06, 4.388391971588135e-06, 5.09992241859436e-06, 5.811452865600586e-06, 6.5229833126068115e-06, 7.234513759613037e-06, 7.946044206619263e-06, 8.657574653625488e-06, 9.369105100631714e-06, 1.008063554763794e-05, 1.0792165994644165e-05, 1.150369644165039e-05, 1.2215226888656616e-05, 1.2926757335662842e-05, 1.3638287782669067e-05, 1.4349818229675293e-05, 1.5061348676681519e-05, 1.5772879123687744e-05, 1.648440957069397e-05, 1.7195940017700195e-05, 1.790747046470642e-05, 1.8619000911712646e-05, 1.9330531358718872e-05, 2.0042061805725098e-05, 2.0753592252731323e-05, 2.146512269973755e-05, 2.2176653146743774e-05, 2.288818359375e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 11.0, 14.0, 19.0, 37.0, 59.0, 76.0, 111.0, 153.0, 246.0, 344.0, 544.0, 808.0, 1333.0, 2041.0, 3546.0, 5993.0, 11060.0, 22308.0, 53917.0, 597204.0, 254153.0, 48818.0, 20565.0, 10468.0, 5735.0, 3330.0, 2026.0, 1245.0, 824.0, 503.0, 341.0, 240.0, 150.0, 99.0, 65.0, 46.0, 36.0, 23.0, 17.0, 12.0, 6.0, 3.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4365234375, -1.3929290771484375, -1.349334716796875, -1.3057403564453125, -1.26214599609375, -1.2185516357421875, -1.174957275390625, -1.1313629150390625, -1.0877685546875, -1.0441741943359375, -1.000579833984375, -0.9569854736328125, -0.91339111328125, -0.8697967529296875, -0.826202392578125, -0.7826080322265625, -0.739013671875, -0.6954193115234375, -0.651824951171875, -0.6082305908203125, -0.56463623046875, -0.5210418701171875, -0.477447509765625, -0.4338531494140625, -0.3902587890625, -0.3466644287109375, -0.303070068359375, -0.2594757080078125, -0.21588134765625, -0.1722869873046875, -0.128692626953125, -0.0850982666015625, -0.04150390625, 0.0020904541015625, 0.045684814453125, 0.0892791748046875, 0.13287353515625, 0.1764678955078125, 0.220062255859375, 0.2636566162109375, 0.3072509765625, 0.3508453369140625, 0.394439697265625, 0.4380340576171875, 0.48162841796875, 0.5252227783203125, 0.568817138671875, 0.6124114990234375, 0.656005859375, 0.6996002197265625, 0.743194580078125, 0.7867889404296875, 0.83038330078125, 0.8739776611328125, 0.917572021484375, 0.9611663818359375, 1.0047607421875, 1.0483551025390625, 1.091949462890625, 1.1355438232421875, 1.17913818359375, 1.2227325439453125, 1.266326904296875, 1.3099212646484375, 1.353515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 6.0, 8.0, 8.0, 6.0, 17.0, 17.0, 21.0, 31.0, 33.0, 58.0, 76.0, 368.0, 89.0, 55.0, 44.0, 30.0, 21.0, 20.0, 13.0, 15.0, 8.0, 12.0, 7.0, 8.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42919921875, -0.4175071716308594, -0.40581512451171875, -0.3941230773925781, -0.3824310302734375, -0.3707389831542969, -0.35904693603515625, -0.3473548889160156, -0.335662841796875, -0.3239707946777344, -0.31227874755859375, -0.3005867004394531, -0.2888946533203125, -0.2772026062011719, -0.26551055908203125, -0.2538185119628906, -0.24212646484375, -0.23043441772460938, -0.21874237060546875, -0.20705032348632812, -0.1953582763671875, -0.18366622924804688, -0.17197418212890625, -0.16028213500976562, -0.148590087890625, -0.13689804077148438, -0.12520599365234375, -0.11351394653320312, -0.1018218994140625, -0.09012985229492188, -0.07843780517578125, -0.06674575805664062, -0.0550537109375, -0.043361663818359375, -0.03166961669921875, -0.019977569580078125, -0.0082855224609375, 0.003406524658203125, 0.01509857177734375, 0.026790618896484375, 0.038482666015625, 0.050174713134765625, 0.06186676025390625, 0.07355880737304688, 0.0852508544921875, 0.09694290161132812, 0.10863494873046875, 0.12032699584960938, 0.13201904296875, 0.14371109008789062, 0.15540313720703125, 0.16709518432617188, 0.1787872314453125, 0.19047927856445312, 0.20217132568359375, 0.21386337280273438, 0.225555419921875, 0.23724746704101562, 0.24893951416015625, 0.2606315612792969, 0.2723236083984375, 0.2840156555175781, 0.29570770263671875, 0.3073997497558594, 0.319091796875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 11.0, 9.0, 12.0, 22.0, 25.0, 31.0, 31.0, 55.0, 63.0, 85.0, 94.0, 103.0, 95.0, 57.0, 56.0, 38.0, 29.0, 29.0, 23.0, 13.0, 15.0, 11.0, 14.0, 8.0, 15.0, 5.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8605236411094666, -0.8299636244773865, -0.7994035482406616, -0.7688435316085815, -0.7382835149765015, -0.7077234983444214, -0.6771634817123413, -0.6466034054756165, -0.6160433888435364, -0.5854833722114563, -0.5549232959747314, -0.5243632793426514, -0.4938032627105713, -0.4632432460784912, -0.43268319964408875, -0.4021231532096863, -0.3715631365776062, -0.3410031199455261, -0.31044307351112366, -0.2798830270767212, -0.2493230104446411, -0.21876297891139984, -0.18820294737815857, -0.1576429158449173, -0.12708288431167603, -0.09652285277843475, -0.06596282124519348, -0.03540278971195221, -0.0048427581787109375, 0.025717273354530334, 0.056277304887771606, 0.08683733642101288, 0.11739742755889893, 0.1479574590921402, 0.17851749062538147, 0.20907752215862274, 0.239637553691864, 0.2701975703239441, 0.30075761675834656, 0.331317663192749, 0.3618776798248291, 0.3924376964569092, 0.42299774289131165, 0.4535577893257141, 0.4841178059577942, 0.5146778225898743, 0.5452378988265991, 0.5757979154586792, 0.6063579320907593, 0.6369179487228394, 0.6674779653549194, 0.6980380415916443, 0.7285980582237244, 0.7591580748558044, 0.7897181510925293, 0.8202781677246094, 0.8508381843566895, 0.8813982009887695, 0.9119582176208496, 0.9425182938575745, 0.9730783104896545, 1.0036383867263794, 1.0341984033584595, 1.0647584199905396, 1.0953184366226196]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 8.0, 4.0, 2.0, 6.0, 7.0, 9.0, 16.0, 14.0, 16.0, 24.0, 24.0, 24.0, 28.0, 36.0, 41.0, 39.0, 31.0, 35.0, 38.0, 29.0, 40.0, 49.0, 44.0, 30.0, 41.0, 32.0, 37.0, 31.0, 26.0, 27.0, 28.0, 33.0, 28.0, 18.0, 12.0, 7.0, 19.0, 14.0, 12.0, 8.0, 3.0, 2.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7715363502502441, -0.7486935257911682, -0.7258507609367371, -0.7030079364776611, -0.6801651120185852, -0.657322347164154, -0.6344795227050781, -0.611636757850647, -0.588793933391571, -0.5659511089324951, -0.543108344078064, -0.520265519618988, -0.4974227249622345, -0.47457993030548096, -0.45173710584640503, -0.4288943111896515, -0.40605148673057556, -0.383208692073822, -0.3603658676147461, -0.33752307295799255, -0.314680278301239, -0.2918374538421631, -0.26899465918540955, -0.246151864528656, -0.22330905497074127, -0.20046624541282654, -0.177623450756073, -0.15478064119815826, -0.13193783164024353, -0.10909503698348999, -0.08625222742557526, -0.06340943276882172, -0.04056662321090698, -0.017723819240927696, 0.00511898472905159, 0.027961790561676025, 0.05080459266901016, 0.0736473947763443, 0.09649020433425903, 0.11933299899101257, 0.1421758085489273, 0.16501861810684204, 0.18786141276359558, 0.21070422232151031, 0.23354703187942505, 0.2563898265361786, 0.27923262119293213, 0.30207544565200806, 0.3249182403087616, 0.34776103496551514, 0.37060385942459106, 0.3934466540813446, 0.41628944873809814, 0.4391322731971741, 0.4619750678539276, 0.48481786251068115, 0.5076606869697571, 0.530503511428833, 0.5533462762832642, 0.5761891007423401, 0.599031925201416, 0.6218746900558472, 0.6447175145149231, 0.667560338973999, 0.6904031038284302]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 11.0, 9.0, 15.0, 23.0, 45.0, 52.0, 79.0, 140.0, 191.0, 322.0, 480.0, 660.0, 1021.0, 1563.0, 2328.0, 3487.0, 5765.0, 8617.0, 13460.0, 21612.0, 35546.0, 61092.0, 109102.0, 222796.0, 626703.0, 1691805.0, 827337.0, 266236.0, 124779.0, 67344.0, 38446.0, 23513.0, 14473.0, 9000.0, 5627.0, 3714.0, 2372.0, 1577.0, 1001.0, 665.0, 439.0, 314.0, 180.0, 128.0, 80.0, 45.0, 29.0, 27.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.98779296875, -0.957489013671875, -0.92718505859375, -0.896881103515625, -0.8665771484375, -0.836273193359375, -0.80596923828125, -0.775665283203125, -0.745361328125, -0.715057373046875, -0.68475341796875, -0.654449462890625, -0.6241455078125, -0.593841552734375, -0.56353759765625, -0.533233642578125, -0.5029296875, -0.472625732421875, -0.44232177734375, -0.412017822265625, -0.3817138671875, -0.351409912109375, -0.32110595703125, -0.290802001953125, -0.260498046875, -0.230194091796875, -0.19989013671875, -0.169586181640625, -0.1392822265625, -0.108978271484375, -0.07867431640625, -0.048370361328125, -0.01806640625, 0.012237548828125, 0.04254150390625, 0.072845458984375, 0.1031494140625, 0.133453369140625, 0.16375732421875, 0.194061279296875, 0.224365234375, 0.254669189453125, 0.28497314453125, 0.315277099609375, 0.3455810546875, 0.375885009765625, 0.40618896484375, 0.436492919921875, 0.466796875, 0.497100830078125, 0.52740478515625, 0.557708740234375, 0.5880126953125, 0.618316650390625, 0.64862060546875, 0.678924560546875, 0.709228515625, 0.739532470703125, 0.76983642578125, 0.800140380859375, 0.8304443359375, 0.860748291015625, 0.89105224609375, 0.921356201171875, 0.95166015625]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 2.0, 5.0, 6.0, 1.0, 12.0, 16.0, 15.0, 10.0, 27.0, 23.0, 20.0, 30.0, 27.0, 41.0, 30.0, 37.0, 38.0, 37.0, 39.0, 38.0, 42.0, 46.0, 37.0, 33.0, 35.0, 46.0, 36.0, 24.0, 32.0, 30.0, 32.0, 24.0, 11.0, 17.0, 15.0, 16.0, 11.0, 15.0, 13.0, 4.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4638671875, -0.4497528076171875, -0.435638427734375, -0.4215240478515625, -0.40740966796875, -0.3932952880859375, -0.379180908203125, -0.3650665283203125, -0.3509521484375, -0.3368377685546875, -0.322723388671875, -0.3086090087890625, -0.29449462890625, -0.2803802490234375, -0.266265869140625, -0.2521514892578125, -0.238037109375, -0.2239227294921875, -0.209808349609375, -0.1956939697265625, -0.18157958984375, -0.1674652099609375, -0.153350830078125, -0.1392364501953125, -0.1251220703125, -0.1110076904296875, -0.096893310546875, -0.0827789306640625, -0.06866455078125, -0.0545501708984375, -0.040435791015625, -0.0263214111328125, -0.01220703125, 0.0019073486328125, 0.016021728515625, 0.0301361083984375, 0.04425048828125, 0.0583648681640625, 0.072479248046875, 0.0865936279296875, 0.1007080078125, 0.1148223876953125, 0.128936767578125, 0.1430511474609375, 0.15716552734375, 0.1712799072265625, 0.185394287109375, 0.1995086669921875, 0.213623046875, 0.2277374267578125, 0.241851806640625, 0.2559661865234375, 0.27008056640625, 0.2841949462890625, 0.298309326171875, 0.3124237060546875, 0.3265380859375, 0.3406524658203125, 0.354766845703125, 0.3688812255859375, 0.38299560546875, 0.3971099853515625, 0.411224365234375, 0.4253387451171875, 0.439453125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 9.0, 10.0, 13.0, 21.0, 28.0, 49.0, 69.0, 104.0, 151.0, 251.0, 323.0, 575.0, 873.0, 1371.0, 2169.0, 3436.0, 5593.0, 9186.0, 14627.0, 24803.0, 41223.0, 71556.0, 129776.0, 259307.0, 594795.0, 1472443.0, 845356.0, 339505.0, 163061.0, 87956.0, 49953.0, 29518.0, 17608.0, 10661.0, 6514.0, 4209.0, 2564.0, 1614.0, 1086.0, 666.0, 444.0, 286.0, 186.0, 115.0, 71.0, 50.0, 36.0, 20.0, 15.0, 9.0, 11.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.802734375, -0.778167724609375, -0.75360107421875, -0.729034423828125, -0.7044677734375, -0.679901123046875, -0.65533447265625, -0.630767822265625, -0.606201171875, -0.581634521484375, -0.55706787109375, -0.532501220703125, -0.5079345703125, -0.483367919921875, -0.45880126953125, -0.434234619140625, -0.40966796875, -0.385101318359375, -0.36053466796875, -0.335968017578125, -0.3114013671875, -0.286834716796875, -0.26226806640625, -0.237701416015625, -0.213134765625, -0.188568115234375, -0.16400146484375, -0.139434814453125, -0.1148681640625, -0.090301513671875, -0.06573486328125, -0.041168212890625, -0.0166015625, 0.007965087890625, 0.03253173828125, 0.057098388671875, 0.0816650390625, 0.106231689453125, 0.13079833984375, 0.155364990234375, 0.179931640625, 0.204498291015625, 0.22906494140625, 0.253631591796875, 0.2781982421875, 0.302764892578125, 0.32733154296875, 0.351898193359375, 0.37646484375, 0.401031494140625, 0.42559814453125, 0.450164794921875, 0.4747314453125, 0.499298095703125, 0.52386474609375, 0.548431396484375, 0.572998046875, 0.597564697265625, 0.62213134765625, 0.646697998046875, 0.6712646484375, 0.695831298828125, 0.72039794921875, 0.744964599609375, 0.76953125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 14.0, 13.0, 19.0, 22.0, 32.0, 58.0, 53.0, 71.0, 81.0, 104.0, 140.0, 144.0, 208.0, 208.0, 270.0, 278.0, 284.0, 311.0, 298.0, 252.0, 211.0, 176.0, 157.0, 132.0, 105.0, 79.0, 72.0, 70.0, 52.0, 42.0, 33.0, 27.0, 10.0, 5.0, 6.0, 6.0, 4.0, 5.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2763671875, -0.2680320739746094, -0.25969696044921875, -0.2513618469238281, -0.2430267333984375, -0.23469161987304688, -0.22635650634765625, -0.21802139282226562, -0.209686279296875, -0.20135116577148438, -0.19301605224609375, -0.18468093872070312, -0.1763458251953125, -0.16801071166992188, -0.15967559814453125, -0.15134048461914062, -0.14300537109375, -0.13467025756835938, -0.12633514404296875, -0.11800003051757812, -0.1096649169921875, -0.10132980346679688, -0.09299468994140625, -0.08465957641601562, -0.076324462890625, -0.06798934936523438, -0.05965423583984375, -0.051319122314453125, -0.0429840087890625, -0.034648895263671875, -0.02631378173828125, -0.017978668212890625, -0.0096435546875, -0.001308441162109375, 0.00702667236328125, 0.015361785888671875, 0.0236968994140625, 0.032032012939453125, 0.04036712646484375, 0.048702239990234375, 0.057037353515625, 0.06537246704101562, 0.07370758056640625, 0.08204269409179688, 0.0903778076171875, 0.09871292114257812, 0.10704803466796875, 0.11538314819335938, 0.12371826171875, 0.13205337524414062, 0.14038848876953125, 0.14872360229492188, 0.1570587158203125, 0.16539382934570312, 0.17372894287109375, 0.18206405639648438, 0.190399169921875, 0.19873428344726562, 0.20706939697265625, 0.21540451049804688, 0.2237396240234375, 0.23207473754882812, 0.24040985107421875, 0.24874496459960938, 0.257080078125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 5.0, 3.0, 8.0, 3.0, 14.0, 9.0, 11.0, 14.0, 24.0, 23.0, 21.0, 31.0, 33.0, 46.0, 54.0, 87.0, 68.0, 76.0, 74.0, 61.0, 62.0, 46.0, 30.0, 29.0, 33.0, 19.0, 22.0, 10.0, 11.0, 8.0, 12.0, 10.0, 9.0, 7.0, 2.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5192223787307739, -0.5011470913887024, -0.48307186365127563, -0.4649966061115265, -0.44692134857177734, -0.4288460612297058, -0.41077080368995667, -0.3926955461502075, -0.3746202886104584, -0.35654503107070923, -0.3384697735309601, -0.32039451599121094, -0.3023192286491394, -0.28424400091171265, -0.2661687135696411, -0.24809345602989197, -0.23001819849014282, -0.21194294095039368, -0.19386768341064453, -0.1757924109697342, -0.15771715342998505, -0.1396418958902359, -0.12156663089990616, -0.10349136590957642, -0.08541610836982727, -0.06734085083007812, -0.04926558583974838, -0.03119032457470894, -0.013115063309669495, 0.004960194230079651, 0.023035459220409393, 0.041110724210739136, 0.059185922145843506, 0.07726117968559265, 0.0953364446759224, 0.11341170966625214, 0.13148696720600128, 0.14956222474575043, 0.16763749718666077, 0.1857127547264099, 0.20378801226615906, 0.2218632698059082, 0.23993852734565735, 0.2580137848854065, 0.276089072227478, 0.2941642999649048, 0.3122395873069763, 0.33031484484672546, 0.3483901023864746, 0.36646535992622375, 0.3845406174659729, 0.40261587500572205, 0.4206911325454712, 0.4387664198875427, 0.45684167742729187, 0.474916934967041, 0.49299219250679016, 0.5110674500465393, 0.5291427373886108, 0.5472179651260376, 0.5652932524681091, 0.5833684802055359, 0.6014437675476074, 0.6195189952850342, 0.6375942826271057]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 9.0, 6.0, 10.0, 7.0, 13.0, 10.0, 16.0, 11.0, 15.0, 29.0, 26.0, 29.0, 25.0, 31.0, 30.0, 43.0, 31.0, 35.0, 32.0, 40.0, 30.0, 38.0, 37.0, 26.0, 45.0, 29.0, 37.0, 26.0, 38.0, 29.0, 37.0, 17.0, 25.0, 16.0, 21.0, 20.0, 16.0, 14.0, 6.0, 9.0, 6.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.5000180006027222, -0.4853484332561493, -0.4706788659095764, -0.45600929856300354, -0.44133973121643066, -0.4266701936721802, -0.4120005965232849, -0.3973310589790344, -0.38266149163246155, -0.36799192428588867, -0.3533223569393158, -0.3386527895927429, -0.32398322224617004, -0.30931365489959717, -0.2946441173553467, -0.2799745500087738, -0.2653049826622009, -0.25063541531562805, -0.23596584796905518, -0.2212962806224823, -0.20662672817707062, -0.19195716083049774, -0.17728759348392487, -0.16261804103851318, -0.14794844388961792, -0.13327887654304504, -0.11860931664705276, -0.10393974930047989, -0.08927018940448761, -0.07460062205791473, -0.05993105471134186, -0.04526149481534958, -0.0305919349193573, -0.015922371298074722, -0.0012528058141469955, 0.013416759669780731, 0.02808632329106331, 0.042755886912345886, 0.05742545425891876, 0.07209501415491104, 0.08676458150148392, 0.1014341488480568, 0.11610370874404907, 0.13077327609062195, 0.14544284343719482, 0.1601124107837677, 0.17478197813034058, 0.18945153057575226, 0.20412109792232513, 0.218790665268898, 0.2334602326154709, 0.24812978506088257, 0.26279935240745544, 0.2774689197540283, 0.2921384871006012, 0.3068080544471741, 0.32147762179374695, 0.3361471891403198, 0.3508167564868927, 0.3654863238334656, 0.38015589118003845, 0.39482545852661133, 0.4094949960708618, 0.4241645634174347, 0.43883413076400757]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 8.0, 15.0, 25.0, 25.0, 38.0, 48.0, 79.0, 114.0, 137.0, 216.0, 282.0, 393.0, 640.0, 875.0, 1233.0, 1772.0, 2764.0, 4265.0, 6512.0, 10291.0, 16547.0, 27521.0, 46214.0, 82005.0, 149012.0, 246306.0, 192256.0, 107977.0, 59684.0, 34363.0, 20700.0, 12721.0, 7965.0, 5124.0, 3354.0, 2186.0, 1477.0, 1053.0, 669.0, 490.0, 336.0, 236.0, 181.0, 126.0, 102.0, 48.0, 46.0, 30.0, 21.0, 14.0, 13.0, 10.0, 7.0, 3.0, 6.0, 5.0, 2.0], "bins": [-0.23681640625, -0.22957992553710938, -0.22234344482421875, -0.21510696411132812, -0.2078704833984375, -0.20063400268554688, -0.19339752197265625, -0.18616104125976562, -0.178924560546875, -0.17168807983398438, -0.16445159912109375, -0.15721511840820312, -0.1499786376953125, -0.14274215698242188, -0.13550567626953125, -0.12826919555664062, -0.12103271484375, -0.11379623413085938, -0.10655975341796875, -0.09932327270507812, -0.0920867919921875, -0.08485031127929688, -0.07761383056640625, -0.07037734985351562, -0.063140869140625, -0.055904388427734375, -0.04866790771484375, -0.041431427001953125, -0.0341949462890625, -0.026958465576171875, -0.01972198486328125, -0.012485504150390625, -0.0052490234375, 0.001987457275390625, 0.00922393798828125, 0.016460418701171875, 0.0236968994140625, 0.030933380126953125, 0.03816986083984375, 0.045406341552734375, 0.052642822265625, 0.059879302978515625, 0.06711578369140625, 0.07435226440429688, 0.0815887451171875, 0.08882522583007812, 0.09606170654296875, 0.10329818725585938, 0.11053466796875, 0.11777114868164062, 0.12500762939453125, 0.13224411010742188, 0.1394805908203125, 0.14671707153320312, 0.15395355224609375, 0.16119003295898438, 0.168426513671875, 0.17566299438476562, 0.18289947509765625, 0.19013595581054688, 0.1973724365234375, 0.20460891723632812, 0.21184539794921875, 0.21908187866210938, 0.226318359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 8.0, 14.0, 10.0, 7.0, 10.0, 11.0, 24.0, 28.0, 27.0, 25.0, 25.0, 26.0, 41.0, 47.0, 36.0, 33.0, 26.0, 31.0, 40.0, 46.0, 34.0, 39.0, 34.0, 44.0, 33.0, 35.0, 21.0, 33.0, 27.0, 24.0, 21.0, 21.0, 16.0, 15.0, 17.0, 12.0, 6.0, 9.0, 6.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.4912109375, -0.4759483337402344, -0.46068572998046875, -0.4454231262207031, -0.4301605224609375, -0.4148979187011719, -0.39963531494140625, -0.3843727111816406, -0.369110107421875, -0.3538475036621094, -0.33858489990234375, -0.3233222961425781, -0.3080596923828125, -0.2927970886230469, -0.27753448486328125, -0.2622718811035156, -0.24700927734375, -0.23174667358398438, -0.21648406982421875, -0.20122146606445312, -0.1859588623046875, -0.17069625854492188, -0.15543365478515625, -0.14017105102539062, -0.124908447265625, -0.10964584350585938, -0.09438323974609375, -0.07912063598632812, -0.0638580322265625, -0.048595428466796875, -0.03333282470703125, -0.018070220947265625, -0.0028076171875, 0.012454986572265625, 0.02771759033203125, 0.042980194091796875, 0.0582427978515625, 0.07350540161132812, 0.08876800537109375, 0.10403060913085938, 0.119293212890625, 0.13455581665039062, 0.14981842041015625, 0.16508102416992188, 0.1803436279296875, 0.19560623168945312, 0.21086883544921875, 0.22613143920898438, 0.24139404296875, 0.2566566467285156, 0.27191925048828125, 0.2871818542480469, 0.3024444580078125, 0.3177070617675781, 0.33296966552734375, 0.3482322692871094, 0.363494873046875, 0.3787574768066406, 0.39402008056640625, 0.4092826843261719, 0.4245452880859375, 0.4398078918457031, 0.45507049560546875, 0.4703330993652344, 0.485595703125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 10.0, 8.0, 21.0, 25.0, 33.0, 50.0, 72.0, 94.0, 151.0, 193.0, 285.0, 426.0, 573.0, 826.0, 1293.0, 1997.0, 2968.0, 4700.0, 8064.0, 14845.0, 33425.0, 96057.0, 443098.0, 306005.0, 73294.0, 27426.0, 13102.0, 7013.0, 4195.0, 2811.0, 1783.0, 1174.0, 783.0, 527.0, 377.0, 262.0, 156.0, 127.0, 100.0, 57.0, 46.0, 27.0, 21.0, 12.0, 13.0, 10.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3858146667480469, -0.37245941162109375, -0.3591041564941406, -0.3457489013671875, -0.3323936462402344, -0.31903839111328125, -0.3056831359863281, -0.292327880859375, -0.2789726257324219, -0.26561737060546875, -0.2522621154785156, -0.2389068603515625, -0.22555160522460938, -0.21219635009765625, -0.19884109497070312, -0.18548583984375, -0.17213058471679688, -0.15877532958984375, -0.14542007446289062, -0.1320648193359375, -0.11870956420898438, -0.10535430908203125, -0.09199905395507812, -0.078643798828125, -0.06528854370117188, -0.05193328857421875, -0.038578033447265625, -0.0252227783203125, -0.011867523193359375, 0.00148773193359375, 0.014842987060546875, 0.0281982421875, 0.041553497314453125, 0.05490875244140625, 0.06826400756835938, 0.0816192626953125, 0.09497451782226562, 0.10832977294921875, 0.12168502807617188, 0.135040283203125, 0.14839553833007812, 0.16175079345703125, 0.17510604858398438, 0.1884613037109375, 0.20181655883789062, 0.21517181396484375, 0.22852706909179688, 0.24188232421875, 0.2552375793457031, 0.26859283447265625, 0.2819480895996094, 0.2953033447265625, 0.3086585998535156, 0.32201385498046875, 0.3353691101074219, 0.348724365234375, 0.3620796203613281, 0.37543487548828125, 0.3887901306152344, 0.4021453857421875, 0.4155006408691406, 0.42885589599609375, 0.4422111511230469, 0.45556640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 12.0, 9.0, 10.0, 8.0, 12.0, 8.0, 21.0, 19.0, 26.0, 26.0, 21.0, 38.0, 36.0, 37.0, 40.0, 24.0, 29.0, 33.0, 39.0, 48.0, 36.0, 44.0, 40.0, 36.0, 27.0, 30.0, 21.0, 21.0, 34.0, 25.0, 31.0, 24.0, 21.0, 11.0, 22.0, 11.0, 16.0, 11.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.287841796875, -0.2786827087402344, -0.26952362060546875, -0.2603645324707031, -0.2512054443359375, -0.24204635620117188, -0.23288726806640625, -0.22372817993164062, -0.214569091796875, -0.20541000366210938, -0.19625091552734375, -0.18709182739257812, -0.1779327392578125, -0.16877365112304688, -0.15961456298828125, -0.15045547485351562, -0.14129638671875, -0.13213729858398438, -0.12297821044921875, -0.11381912231445312, -0.1046600341796875, -0.09550094604492188, -0.08634185791015625, -0.07718276977539062, -0.068023681640625, -0.058864593505859375, -0.04970550537109375, -0.040546417236328125, -0.0313873291015625, -0.022228240966796875, -0.01306915283203125, -0.003910064697265625, 0.0052490234375, 0.014408111572265625, 0.02356719970703125, 0.032726287841796875, 0.0418853759765625, 0.051044464111328125, 0.06020355224609375, 0.06936264038085938, 0.078521728515625, 0.08768081665039062, 0.09683990478515625, 0.10599899291992188, 0.1151580810546875, 0.12431716918945312, 0.13347625732421875, 0.14263534545898438, 0.15179443359375, 0.16095352172851562, 0.17011260986328125, 0.17927169799804688, 0.1884307861328125, 0.19758987426757812, 0.20674896240234375, 0.21590805053710938, 0.225067138671875, 0.23422622680664062, 0.24338531494140625, 0.2525444030761719, 0.2617034912109375, 0.2708625793457031, 0.28002166748046875, 0.2891807556152344, 0.29833984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 10.0, 21.0, 15.0, 14.0, 35.0, 34.0, 45.0, 80.0, 68.0, 118.0, 162.0, 207.0, 259.0, 370.0, 628.0, 893.0, 1366.0, 2129.0, 3677.0, 6854.0, 15099.0, 46133.0, 594528.0, 310272.0, 36870.0, 13073.0, 6132.0, 3367.0, 1999.0, 1237.0, 846.0, 576.0, 401.0, 272.0, 186.0, 152.0, 106.0, 78.0, 66.0, 41.0, 26.0, 25.0, 22.0, 9.0, 8.0, 7.0, 10.0, 3.0, 1.0, 7.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.046722412109375, -0.0452113151550293, -0.043700218200683594, -0.04218912124633789, -0.04067802429199219, -0.039166927337646484, -0.03765583038330078, -0.03614473342895508, -0.034633636474609375, -0.03312253952026367, -0.03161144256591797, -0.030100345611572266, -0.028589248657226562, -0.02707815170288086, -0.025567054748535156, -0.024055957794189453, -0.02254486083984375, -0.021033763885498047, -0.019522666931152344, -0.01801156997680664, -0.016500473022460938, -0.014989376068115234, -0.013478279113769531, -0.011967182159423828, -0.010456085205078125, -0.008944988250732422, -0.007433891296386719, -0.005922794342041016, -0.0044116973876953125, -0.0029006004333496094, -0.0013895034790039062, 0.00012159347534179688, 0.0016326904296875, 0.003143787384033203, 0.004654884338378906, 0.006165981292724609, 0.0076770782470703125, 0.009188175201416016, 0.010699272155761719, 0.012210369110107422, 0.013721466064453125, 0.015232563018798828, 0.01674365997314453, 0.018254756927490234, 0.019765853881835938, 0.02127695083618164, 0.022788047790527344, 0.024299144744873047, 0.02581024169921875, 0.027321338653564453, 0.028832435607910156, 0.03034353256225586, 0.03185462951660156, 0.033365726470947266, 0.03487682342529297, 0.03638792037963867, 0.037899017333984375, 0.03941011428833008, 0.04092121124267578, 0.042432308197021484, 0.04394340515136719, 0.04545450210571289, 0.046965599060058594, 0.0484766960144043, 0.04998779296875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 13.0, 9.0, 13.0, 18.0, 36.0, 32.0, 22.0, 62.0, 39.0, 43.0, 42.0, 101.0, 64.0, 63.0, 54.0, 90.0, 42.0, 45.0, 56.0, 28.0, 16.0, 12.0, 33.0, 8.0, 11.0, 11.0, 3.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1886080503463745e-06, -2.1122395992279053e-06, -2.035871148109436e-06, -1.959502696990967e-06, -1.8831342458724976e-06, -1.8067657947540283e-06, -1.730397343635559e-06, -1.6540288925170898e-06, -1.5776604413986206e-06, -1.5012919902801514e-06, -1.4249235391616821e-06, -1.3485550880432129e-06, -1.2721866369247437e-06, -1.1958181858062744e-06, -1.1194497346878052e-06, -1.043081283569336e-06, -9.667128324508667e-07, -8.903443813323975e-07, -8.139759302139282e-07, -7.37607479095459e-07, -6.612390279769897e-07, -5.848705768585205e-07, -5.085021257400513e-07, -4.3213367462158203e-07, -3.557652235031128e-07, -2.7939677238464355e-07, -2.0302832126617432e-07, -1.2665987014770508e-07, -5.029141902923584e-08, 2.60770320892334e-08, 1.0244548320770264e-07, 1.7881393432617188e-07, 2.551823854446411e-07, 3.3155083656311035e-07, 4.079192876815796e-07, 4.842877388000488e-07, 5.606561899185181e-07, 6.370246410369873e-07, 7.133930921554565e-07, 7.897615432739258e-07, 8.66129994392395e-07, 9.424984455108643e-07, 1.0188668966293335e-06, 1.0952353477478027e-06, 1.171603798866272e-06, 1.2479722499847412e-06, 1.3243407011032104e-06, 1.4007091522216797e-06, 1.477077603340149e-06, 1.5534460544586182e-06, 1.6298145055770874e-06, 1.7061829566955566e-06, 1.7825514078140259e-06, 1.8589198589324951e-06, 1.9352883100509644e-06, 2.0116567611694336e-06, 2.088025212287903e-06, 2.164393663406372e-06, 2.2407621145248413e-06, 2.3171305656433105e-06, 2.3934990167617798e-06, 2.469867467880249e-06, 2.5462359189987183e-06, 2.6226043701171875e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 13.0, 7.0, 18.0, 25.0, 57.0, 54.0, 48.0, 77.0, 117.0, 132.0, 203.0, 286.0, 348.0, 523.0, 719.0, 1039.0, 1528.0, 2292.0, 3717.0, 5961.0, 10093.0, 19411.0, 41224.0, 108901.0, 471269.0, 242403.0, 70988.0, 29788.0, 14610.0, 8145.0, 4858.0, 3076.0, 2122.0, 1355.0, 875.0, 642.0, 442.0, 297.0, 225.0, 171.0, 137.0, 87.0, 65.0, 47.0, 41.0, 22.0, 26.0, 15.0, 11.0, 19.0, 5.0, 8.0, 4.0, 0.0, 2.0, 4.0], "bins": [-0.038909912109375, -0.037723541259765625, -0.03653717041015625, -0.035350799560546875, -0.0341644287109375, -0.032978057861328125, -0.03179168701171875, -0.030605316162109375, -0.0294189453125, -0.028232574462890625, -0.02704620361328125, -0.025859832763671875, -0.0246734619140625, -0.023487091064453125, -0.02230072021484375, -0.021114349365234375, -0.019927978515625, -0.018741607666015625, -0.01755523681640625, -0.016368865966796875, -0.0151824951171875, -0.013996124267578125, -0.01280975341796875, -0.011623382568359375, -0.01043701171875, -0.009250640869140625, -0.00806427001953125, -0.006877899169921875, -0.0056915283203125, -0.004505157470703125, -0.00331878662109375, -0.002132415771484375, -0.000946044921875, 0.000240325927734375, 0.00142669677734375, 0.002613067626953125, 0.0037994384765625, 0.004985809326171875, 0.00617218017578125, 0.007358551025390625, 0.008544921875, 0.009731292724609375, 0.01091766357421875, 0.012104034423828125, 0.0132904052734375, 0.014476776123046875, 0.01566314697265625, 0.016849517822265625, 0.018035888671875, 0.019222259521484375, 0.02040863037109375, 0.021595001220703125, 0.0227813720703125, 0.023967742919921875, 0.02515411376953125, 0.026340484619140625, 0.02752685546875, 0.028713226318359375, 0.02989959716796875, 0.031085968017578125, 0.0322723388671875, 0.033458709716796875, 0.03464508056640625, 0.035831451416015625, 0.037017822265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 3.0, 3.0, 13.0, 8.0, 13.0, 10.0, 13.0, 17.0, 16.0, 25.0, 24.0, 42.0, 54.0, 68.0, 104.0, 119.0, 86.0, 67.0, 65.0, 48.0, 26.0, 27.0, 20.0, 23.0, 11.0, 13.0, 16.0, 12.0, 11.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009124755859375, -0.008833169937133789, -0.008541584014892578, -0.008249998092651367, -0.007958412170410156, -0.007666826248168945, -0.007375240325927734, -0.0070836544036865234, -0.0067920684814453125, -0.0065004825592041016, -0.006208896636962891, -0.00591731071472168, -0.005625724792480469, -0.005334138870239258, -0.005042552947998047, -0.004750967025756836, -0.004459381103515625, -0.004167795181274414, -0.003876209259033203, -0.003584623336791992, -0.0032930374145507812, -0.0030014514923095703, -0.0027098655700683594, -0.0024182796478271484, -0.0021266937255859375, -0.0018351078033447266, -0.0015435218811035156, -0.0012519359588623047, -0.0009603500366210938, -0.0006687641143798828, -0.0003771781921386719, -8.559226989746094e-05, 0.00020599365234375, 0.0004975795745849609, 0.0007891654968261719, 0.0010807514190673828, 0.0013723373413085938, 0.0016639232635498047, 0.0019555091857910156, 0.0022470951080322266, 0.0025386810302734375, 0.0028302669525146484, 0.0031218528747558594, 0.0034134387969970703, 0.0037050247192382812, 0.003996610641479492, 0.004288196563720703, 0.004579782485961914, 0.004871368408203125, 0.005162954330444336, 0.005454540252685547, 0.005746126174926758, 0.006037712097167969, 0.00632929801940918, 0.006620883941650391, 0.0069124698638916016, 0.0072040557861328125, 0.0074956417083740234, 0.007787227630615234, 0.008078813552856445, 0.008370399475097656, 0.008661985397338867, 0.008953571319580078, 0.009245157241821289, 0.0095367431640625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 3.0, 5.0, 4.0, 7.0, 7.0, 7.0, 10.0, 16.0, 16.0, 29.0, 19.0, 20.0, 34.0, 43.0, 40.0, 67.0, 78.0, 84.0, 59.0, 83.0, 66.0, 60.0, 37.0, 22.0, 33.0, 22.0, 20.0, 16.0, 15.0, 10.0, 6.0, 16.0, 6.0, 7.0, 8.0, 2.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5102124214172363, -0.49216005206108093, -0.47410768270492554, -0.45605534315109253, -0.43800297379493713, -0.41995060443878174, -0.40189826488494873, -0.38384589552879333, -0.36579352617263794, -0.34774115681648254, -0.32968878746032715, -0.31163644790649414, -0.29358407855033875, -0.27553170919418335, -0.25747936964035034, -0.23942700028419495, -0.22137463092803955, -0.20332226157188416, -0.18526990711688995, -0.16721755266189575, -0.14916518330574036, -0.13111281394958496, -0.11306045949459076, -0.09500810503959656, -0.07695573568344116, -0.058903373777866364, -0.040851011872291565, -0.022798649966716766, -0.004746288061141968, 0.01330607384443283, 0.03135843575000763, 0.04941079020500183, 0.067463219165802, 0.0855155810713768, 0.1035679429769516, 0.1216203048825264, 0.1396726667881012, 0.1577250361442566, 0.1757773905992508, 0.193829745054245, 0.2118821144104004, 0.2299344837665558, 0.24798683822155, 0.2660391926765442, 0.2840915620326996, 0.302143931388855, 0.320196270942688, 0.3382486402988434, 0.3563010096549988, 0.3743533790111542, 0.39240574836730957, 0.4104580879211426, 0.428510457277298, 0.44656282663345337, 0.4646151661872864, 0.4826675355434418, 0.5007199048995972, 0.5187722444534302, 0.536824643611908, 0.554876983165741, 0.5729293823242188, 0.5909817218780518, 0.6090340614318848, 0.6270864009857178, 0.6451388001441956]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 10.0, 6.0, 11.0, 7.0, 14.0, 9.0, 16.0, 10.0, 17.0, 28.0, 25.0, 34.0, 22.0, 31.0, 33.0, 40.0, 33.0, 29.0, 36.0, 39.0, 29.0, 40.0, 34.0, 33.0, 38.0, 32.0, 36.0, 26.0, 40.0, 26.0, 39.0, 15.0, 26.0, 17.0, 19.0, 21.0, 15.0, 13.0, 8.0, 8.0, 5.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.49394622445106506, -0.4794827699661255, -0.4650193154811859, -0.45055586099624634, -0.43609243631362915, -0.4216289818286896, -0.40716552734375, -0.3927020728588104, -0.37823861837387085, -0.3637751638889313, -0.3493117094039917, -0.3348482847213745, -0.32038483023643494, -0.30592137575149536, -0.2914579212665558, -0.2769944667816162, -0.262531042098999, -0.24806758761405945, -0.23360414803028107, -0.2191406935453415, -0.20467723906040192, -0.19021379947662354, -0.17575034499168396, -0.16128689050674438, -0.1468234360218048, -0.13235998153686523, -0.11789653450250626, -0.10343308746814728, -0.0889696329832077, -0.07450618594884872, -0.060042738914489746, -0.04557928442955017, -0.031115829944610596, -0.01665237918496132, -0.0021889302879571915, 0.012274518609046936, 0.026737969368696213, 0.04120142012834549, 0.05566486716270447, 0.07012832164764404, 0.08459176868200302, 0.099055215716362, 0.11351867020130157, 0.12798210978507996, 0.14244556427001953, 0.1569090187549591, 0.17137247323989868, 0.18583592772483826, 0.20029936730861664, 0.2147628217935562, 0.2292262613773346, 0.24368971586227417, 0.25815317034721375, 0.2726166248321533, 0.2870800495147705, 0.30154353380203247, 0.31600695848464966, 0.33047041296958923, 0.3449338674545288, 0.359397292137146, 0.37386074662208557, 0.38832420110702515, 0.4027876555919647, 0.4172511100769043, 0.43171456456184387]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 0.0, 14.0, 23.0, 29.0, 41.0, 62.0, 95.0, 156.0, 210.0, 325.0, 465.0, 738.0, 1033.0, 1563.0, 2281.0, 3560.0, 5459.0, 8416.0, 13142.0, 21091.0, 35228.0, 60997.0, 110627.0, 215614.0, 253243.0, 133854.0, 71890.0, 41069.0, 24675.0, 15267.0, 9490.0, 5964.0, 3978.0, 2619.0, 1770.0, 1169.0, 813.0, 513.0, 353.0, 254.0, 154.0, 124.0, 71.0, 49.0, 23.0, 21.0, 15.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.91845703125, -0.8898849487304688, -0.8613128662109375, -0.8327407836914062, -0.804168701171875, -0.7755966186523438, -0.7470245361328125, -0.7184524536132812, -0.68988037109375, -0.6613082885742188, -0.6327362060546875, -0.6041641235351562, -0.575592041015625, -0.5470199584960938, -0.5184478759765625, -0.48987579345703125, -0.4613037109375, -0.43273162841796875, -0.4041595458984375, -0.37558746337890625, -0.347015380859375, -0.31844329833984375, -0.2898712158203125, -0.26129913330078125, -0.23272705078125, -0.20415496826171875, -0.1755828857421875, -0.14701080322265625, -0.118438720703125, -0.08986663818359375, -0.0612945556640625, -0.03272247314453125, -0.004150390625, 0.02442169189453125, 0.0529937744140625, 0.08156585693359375, 0.110137939453125, 0.13871002197265625, 0.1672821044921875, 0.19585418701171875, 0.22442626953125, 0.25299835205078125, 0.2815704345703125, 0.31014251708984375, 0.338714599609375, 0.36728668212890625, 0.3958587646484375, 0.42443084716796875, 0.4530029296875, 0.48157501220703125, 0.5101470947265625, 0.5387191772460938, 0.567291259765625, 0.5958633422851562, 0.6244354248046875, 0.6530075073242188, 0.68157958984375, 0.7101516723632812, 0.7387237548828125, 0.7672958374023438, 0.795867919921875, 0.8244400024414062, 0.8530120849609375, 0.8815841674804688, 0.91015625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 3.0, 9.0, 10.0, 13.0, 16.0, 14.0, 14.0, 29.0, 24.0, 30.0, 23.0, 38.0, 42.0, 32.0, 35.0, 34.0, 34.0, 35.0, 49.0, 43.0, 33.0, 39.0, 38.0, 30.0, 41.0, 24.0, 45.0, 30.0, 24.0, 19.0, 20.0, 25.0, 10.0, 15.0, 13.0, 12.0, 10.0, 9.0, 6.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.462646484375, -0.4485321044921875, -0.434417724609375, -0.4203033447265625, -0.40618896484375, -0.3920745849609375, -0.377960205078125, -0.3638458251953125, -0.3497314453125, -0.3356170654296875, -0.321502685546875, -0.3073883056640625, -0.29327392578125, -0.2791595458984375, -0.265045166015625, -0.2509307861328125, -0.23681640625, -0.2227020263671875, -0.208587646484375, -0.1944732666015625, -0.18035888671875, -0.1662445068359375, -0.152130126953125, -0.1380157470703125, -0.1239013671875, -0.1097869873046875, -0.095672607421875, -0.0815582275390625, -0.06744384765625, -0.0533294677734375, -0.039215087890625, -0.0251007080078125, -0.010986328125, 0.0031280517578125, 0.017242431640625, 0.0313568115234375, 0.04547119140625, 0.0595855712890625, 0.073699951171875, 0.0878143310546875, 0.1019287109375, 0.1160430908203125, 0.130157470703125, 0.1442718505859375, 0.15838623046875, 0.1725006103515625, 0.186614990234375, 0.2007293701171875, 0.21484375, 0.2289581298828125, 0.243072509765625, 0.2571868896484375, 0.27130126953125, 0.2854156494140625, 0.299530029296875, 0.3136444091796875, 0.3277587890625, 0.3418731689453125, 0.355987548828125, 0.3701019287109375, 0.38421630859375, 0.3983306884765625, 0.412445068359375, 0.4265594482421875, 0.440673828125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 15.0, 14.0, 26.0, 32.0, 38.0, 72.0, 87.0, 154.0, 180.0, 265.0, 381.0, 536.0, 806.0, 1134.0, 1621.0, 2268.0, 3480.0, 5108.0, 7626.0, 12045.0, 19136.0, 31410.0, 53131.0, 94089.0, 180684.0, 272942.0, 154111.0, 82480.0, 47044.0, 27837.0, 17111.0, 10682.0, 7110.0, 4707.0, 3120.0, 2206.0, 1416.0, 1012.0, 734.0, 518.0, 356.0, 227.0, 177.0, 133.0, 85.0, 65.0, 44.0, 36.0, 25.0, 12.0, 11.0, 6.0, 3.0, 4.0, 1.0, 3.0], "bins": [-0.92919921875, -0.9013671875, -0.87353515625, -0.845703125, -0.81787109375, -0.7900390625, -0.76220703125, -0.734375, -0.70654296875, -0.6787109375, -0.65087890625, -0.623046875, -0.59521484375, -0.5673828125, -0.53955078125, -0.51171875, -0.48388671875, -0.4560546875, -0.42822265625, -0.400390625, -0.37255859375, -0.3447265625, -0.31689453125, -0.2890625, -0.26123046875, -0.2333984375, -0.20556640625, -0.177734375, -0.14990234375, -0.1220703125, -0.09423828125, -0.06640625, -0.03857421875, -0.0107421875, 0.01708984375, 0.044921875, 0.07275390625, 0.1005859375, 0.12841796875, 0.15625, 0.18408203125, 0.2119140625, 0.23974609375, 0.267578125, 0.29541015625, 0.3232421875, 0.35107421875, 0.37890625, 0.40673828125, 0.4345703125, 0.46240234375, 0.490234375, 0.51806640625, 0.5458984375, 0.57373046875, 0.6015625, 0.62939453125, 0.6572265625, 0.68505859375, 0.712890625, 0.74072265625, 0.7685546875, 0.79638671875, 0.82421875, 0.85205078125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 4.0, 4.0, 7.0, 6.0, 4.0, 12.0, 9.0, 12.0, 9.0, 10.0, 18.0, 20.0, 26.0, 23.0, 28.0, 27.0, 28.0, 26.0, 29.0, 32.0, 34.0, 24.0, 29.0, 44.0, 36.0, 37.0, 32.0, 34.0, 32.0, 34.0, 37.0, 31.0, 28.0, 22.0, 24.0, 15.0, 27.0, 23.0, 22.0, 13.0, 6.0, 17.0, 11.0, 15.0, 6.0, 7.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.276611328125, -0.2684040069580078, -0.2601966857910156, -0.25198936462402344, -0.24378204345703125, -0.23557472229003906, -0.22736740112304688, -0.2191600799560547, -0.2109527587890625, -0.2027454376220703, -0.19453811645507812, -0.18633079528808594, -0.17812347412109375, -0.16991615295410156, -0.16170883178710938, -0.1535015106201172, -0.145294189453125, -0.1370868682861328, -0.12887954711914062, -0.12067222595214844, -0.11246490478515625, -0.10425758361816406, -0.09605026245117188, -0.08784294128417969, -0.0796356201171875, -0.07142829895019531, -0.06322097778320312, -0.05501365661621094, -0.04680633544921875, -0.03859901428222656, -0.030391693115234375, -0.022184371948242188, -0.01397705078125, -0.0057697296142578125, 0.002437591552734375, 0.010644912719726562, 0.01885223388671875, 0.027059555053710938, 0.035266876220703125, 0.04347419738769531, 0.0516815185546875, 0.05988883972167969, 0.06809616088867188, 0.07630348205566406, 0.08451080322265625, 0.09271812438964844, 0.10092544555664062, 0.10913276672363281, 0.117340087890625, 0.1255474090576172, 0.13375473022460938, 0.14196205139160156, 0.15016937255859375, 0.15837669372558594, 0.16658401489257812, 0.1747913360595703, 0.1829986572265625, 0.1912059783935547, 0.19941329956054688, 0.20762062072753906, 0.21582794189453125, 0.22403526306152344, 0.23224258422851562, 0.2404499053955078, 0.2486572265625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 7.0, 11.0, 17.0, 25.0, 35.0, 61.0, 91.0, 138.0, 189.0, 256.0, 367.0, 559.0, 795.0, 1087.0, 1620.0, 2401.0, 3438.0, 5489.0, 8841.0, 14474.0, 26434.0, 62057.0, 722032.0, 114476.0, 35294.0, 17977.0, 10633.0, 6590.0, 4283.0, 2793.0, 1888.0, 1260.0, 897.0, 629.0, 433.0, 308.0, 204.0, 135.0, 111.0, 62.0, 49.0, 37.0, 26.0, 20.0, 11.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283203125, -0.27426910400390625, -0.2653350830078125, -0.25640106201171875, -0.247467041015625, -0.23853302001953125, -0.2295989990234375, -0.22066497802734375, -0.21173095703125, -0.20279693603515625, -0.1938629150390625, -0.18492889404296875, -0.175994873046875, -0.16706085205078125, -0.1581268310546875, -0.14919281005859375, -0.1402587890625, -0.13132476806640625, -0.1223907470703125, -0.11345672607421875, -0.104522705078125, -0.09558868408203125, -0.0866546630859375, -0.07772064208984375, -0.06878662109375, -0.05985260009765625, -0.0509185791015625, -0.04198455810546875, -0.033050537109375, -0.02411651611328125, -0.0151824951171875, -0.00624847412109375, 0.002685546875, 0.01161956787109375, 0.0205535888671875, 0.02948760986328125, 0.038421630859375, 0.04735565185546875, 0.0562896728515625, 0.06522369384765625, 0.07415771484375, 0.08309173583984375, 0.0920257568359375, 0.10095977783203125, 0.109893798828125, 0.11882781982421875, 0.1277618408203125, 0.13669586181640625, 0.1456298828125, 0.15456390380859375, 0.1634979248046875, 0.17243194580078125, 0.181365966796875, 0.19029998779296875, 0.1992340087890625, 0.20816802978515625, 0.21710205078125, 0.22603607177734375, 0.2349700927734375, 0.24390411376953125, 0.252838134765625, 0.26177215576171875, 0.2707061767578125, 0.27964019775390625, 0.28857421875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 5.0, 2.0, 9.0, 2.0, 9.0, 9.0, 31.0, 38.0, 79.0, 272.0, 344.0, 58.0, 42.0, 19.0, 23.0, 17.0, 9.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9311904907226562e-05, -1.8863007426261902e-05, -1.841410994529724e-05, -1.796521246433258e-05, -1.751631498336792e-05, -1.706741750240326e-05, -1.66185200214386e-05, -1.6169622540473938e-05, -1.5720725059509277e-05, -1.5271827578544617e-05, -1.4822930097579956e-05, -1.4374032616615295e-05, -1.3925135135650635e-05, -1.3476237654685974e-05, -1.3027340173721313e-05, -1.2578442692756653e-05, -1.2129545211791992e-05, -1.1680647730827332e-05, -1.1231750249862671e-05, -1.078285276889801e-05, -1.033395528793335e-05, -9.885057806968689e-06, -9.436160326004028e-06, -8.987262845039368e-06, -8.538365364074707e-06, -8.089467883110046e-06, -7.640570402145386e-06, -7.191672921180725e-06, -6.7427754402160645e-06, -6.293877959251404e-06, -5.844980478286743e-06, -5.3960829973220825e-06, -4.947185516357422e-06, -4.498288035392761e-06, -4.049390554428101e-06, -3.60049307346344e-06, -3.1515955924987793e-06, -2.7026981115341187e-06, -2.253800630569458e-06, -1.8049031496047974e-06, -1.3560056686401367e-06, -9.071081876754761e-07, -4.5821070671081543e-07, -9.313225746154785e-09, 4.3958425521850586e-07, 8.884817361831665e-07, 1.3373792171478271e-06, 1.7862766981124878e-06, 2.2351741790771484e-06, 2.684071660041809e-06, 3.1329691410064697e-06, 3.5818666219711304e-06, 4.030764102935791e-06, 4.479661583900452e-06, 4.928559064865112e-06, 5.377456545829773e-06, 5.826354026794434e-06, 6.275251507759094e-06, 6.724148988723755e-06, 7.1730464696884155e-06, 7.621943950653076e-06, 8.070841431617737e-06, 8.519738912582397e-06, 8.968636393547058e-06, 9.417533874511719e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 12.0, 15.0, 20.0, 27.0, 34.0, 44.0, 67.0, 92.0, 104.0, 168.0, 219.0, 307.0, 430.0, 571.0, 756.0, 1040.0, 1511.0, 2236.0, 3232.0, 4758.0, 7570.0, 12439.0, 22448.0, 49965.0, 731140.0, 127276.0, 34499.0, 17481.0, 10341.0, 6255.0, 4093.0, 2736.0, 1948.0, 1271.0, 944.0, 665.0, 475.0, 379.0, 246.0, 193.0, 143.0, 97.0, 79.0, 38.0, 56.0, 33.0, 19.0, 25.0, 17.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.371337890625, -0.360015869140625, -0.34869384765625, -0.337371826171875, -0.3260498046875, -0.314727783203125, -0.30340576171875, -0.292083740234375, -0.28076171875, -0.269439697265625, -0.25811767578125, -0.246795654296875, -0.2354736328125, -0.224151611328125, -0.21282958984375, -0.201507568359375, -0.190185546875, -0.178863525390625, -0.16754150390625, -0.156219482421875, -0.1448974609375, -0.133575439453125, -0.12225341796875, -0.110931396484375, -0.099609375, -0.088287353515625, -0.07696533203125, -0.065643310546875, -0.0543212890625, -0.042999267578125, -0.03167724609375, -0.020355224609375, -0.009033203125, 0.002288818359375, 0.01361083984375, 0.024932861328125, 0.0362548828125, 0.047576904296875, 0.05889892578125, 0.070220947265625, 0.08154296875, 0.092864990234375, 0.10418701171875, 0.115509033203125, 0.1268310546875, 0.138153076171875, 0.14947509765625, 0.160797119140625, 0.172119140625, 0.183441162109375, 0.19476318359375, 0.206085205078125, 0.2174072265625, 0.228729248046875, 0.24005126953125, 0.251373291015625, 0.2626953125, 0.274017333984375, 0.28533935546875, 0.296661376953125, 0.3079833984375, 0.319305419921875, 0.33062744140625, 0.341949462890625, 0.353271484375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 6.0, 7.0, 15.0, 12.0, 13.0, 23.0, 28.0, 41.0, 182.0, 426.0, 52.0, 33.0, 25.0, 13.0, 14.0, 18.0, 12.0, 14.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11306571960449219, -0.10931015014648438, -0.10555458068847656, -0.10179901123046875, -0.09804344177246094, -0.09428787231445312, -0.09053230285644531, -0.0867767333984375, -0.08302116394042969, -0.07926559448242188, -0.07551002502441406, -0.07175445556640625, -0.06799888610839844, -0.06424331665039062, -0.06048774719238281, -0.056732177734375, -0.05297660827636719, -0.049221038818359375, -0.04546546936035156, -0.04170989990234375, -0.03795433044433594, -0.034198760986328125, -0.030443191528320312, -0.0266876220703125, -0.022932052612304688, -0.019176483154296875, -0.015420913696289062, -0.01166534423828125, -0.007909774780273438, -0.004154205322265625, -0.0003986358642578125, 0.00335693359375, 0.0071125030517578125, 0.010868072509765625, 0.014623641967773438, 0.01837921142578125, 0.022134780883789062, 0.025890350341796875, 0.029645919799804688, 0.0334014892578125, 0.03715705871582031, 0.040912628173828125, 0.04466819763183594, 0.04842376708984375, 0.05217933654785156, 0.055934906005859375, 0.05969047546386719, 0.063446044921875, 0.06720161437988281, 0.07095718383789062, 0.07471275329589844, 0.07846832275390625, 0.08222389221191406, 0.08597946166992188, 0.08973503112792969, 0.0934906005859375, 0.09724617004394531, 0.10100173950195312, 0.10475730895996094, 0.10851287841796875, 0.11226844787597656, 0.11602401733398438, 0.11977958679199219, 0.12353515625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 3.0, 7.0, 3.0, 11.0, 12.0, 11.0, 15.0, 18.0, 18.0, 27.0, 36.0, 38.0, 54.0, 68.0, 57.0, 74.0, 85.0, 92.0, 68.0, 51.0, 35.0, 39.0, 24.0, 23.0, 16.0, 24.0, 17.0, 8.0, 11.0, 7.0, 4.0, 6.0, 5.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5670521259307861, -0.5489276051521301, -0.5308030843734741, -0.5126785039901733, -0.49455398321151733, -0.47642946243286133, -0.45830491185188293, -0.44018036127090454, -0.42205584049224854, -0.40393131971359253, -0.38580676913261414, -0.36768221855163574, -0.34955769777297974, -0.33143317699432373, -0.31330862641334534, -0.29518407583236694, -0.27705955505371094, -0.25893503427505493, -0.24081048369407654, -0.22268594801425934, -0.20456141233444214, -0.18643687665462494, -0.16831234097480774, -0.15018780529499054, -0.13206326961517334, -0.11393873393535614, -0.09581419825553894, -0.07768966257572174, -0.05956512689590454, -0.04144059121608734, -0.02331605553627014, -0.005191519856452942, 0.012933075428009033, 0.031057611107826233, 0.04918214678764343, 0.06730668246746063, 0.08543121814727783, 0.10355575382709503, 0.12168028950691223, 0.13980482518672943, 0.15792936086654663, 0.17605389654636383, 0.19417843222618103, 0.21230296790599823, 0.23042750358581543, 0.24855203926563263, 0.26667657494544983, 0.2848011255264282, 0.30292564630508423, 0.32105016708374023, 0.33917471766471863, 0.357299268245697, 0.375423789024353, 0.39354830980300903, 0.4116728603839874, 0.4297974109649658, 0.4479219317436218, 0.46604645252227783, 0.4841710031032562, 0.5022955536842346, 0.5204200744628906, 0.5385445952415466, 0.5566691160202026, 0.5747936964035034, 0.5929182171821594]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 8.0, 7.0, 5.0, 9.0, 12.0, 13.0, 13.0, 16.0, 15.0, 12.0, 27.0, 22.0, 32.0, 22.0, 32.0, 33.0, 36.0, 39.0, 45.0, 29.0, 32.0, 38.0, 26.0, 36.0, 37.0, 35.0, 31.0, 39.0, 41.0, 27.0, 29.0, 29.0, 27.0, 19.0, 25.0, 13.0, 14.0, 14.0, 11.0, 5.0, 9.0, 4.0, 4.0, 3.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.47422370314598083, -0.4603085517883301, -0.4463934004306793, -0.43247824907302856, -0.4185630977153778, -0.40464794635772705, -0.3907328248023987, -0.37681764364242554, -0.36290252208709717, -0.3489873707294464, -0.33507221937179565, -0.3211570680141449, -0.30724191665649414, -0.2933267652988434, -0.2794116139411926, -0.26549649238586426, -0.2515813112258911, -0.23766615986824036, -0.2237510085105896, -0.20983585715293884, -0.19592070579528809, -0.18200555443763733, -0.16809041798114777, -0.154175266623497, -0.14026011526584625, -0.1263449639081955, -0.11242981255054474, -0.09851466864347458, -0.08459951728582382, -0.07068436592817307, -0.056769222021102905, -0.04285407066345215, -0.028938889503479004, -0.015023740008473396, -0.0011085905134677887, 0.01280655711889267, 0.026721708476543427, 0.04063685983419418, 0.05455200374126434, 0.0684671550989151, 0.08238230645656586, 0.09629745781421661, 0.11021260917186737, 0.12412775307893753, 0.1380428969860077, 0.15195804834365845, 0.1658731997013092, 0.17978835105895996, 0.19370350241661072, 0.20761865377426147, 0.22153380513191223, 0.235448956489563, 0.24936410784721375, 0.2632792592048645, 0.27719438076019287, 0.291109561920166, 0.3050246834754944, 0.31893983483314514, 0.3328549861907959, 0.34677013754844666, 0.3606852889060974, 0.37460044026374817, 0.3885155916213989, 0.4024307131767273, 0.41634589433670044]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 9.0, 16.0, 32.0, 46.0, 69.0, 117.0, 177.0, 380.0, 569.0, 1058.0, 1794.0, 3042.0, 5293.0, 8551.0, 14036.0, 24502.0, 44519.0, 85098.0, 177959.0, 498032.0, 1822299.0, 966672.0, 274865.0, 122626.0, 61955.0, 33682.0, 19218.0, 11197.0, 6634.0, 3940.0, 2519.0, 1398.0, 779.0, 460.0, 279.0, 181.0, 109.0, 53.0, 51.0, 34.0, 10.0, 6.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6615447998046875, -0.638519287109375, -0.6154937744140625, -0.59246826171875, -0.5694427490234375, -0.546417236328125, -0.5233917236328125, -0.5003662109375, -0.4773406982421875, -0.454315185546875, -0.4312896728515625, -0.40826416015625, -0.3852386474609375, -0.362213134765625, -0.3391876220703125, -0.316162109375, -0.2931365966796875, -0.270111083984375, -0.2470855712890625, -0.22406005859375, -0.2010345458984375, -0.178009033203125, -0.1549835205078125, -0.1319580078125, -0.1089324951171875, -0.085906982421875, -0.0628814697265625, -0.03985595703125, -0.0168304443359375, 0.006195068359375, 0.0292205810546875, 0.05224609375, 0.0752716064453125, 0.098297119140625, 0.1213226318359375, 0.14434814453125, 0.1673736572265625, 0.190399169921875, 0.2134246826171875, 0.2364501953125, 0.2594757080078125, 0.282501220703125, 0.3055267333984375, 0.32855224609375, 0.3515777587890625, 0.374603271484375, 0.3976287841796875, 0.420654296875, 0.4436798095703125, 0.466705322265625, 0.4897308349609375, 0.51275634765625, 0.5357818603515625, 0.558807373046875, 0.5818328857421875, 0.6048583984375, 0.6278839111328125, 0.650909423828125, 0.6739349365234375, 0.69696044921875, 0.7199859619140625, 0.743011474609375, 0.7660369873046875, 0.7890625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 10.0, 4.0, 10.0, 11.0, 15.0, 8.0, 13.0, 21.0, 22.0, 25.0, 20.0, 27.0, 31.0, 30.0, 45.0, 36.0, 38.0, 31.0, 31.0, 34.0, 42.0, 37.0, 38.0, 29.0, 41.0, 33.0, 40.0, 29.0, 33.0, 22.0, 26.0, 32.0, 19.0, 11.0, 21.0, 7.0, 10.0, 12.0, 8.0, 5.0, 5.0, 2.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.261962890625, -0.2534675598144531, -0.24497222900390625, -0.23647689819335938, -0.2279815673828125, -0.21948623657226562, -0.21099090576171875, -0.20249557495117188, -0.194000244140625, -0.18550491333007812, -0.17700958251953125, -0.16851425170898438, -0.1600189208984375, -0.15152359008789062, -0.14302825927734375, -0.13453292846679688, -0.12603759765625, -0.11754226684570312, -0.10904693603515625, -0.10055160522460938, -0.0920562744140625, -0.08356094360351562, -0.07506561279296875, -0.06657028198242188, -0.058074951171875, -0.049579620361328125, -0.04108428955078125, -0.032588958740234375, -0.0240936279296875, -0.015598297119140625, -0.00710296630859375, 0.001392364501953125, 0.0098876953125, 0.018383026123046875, 0.02687835693359375, 0.035373687744140625, 0.0438690185546875, 0.052364349365234375, 0.06085968017578125, 0.06935501098632812, 0.077850341796875, 0.08634567260742188, 0.09484100341796875, 0.10333633422851562, 0.1118316650390625, 0.12032699584960938, 0.12882232666015625, 0.13731765747070312, 0.14581298828125, 0.15430831909179688, 0.16280364990234375, 0.17129898071289062, 0.1797943115234375, 0.18828964233398438, 0.19678497314453125, 0.20528030395507812, 0.213775634765625, 0.22227096557617188, 0.23076629638671875, 0.23926162719726562, 0.2477569580078125, 0.2562522888183594, 0.26474761962890625, 0.2732429504394531, 0.28173828125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 12.0, 13.0, 15.0, 21.0, 49.0, 61.0, 90.0, 128.0, 194.0, 383.0, 533.0, 804.0, 1289.0, 1976.0, 3198.0, 5096.0, 8076.0, 13329.0, 21839.0, 36807.0, 64493.0, 116648.0, 223629.0, 479762.0, 1284467.0, 1072113.0, 413755.0, 197381.0, 104625.0, 58112.0, 33246.0, 19914.0, 11953.0, 7443.0, 4663.0, 2918.0, 1813.0, 1243.0, 746.0, 463.0, 361.0, 203.0, 149.0, 86.0, 60.0, 50.0, 36.0, 18.0, 9.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.488037109375, -0.4722480773925781, -0.45645904541015625, -0.4406700134277344, -0.4248809814453125, -0.4090919494628906, -0.39330291748046875, -0.3775138854980469, -0.361724853515625, -0.3459358215332031, -0.33014678955078125, -0.3143577575683594, -0.2985687255859375, -0.2827796936035156, -0.26699066162109375, -0.2512016296386719, -0.23541259765625, -0.21962356567382812, -0.20383453369140625, -0.18804550170898438, -0.1722564697265625, -0.15646743774414062, -0.14067840576171875, -0.12488937377929688, -0.109100341796875, -0.09331130981445312, -0.07752227783203125, -0.061733245849609375, -0.0459442138671875, -0.030155181884765625, -0.01436614990234375, 0.001422882080078125, 0.0172119140625, 0.033000946044921875, 0.04878997802734375, 0.06457901000976562, 0.0803680419921875, 0.09615707397460938, 0.11194610595703125, 0.12773513793945312, 0.143524169921875, 0.15931320190429688, 0.17510223388671875, 0.19089126586914062, 0.2066802978515625, 0.22246932983398438, 0.23825836181640625, 0.2540473937988281, 0.26983642578125, 0.2856254577636719, 0.30141448974609375, 0.3172035217285156, 0.3329925537109375, 0.3487815856933594, 0.36457061767578125, 0.3803596496582031, 0.396148681640625, 0.4119377136230469, 0.42772674560546875, 0.4435157775878906, 0.4593048095703125, 0.4750938415527344, 0.49088287353515625, 0.5066719055175781, 0.5224609375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 6.0, 6.0, 13.0, 9.0, 13.0, 21.0, 28.0, 42.0, 47.0, 33.0, 73.0, 66.0, 101.0, 115.0, 121.0, 152.0, 169.0, 184.0, 227.0, 232.0, 268.0, 316.0, 264.0, 266.0, 191.0, 174.0, 167.0, 128.0, 114.0, 102.0, 97.0, 65.0, 62.0, 28.0, 40.0, 28.0, 23.0, 15.0, 17.0, 7.0, 10.0, 3.0, 12.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1575927734375, -0.15271949768066406, -0.14784622192382812, -0.1429729461669922, -0.13809967041015625, -0.1332263946533203, -0.12835311889648438, -0.12347984313964844, -0.1186065673828125, -0.11373329162597656, -0.10886001586914062, -0.10398674011230469, -0.09911346435546875, -0.09424018859863281, -0.08936691284179688, -0.08449363708496094, -0.079620361328125, -0.07474708557128906, -0.06987380981445312, -0.06500053405761719, -0.06012725830078125, -0.05525398254394531, -0.050380706787109375, -0.04550743103027344, -0.0406341552734375, -0.03576087951660156, -0.030887603759765625, -0.026014328002929688, -0.02114105224609375, -0.016267776489257812, -0.011394500732421875, -0.0065212249755859375, -0.00164794921875, 0.0032253265380859375, 0.008098602294921875, 0.012971878051757812, 0.01784515380859375, 0.022718429565429688, 0.027591705322265625, 0.03246498107910156, 0.0373382568359375, 0.04221153259277344, 0.047084808349609375, 0.05195808410644531, 0.05683135986328125, 0.06170463562011719, 0.06657791137695312, 0.07145118713378906, 0.076324462890625, 0.08119773864746094, 0.08607101440429688, 0.09094429016113281, 0.09581756591796875, 0.10069084167480469, 0.10556411743164062, 0.11043739318847656, 0.1153106689453125, 0.12018394470214844, 0.12505722045898438, 0.1299304962158203, 0.13480377197265625, 0.1396770477294922, 0.14455032348632812, 0.14942359924316406, 0.154296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 9.0, 2.0, 7.0, 10.0, 11.0, 14.0, 27.0, 27.0, 37.0, 43.0, 51.0, 55.0, 90.0, 92.0, 80.0, 83.0, 70.0, 50.0, 49.0, 40.0, 27.0, 23.0, 21.0, 14.0, 9.0, 12.0, 8.0, 9.0, 4.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3909737467765808, -0.3766573369503021, -0.36234092712402344, -0.34802454710006714, -0.33370813727378845, -0.31939172744750977, -0.3050753176212311, -0.2907589077949524, -0.2764425277709961, -0.2621261179447174, -0.24780972301959991, -0.23349331319332123, -0.21917691826820374, -0.20486050844192505, -0.19054409861564636, -0.17622770369052887, -0.16191129386425018, -0.1475948840379715, -0.133278489112854, -0.11896207928657532, -0.10464568436145782, -0.09032927453517914, -0.07601287215948105, -0.06169646978378296, -0.04738006740808487, -0.03306366503238678, -0.01874726079404354, -0.004430856555700302, 0.009885545819997787, 0.024201951920986176, 0.038518354296684265, 0.052834756672382355, 0.06715115904808044, 0.08146756142377853, 0.09578396379947662, 0.11010037362575531, 0.1244167685508728, 0.1387331783771515, 0.15304958820343018, 0.16736598312854767, 0.18168237805366516, 0.19599878787994385, 0.21031518280506134, 0.22463159263134003, 0.23894798755645752, 0.2532643973827362, 0.2675808072090149, 0.2818971872329712, 0.29621362686157227, 0.31053003668785095, 0.32484644651412964, 0.33916282653808594, 0.3534792363643646, 0.3677956461906433, 0.382112056016922, 0.3964284658432007, 0.410744845867157, 0.42506125569343567, 0.43937766551971436, 0.45369404554367065, 0.46801045536994934, 0.482326865196228, 0.4966432750225067, 0.5109596848487854, 0.5252760648727417]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 9.0, 3.0, 6.0, 7.0, 9.0, 5.0, 6.0, 19.0, 17.0, 11.0, 20.0, 16.0, 31.0, 40.0, 27.0, 31.0, 35.0, 29.0, 32.0, 41.0, 41.0, 30.0, 41.0, 32.0, 48.0, 31.0, 42.0, 40.0, 46.0, 27.0, 37.0, 24.0, 22.0, 28.0, 14.0, 20.0, 9.0, 12.0, 12.0, 11.0, 9.0, 12.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3135598599910736, -0.3038623332977295, -0.2941648066043854, -0.28446730971336365, -0.27476978302001953, -0.2650722563266754, -0.2553747296333313, -0.24567720293998718, -0.23597969114780426, -0.22628216445446014, -0.21658465266227722, -0.2068871259689331, -0.197189599275589, -0.18749208748340607, -0.17779456079006195, -0.16809704899787903, -0.1583995223045349, -0.1487019956111908, -0.13900448381900787, -0.12930695712566376, -0.11960943788290024, -0.10991191864013672, -0.1002143919467926, -0.09051687270402908, -0.08081935346126556, -0.07112183421850204, -0.06142431125044823, -0.05172678828239441, -0.04202926903963089, -0.03233174979686737, -0.022634226828813553, -0.012936703860759735, -0.0032392144203186035, 0.006458306685090065, 0.016155827790498734, 0.025853348895907402, 0.03555087000131607, 0.04524838924407959, 0.05494591221213341, 0.06464343518018723, 0.07434095442295074, 0.08403847366571426, 0.09373599290847778, 0.1034335196018219, 0.11313103884458542, 0.12282855808734894, 0.13252608478069305, 0.14222359657287598, 0.1519211232662201, 0.1616186499595642, 0.17131616175174713, 0.18101368844509125, 0.19071120023727417, 0.2004087269306183, 0.2101062536239624, 0.21980378031730652, 0.22950129210948944, 0.23919881880283356, 0.24889633059501648, 0.2585938572883606, 0.2682913839817047, 0.27798891067504883, 0.28768640756607056, 0.2973839342594147, 0.3070814609527588]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 11.0, 19.0, 26.0, 33.0, 60.0, 72.0, 171.0, 245.0, 398.0, 671.0, 1237.0, 2189.0, 4104.0, 7495.0, 14709.0, 29335.0, 64149.0, 152088.0, 362159.0, 233476.0, 92804.0, 41287.0, 19647.0, 10070.0, 5378.0, 2917.0, 1549.0, 894.0, 527.0, 303.0, 201.0, 126.0, 73.0, 41.0, 31.0, 14.0, 15.0, 8.0, 4.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1962890625, -0.1894550323486328, -0.18262100219726562, -0.17578697204589844, -0.16895294189453125, -0.16211891174316406, -0.15528488159179688, -0.1484508514404297, -0.1416168212890625, -0.1347827911376953, -0.12794876098632812, -0.12111473083496094, -0.11428070068359375, -0.10744667053222656, -0.10061264038085938, -0.09377861022949219, -0.086944580078125, -0.08011054992675781, -0.07327651977539062, -0.06644248962402344, -0.05960845947265625, -0.05277442932128906, -0.045940399169921875, -0.03910636901855469, -0.0322723388671875, -0.025438308715820312, -0.018604278564453125, -0.011770248413085938, -0.00493621826171875, 0.0018978118896484375, 0.008731842041015625, 0.015565872192382812, 0.02239990234375, 0.029233932495117188, 0.036067962646484375, 0.04290199279785156, 0.04973602294921875, 0.05657005310058594, 0.06340408325195312, 0.07023811340332031, 0.0770721435546875, 0.08390617370605469, 0.09074020385742188, 0.09757423400878906, 0.10440826416015625, 0.11124229431152344, 0.11807632446289062, 0.12491035461425781, 0.131744384765625, 0.1385784149169922, 0.14541244506835938, 0.15224647521972656, 0.15908050537109375, 0.16591453552246094, 0.17274856567382812, 0.1795825958251953, 0.1864166259765625, 0.1932506561279297, 0.20008468627929688, 0.20691871643066406, 0.21375274658203125, 0.22058677673339844, 0.22742080688476562, 0.2342548370361328, 0.2410888671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 12.0, 5.0, 6.0, 5.0, 3.0, 5.0, 9.0, 17.0, 8.0, 18.0, 14.0, 22.0, 26.0, 30.0, 31.0, 19.0, 28.0, 24.0, 33.0, 37.0, 50.0, 37.0, 30.0, 34.0, 41.0, 37.0, 37.0, 40.0, 39.0, 31.0, 37.0, 31.0, 30.0, 25.0, 25.0, 22.0, 21.0, 10.0, 10.0, 12.0, 9.0, 9.0, 7.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.311767578125, -0.30217742919921875, -0.2925872802734375, -0.28299713134765625, -0.273406982421875, -0.26381683349609375, -0.2542266845703125, -0.24463653564453125, -0.23504638671875, -0.22545623779296875, -0.2158660888671875, -0.20627593994140625, -0.196685791015625, -0.18709564208984375, -0.1775054931640625, -0.16791534423828125, -0.1583251953125, -0.14873504638671875, -0.1391448974609375, -0.12955474853515625, -0.119964599609375, -0.11037445068359375, -0.1007843017578125, -0.09119415283203125, -0.08160400390625, -0.07201385498046875, -0.0624237060546875, -0.05283355712890625, -0.043243408203125, -0.03365325927734375, -0.0240631103515625, -0.01447296142578125, -0.0048828125, 0.00470733642578125, 0.0142974853515625, 0.02388763427734375, 0.033477783203125, 0.04306793212890625, 0.0526580810546875, 0.06224822998046875, 0.07183837890625, 0.08142852783203125, 0.0910186767578125, 0.10060882568359375, 0.110198974609375, 0.11978912353515625, 0.1293792724609375, 0.13896942138671875, 0.1485595703125, 0.15814971923828125, 0.1677398681640625, 0.17733001708984375, 0.186920166015625, 0.19651031494140625, 0.2061004638671875, 0.21569061279296875, 0.22528076171875, 0.23487091064453125, 0.2444610595703125, 0.25405120849609375, 0.263641357421875, 0.27323150634765625, 0.2828216552734375, 0.29241180419921875, 0.302001953125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 15.0, 11.0, 11.0, 23.0, 38.0, 42.0, 62.0, 94.0, 145.0, 228.0, 404.0, 622.0, 962.0, 1500.0, 2531.0, 4276.0, 8043.0, 17030.0, 47085.0, 198264.0, 588020.0, 116887.0, 33180.0, 13171.0, 6627.0, 3512.0, 2121.0, 1302.0, 840.0, 549.0, 344.0, 231.0, 139.0, 86.0, 61.0, 40.0, 19.0, 13.0, 7.0, 5.0, 6.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32080078125, -0.30986785888671875, -0.2989349365234375, -0.28800201416015625, -0.277069091796875, -0.26613616943359375, -0.2552032470703125, -0.24427032470703125, -0.23333740234375, -0.22240447998046875, -0.2114715576171875, -0.20053863525390625, -0.189605712890625, -0.17867279052734375, -0.1677398681640625, -0.15680694580078125, -0.1458740234375, -0.13494110107421875, -0.1240081787109375, -0.11307525634765625, -0.102142333984375, -0.09120941162109375, -0.0802764892578125, -0.06934356689453125, -0.05841064453125, -0.04747772216796875, -0.0365447998046875, -0.02561187744140625, -0.014678955078125, -0.00374603271484375, 0.0071868896484375, 0.01811981201171875, 0.029052734375, 0.03998565673828125, 0.0509185791015625, 0.06185150146484375, 0.072784423828125, 0.08371734619140625, 0.0946502685546875, 0.10558319091796875, 0.11651611328125, 0.12744903564453125, 0.1383819580078125, 0.14931488037109375, 0.160247802734375, 0.17118072509765625, 0.1821136474609375, 0.19304656982421875, 0.2039794921875, 0.21491241455078125, 0.2258453369140625, 0.23677825927734375, 0.247711181640625, 0.25864410400390625, 0.2695770263671875, 0.28050994873046875, 0.29144287109375, 0.30237579345703125, 0.3133087158203125, 0.32424163818359375, 0.335174560546875, 0.34610748291015625, 0.3570404052734375, 0.36797332763671875, 0.37890625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 6.0, 13.0, 6.0, 14.0, 12.0, 15.0, 20.0, 32.0, 20.0, 35.0, 36.0, 35.0, 29.0, 46.0, 55.0, 46.0, 55.0, 39.0, 40.0, 50.0, 41.0, 46.0, 28.0, 36.0, 35.0, 33.0, 31.0, 25.0, 16.0, 12.0, 19.0, 15.0, 12.0, 4.0, 3.0, 9.0, 4.0, 5.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.262939453125, -0.2555122375488281, -0.24808502197265625, -0.24065780639648438, -0.2332305908203125, -0.22580337524414062, -0.21837615966796875, -0.21094894409179688, -0.203521728515625, -0.19609451293945312, -0.18866729736328125, -0.18124008178710938, -0.1738128662109375, -0.16638565063476562, -0.15895843505859375, -0.15153121948242188, -0.14410400390625, -0.13667678833007812, -0.12924957275390625, -0.12182235717773438, -0.1143951416015625, -0.10696792602539062, -0.09954071044921875, -0.09211349487304688, -0.084686279296875, -0.07725906372070312, -0.06983184814453125, -0.062404632568359375, -0.0549774169921875, -0.047550201416015625, -0.04012298583984375, -0.032695770263671875, -0.0252685546875, -0.017841339111328125, -0.01041412353515625, -0.002986907958984375, 0.0044403076171875, 0.011867523193359375, 0.01929473876953125, 0.026721954345703125, 0.034149169921875, 0.041576385498046875, 0.04900360107421875, 0.056430816650390625, 0.0638580322265625, 0.07128524780273438, 0.07871246337890625, 0.08613967895507812, 0.09356689453125, 0.10099411010742188, 0.10842132568359375, 0.11584854125976562, 0.1232757568359375, 0.13070297241210938, 0.13813018798828125, 0.14555740356445312, 0.152984619140625, 0.16041183471679688, 0.16783905029296875, 0.17526626586914062, 0.1826934814453125, 0.19012069702148438, 0.19754791259765625, 0.20497512817382812, 0.21240234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 8.0, 5.0, 1.0, 5.0, 6.0, 15.0, 11.0, 9.0, 16.0, 32.0, 25.0, 53.0, 63.0, 96.0, 79.0, 161.0, 200.0, 355.0, 514.0, 724.0, 1218.0, 2096.0, 3596.0, 6940.0, 15485.0, 48224.0, 630725.0, 275434.0, 35656.0, 12573.0, 5971.0, 3070.0, 1838.0, 1083.0, 723.0, 462.0, 320.0, 193.0, 154.0, 96.0, 89.0, 74.0, 40.0, 27.0, 36.0, 14.0, 9.0, 12.0, 10.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.032257080078125, -0.031212806701660156, -0.030168533325195312, -0.02912425994873047, -0.028079986572265625, -0.02703571319580078, -0.025991439819335938, -0.024947166442871094, -0.02390289306640625, -0.022858619689941406, -0.021814346313476562, -0.02077007293701172, -0.019725799560546875, -0.01868152618408203, -0.017637252807617188, -0.016592979431152344, -0.0155487060546875, -0.014504432678222656, -0.013460159301757812, -0.012415885925292969, -0.011371612548828125, -0.010327339172363281, -0.009283065795898438, -0.008238792419433594, -0.00719451904296875, -0.006150245666503906, -0.0051059722900390625, -0.004061698913574219, -0.003017425537109375, -0.0019731521606445312, -0.0009288787841796875, 0.00011539459228515625, 0.00115966796875, 0.0022039413452148438, 0.0032482147216796875, 0.004292488098144531, 0.005336761474609375, 0.006381034851074219, 0.0074253082275390625, 0.008469581604003906, 0.00951385498046875, 0.010558128356933594, 0.011602401733398438, 0.012646675109863281, 0.013690948486328125, 0.014735221862792969, 0.015779495239257812, 0.016823768615722656, 0.0178680419921875, 0.018912315368652344, 0.019956588745117188, 0.02100086212158203, 0.022045135498046875, 0.02308940887451172, 0.024133682250976562, 0.025177955627441406, 0.02622222900390625, 0.027266502380371094, 0.028310775756835938, 0.02935504913330078, 0.030399322509765625, 0.03144359588623047, 0.03248786926269531, 0.033532142639160156, 0.034576416015625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 3.0, 0.0, 3.0, 7.0, 4.0, 10.0, 27.0, 21.0, 15.0, 29.0, 49.0, 68.0, 57.0, 172.0, 102.0, 81.0, 83.0, 76.0, 47.0, 37.0, 44.0, 14.0, 17.0, 9.0, 6.0, 7.0, 0.0, 12.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4354085326194763e-06, -2.3674219846725464e-06, -2.2994354367256165e-06, -2.2314488887786865e-06, -2.1634623408317566e-06, -2.0954757928848267e-06, -2.0274892449378967e-06, -1.959502696990967e-06, -1.8915161490440369e-06, -1.823529601097107e-06, -1.755543053150177e-06, -1.687556505203247e-06, -1.6195699572563171e-06, -1.5515834093093872e-06, -1.4835968613624573e-06, -1.4156103134155273e-06, -1.3476237654685974e-06, -1.2796372175216675e-06, -1.2116506695747375e-06, -1.1436641216278076e-06, -1.0756775736808777e-06, -1.0076910257339478e-06, -9.397044777870178e-07, -8.717179298400879e-07, -8.03731381893158e-07, -7.35744833946228e-07, -6.677582859992981e-07, -5.997717380523682e-07, -5.317851901054382e-07, -4.637986421585083e-07, -3.9581209421157837e-07, -3.2782554626464844e-07, -2.598389983177185e-07, -1.9185245037078857e-07, -1.2386590242385864e-07, -5.587935447692871e-08, 1.210719347000122e-08, 8.009374141693115e-08, 1.4808028936386108e-07, 2.1606683731079102e-07, 2.8405338525772095e-07, 3.520399332046509e-07, 4.200264811515808e-07, 4.880130290985107e-07, 5.559995770454407e-07, 6.239861249923706e-07, 6.919726729393005e-07, 7.599592208862305e-07, 8.279457688331604e-07, 8.959323167800903e-07, 9.639188647270203e-07, 1.0319054126739502e-06, 1.0998919606208801e-06, 1.16787850856781e-06, 1.23586505651474e-06, 1.30385160446167e-06, 1.3718381524085999e-06, 1.4398247003555298e-06, 1.5078112483024597e-06, 1.5757977962493896e-06, 1.6437843441963196e-06, 1.7117708921432495e-06, 1.7797574400901794e-06, 1.8477439880371094e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 11.0, 13.0, 22.0, 26.0, 39.0, 69.0, 74.0, 98.0, 114.0, 150.0, 207.0, 277.0, 425.0, 671.0, 1109.0, 1876.0, 3133.0, 6091.0, 12810.0, 29823.0, 84664.0, 424774.0, 351833.0, 76687.0, 27722.0, 12124.0, 5792.0, 2950.0, 1735.0, 1001.0, 640.0, 447.0, 265.0, 220.0, 175.0, 117.0, 90.0, 47.0, 49.0, 45.0, 26.0, 33.0, 17.0, 14.0, 18.0, 4.0, 3.0, 3.0, 0.0, 5.0, 1.0, 1.0, 3.0], "bins": [-0.032257080078125, -0.031278371810913086, -0.030299663543701172, -0.029320955276489258, -0.028342247009277344, -0.02736353874206543, -0.026384830474853516, -0.0254061222076416, -0.024427413940429688, -0.023448705673217773, -0.02246999740600586, -0.021491289138793945, -0.02051258087158203, -0.019533872604370117, -0.018555164337158203, -0.01757645606994629, -0.016597747802734375, -0.015619039535522461, -0.014640331268310547, -0.013661623001098633, -0.012682914733886719, -0.011704206466674805, -0.01072549819946289, -0.009746789932250977, -0.008768081665039062, -0.0077893733978271484, -0.006810665130615234, -0.00583195686340332, -0.004853248596191406, -0.003874540328979492, -0.002895832061767578, -0.001917123794555664, -0.00093841552734375, 4.029273986816406e-05, 0.0010190010070800781, 0.001997709274291992, 0.0029764175415039062, 0.00395512580871582, 0.004933834075927734, 0.0059125423431396484, 0.0068912506103515625, 0.007869958877563477, 0.00884866714477539, 0.009827375411987305, 0.010806083679199219, 0.011784791946411133, 0.012763500213623047, 0.013742208480834961, 0.014720916748046875, 0.01569962501525879, 0.016678333282470703, 0.017657041549682617, 0.01863574981689453, 0.019614458084106445, 0.02059316635131836, 0.021571874618530273, 0.022550582885742188, 0.0235292911529541, 0.024507999420166016, 0.02548670768737793, 0.026465415954589844, 0.027444124221801758, 0.028422832489013672, 0.029401540756225586, 0.0303802490234375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 15.0, 13.0, 7.0, 18.0, 26.0, 19.0, 25.0, 48.0, 41.0, 41.0, 68.0, 59.0, 90.0, 78.0, 81.0, 51.0, 60.0, 45.0, 36.0, 29.0, 24.0, 25.0, 20.0, 11.0, 11.0, 5.0, 7.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004550933837890625, -0.004394948482513428, -0.0042389631271362305, -0.004082977771759033, -0.003926992416381836, -0.0037710070610046387, -0.0036150217056274414, -0.003459036350250244, -0.003303050994873047, -0.0031470656394958496, -0.0029910802841186523, -0.002835094928741455, -0.002679109573364258, -0.0025231242179870605, -0.0023671388626098633, -0.002211153507232666, -0.0020551681518554688, -0.0018991827964782715, -0.0017431974411010742, -0.001587212085723877, -0.0014312267303466797, -0.0012752413749694824, -0.0011192560195922852, -0.0009632706642150879, -0.0008072853088378906, -0.0006512999534606934, -0.0004953145980834961, -0.00033932924270629883, -0.00018334388732910156, -2.7358531951904297e-05, 0.00012862682342529297, 0.00028461217880249023, 0.0004405975341796875, 0.0005965828895568848, 0.000752568244934082, 0.0009085536003112793, 0.0010645389556884766, 0.0012205243110656738, 0.001376509666442871, 0.0015324950218200684, 0.0016884803771972656, 0.0018444657325744629, 0.00200045108795166, 0.0021564364433288574, 0.0023124217987060547, 0.002468407154083252, 0.0026243925094604492, 0.0027803778648376465, 0.0029363632202148438, 0.003092348575592041, 0.0032483339309692383, 0.0034043192863464355, 0.003560304641723633, 0.00371628999710083, 0.0038722753524780273, 0.004028260707855225, 0.004184246063232422, 0.004340231418609619, 0.004496216773986816, 0.004652202129364014, 0.004808187484741211, 0.004964172840118408, 0.0051201581954956055, 0.005276143550872803, 0.00543212890625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 5.0, 11.0, 5.0, 21.0, 25.0, 23.0, 33.0, 41.0, 47.0, 60.0, 75.0, 98.0, 95.0, 79.0, 57.0, 62.0, 45.0, 48.0, 29.0, 24.0, 21.0, 14.0, 13.0, 9.0, 12.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3944133222103119, -0.3800172805786133, -0.3656212091445923, -0.3512251675128937, -0.3368290960788727, -0.3224330544471741, -0.3080369830131531, -0.29364094138145447, -0.27924489974975586, -0.26484885811805725, -0.25045278668403625, -0.23605674505233765, -0.22166067361831665, -0.20726463198661804, -0.19286857545375824, -0.17847251892089844, -0.16407644748687744, -0.14968039095401764, -0.13528433442115784, -0.12088828533887863, -0.10649222880601883, -0.09209617227315903, -0.07770012319087982, -0.06330406665802002, -0.04890801012516022, -0.034511953592300415, -0.02011590078473091, -0.0057198479771614075, 0.008676208555698395, 0.023072265088558197, 0.0374683141708374, 0.051864370703697205, 0.06626039743423462, 0.08065645396709442, 0.09505251049995422, 0.10944855958223343, 0.12384461611509323, 0.13824066519737244, 0.15263672173023224, 0.16703277826309204, 0.18142883479595184, 0.19582489132881165, 0.21022094786167145, 0.22461700439453125, 0.23901304602622986, 0.25340911746025085, 0.26780515909194946, 0.28220123052597046, 0.29659727215766907, 0.3109933137893677, 0.32538938522338867, 0.3397854268550873, 0.3541814982891083, 0.3685775399208069, 0.3829736113548279, 0.3973696529865265, 0.4117656946182251, 0.4261617362499237, 0.4405578076839447, 0.4549538493156433, 0.4693499207496643, 0.4837459623813629, 0.4981420040130615, 0.5125380754470825, 0.5269341468811035]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 4.0, 6.0, 7.0, 9.0, 5.0, 5.0, 20.0, 16.0, 13.0, 19.0, 14.0, 32.0, 39.0, 25.0, 34.0, 35.0, 31.0, 29.0, 39.0, 42.0, 31.0, 41.0, 31.0, 44.0, 37.0, 39.0, 36.0, 48.0, 33.0, 32.0, 26.0, 24.0, 27.0, 14.0, 18.0, 13.0, 11.0, 13.0, 10.0, 11.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3117205798625946, -0.3021451234817505, -0.292569637298584, -0.28299418091773987, -0.27341872453689575, -0.26384326815605164, -0.2542678117752075, -0.24469232559204102, -0.2351168692111969, -0.22554141283035278, -0.21596594154834747, -0.20639047026634216, -0.19681501388549805, -0.18723955750465393, -0.17766408622264862, -0.1680886149406433, -0.1585131585597992, -0.14893770217895508, -0.13936223089694977, -0.12978675961494446, -0.12021130323410034, -0.11063583940267563, -0.10106037557125092, -0.0914849117398262, -0.08190944790840149, -0.07233398407697678, -0.06275852024555206, -0.05318305641412735, -0.04360759258270264, -0.034032128751277924, -0.02445666491985321, -0.014881201088428497, -0.005305737257003784, 0.004269726574420929, 0.013845190405845642, 0.023420654237270355, 0.03299611806869507, 0.04257158190011978, 0.052147045731544495, 0.06172250956296921, 0.07129797339439392, 0.08087343722581863, 0.09044890105724335, 0.10002436488866806, 0.10959982872009277, 0.11917529255151749, 0.1287507563829422, 0.1383262276649475, 0.14790168404579163, 0.15747714042663574, 0.16705261170864105, 0.17662808299064636, 0.18620353937149048, 0.1957789957523346, 0.2053544670343399, 0.21492993831634521, 0.22450539469718933, 0.23408085107803345, 0.24365632236003876, 0.25323179364204407, 0.2628072500228882, 0.2723827064037323, 0.2819581627845764, 0.2915336489677429, 0.30110910534858704]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 9.0, 15.0, 31.0, 36.0, 67.0, 89.0, 99.0, 149.0, 260.0, 337.0, 507.0, 671.0, 975.0, 1379.0, 2013.0, 2784.0, 4035.0, 6027.0, 8979.0, 13399.0, 19937.0, 31886.0, 51370.0, 86895.0, 156736.0, 247326.0, 168268.0, 92357.0, 53754.0, 33380.0, 21390.0, 13926.0, 9259.0, 6265.0, 4266.0, 2922.0, 1968.0, 1391.0, 1018.0, 715.0, 508.0, 340.0, 257.0, 173.0, 117.0, 92.0, 61.0, 43.0, 25.0, 15.0, 14.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.5458984375, -0.5291290283203125, -0.512359619140625, -0.4955902099609375, -0.47882080078125, -0.4620513916015625, -0.445281982421875, -0.4285125732421875, -0.4117431640625, -0.3949737548828125, -0.378204345703125, -0.3614349365234375, -0.34466552734375, -0.3278961181640625, -0.311126708984375, -0.2943572998046875, -0.277587890625, -0.2608184814453125, -0.244049072265625, -0.2272796630859375, -0.21051025390625, -0.1937408447265625, -0.176971435546875, -0.1602020263671875, -0.1434326171875, -0.1266632080078125, -0.109893798828125, -0.0931243896484375, -0.07635498046875, -0.0595855712890625, -0.042816162109375, -0.0260467529296875, -0.00927734375, 0.0074920654296875, 0.024261474609375, 0.0410308837890625, 0.05780029296875, 0.0745697021484375, 0.091339111328125, 0.1081085205078125, 0.1248779296875, 0.1416473388671875, 0.158416748046875, 0.1751861572265625, 0.19195556640625, 0.2087249755859375, 0.225494384765625, 0.2422637939453125, 0.259033203125, 0.2758026123046875, 0.292572021484375, 0.3093414306640625, 0.32611083984375, 0.3428802490234375, 0.359649658203125, 0.3764190673828125, 0.3931884765625, 0.4099578857421875, 0.426727294921875, 0.4434967041015625, 0.46026611328125, 0.4770355224609375, 0.493804931640625, 0.5105743408203125, 0.52734375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 7.0, 4.0, 3.0, 9.0, 17.0, 17.0, 18.0, 10.0, 12.0, 22.0, 31.0, 41.0, 22.0, 25.0, 33.0, 38.0, 37.0, 33.0, 46.0, 35.0, 38.0, 30.0, 45.0, 43.0, 38.0, 43.0, 40.0, 32.0, 24.0, 27.0, 20.0, 24.0, 24.0, 15.0, 14.0, 10.0, 7.0, 10.0, 4.0, 11.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.289794921875, -0.28133392333984375, -0.2728729248046875, -0.26441192626953125, -0.255950927734375, -0.24748992919921875, -0.2390289306640625, -0.23056793212890625, -0.22210693359375, -0.21364593505859375, -0.2051849365234375, -0.19672393798828125, -0.188262939453125, -0.17980194091796875, -0.1713409423828125, -0.16287994384765625, -0.1544189453125, -0.14595794677734375, -0.1374969482421875, -0.12903594970703125, -0.120574951171875, -0.11211395263671875, -0.1036529541015625, -0.09519195556640625, -0.08673095703125, -0.07826995849609375, -0.0698089599609375, -0.06134796142578125, -0.052886962890625, -0.04442596435546875, -0.0359649658203125, -0.02750396728515625, -0.01904296875, -0.01058197021484375, -0.0021209716796875, 0.00634002685546875, 0.014801025390625, 0.02326202392578125, 0.0317230224609375, 0.04018402099609375, 0.04864501953125, 0.05710601806640625, 0.0655670166015625, 0.07402801513671875, 0.082489013671875, 0.09095001220703125, 0.0994110107421875, 0.10787200927734375, 0.1163330078125, 0.12479400634765625, 0.1332550048828125, 0.14171600341796875, 0.150177001953125, 0.15863800048828125, 0.1670989990234375, 0.17555999755859375, 0.18402099609375, 0.19248199462890625, 0.2009429931640625, 0.20940399169921875, 0.217864990234375, 0.22632598876953125, 0.2347869873046875, 0.24324798583984375, 0.251708984375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 10.0, 11.0, 13.0, 25.0, 28.0, 37.0, 74.0, 104.0, 152.0, 205.0, 247.0, 328.0, 555.0, 706.0, 1041.0, 1419.0, 1983.0, 2953.0, 3982.0, 5682.0, 8456.0, 12713.0, 18773.0, 29455.0, 45960.0, 74604.0, 121552.0, 208951.0, 195863.0, 114255.0, 70130.0, 43609.0, 27779.0, 18248.0, 11862.0, 8086.0, 5596.0, 3771.0, 2696.0, 1943.0, 1327.0, 1004.0, 665.0, 485.0, 387.0, 265.0, 185.0, 121.0, 89.0, 50.0, 37.0, 36.0, 16.0, 18.0, 12.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.50439453125, -0.4886016845703125, -0.472808837890625, -0.4570159912109375, -0.44122314453125, -0.4254302978515625, -0.409637451171875, -0.3938446044921875, -0.3780517578125, -0.3622589111328125, -0.346466064453125, -0.3306732177734375, -0.31488037109375, -0.2990875244140625, -0.283294677734375, -0.2675018310546875, -0.251708984375, -0.2359161376953125, -0.220123291015625, -0.2043304443359375, -0.18853759765625, -0.1727447509765625, -0.156951904296875, -0.1411590576171875, -0.1253662109375, -0.1095733642578125, -0.093780517578125, -0.0779876708984375, -0.06219482421875, -0.0464019775390625, -0.030609130859375, -0.0148162841796875, 0.0009765625, 0.0167694091796875, 0.032562255859375, 0.0483551025390625, 0.06414794921875, 0.0799407958984375, 0.095733642578125, 0.1115264892578125, 0.1273193359375, 0.1431121826171875, 0.158905029296875, 0.1746978759765625, 0.19049072265625, 0.2062835693359375, 0.222076416015625, 0.2378692626953125, 0.253662109375, 0.2694549560546875, 0.285247802734375, 0.3010406494140625, 0.31683349609375, 0.3326263427734375, 0.348419189453125, 0.3642120361328125, 0.3800048828125, 0.3957977294921875, 0.411590576171875, 0.4273834228515625, 0.44317626953125, 0.4589691162109375, 0.474761962890625, 0.4905548095703125, 0.50634765625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 5.0, 4.0, 5.0, 8.0, 4.0, 14.0, 19.0, 17.0, 21.0, 20.0, 37.0, 24.0, 28.0, 32.0, 38.0, 35.0, 45.0, 40.0, 41.0, 29.0, 41.0, 23.0, 38.0, 32.0, 27.0, 37.0, 43.0, 36.0, 34.0, 25.0, 35.0, 25.0, 17.0, 15.0, 21.0, 19.0, 11.0, 10.0, 7.0, 6.0, 14.0, 8.0, 3.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.19580078125, -0.19012451171875, -0.1844482421875, -0.17877197265625, -0.173095703125, -0.16741943359375, -0.1617431640625, -0.15606689453125, -0.150390625, -0.14471435546875, -0.1390380859375, -0.13336181640625, -0.127685546875, -0.12200927734375, -0.1163330078125, -0.11065673828125, -0.10498046875, -0.09930419921875, -0.0936279296875, -0.08795166015625, -0.082275390625, -0.07659912109375, -0.0709228515625, -0.06524658203125, -0.0595703125, -0.05389404296875, -0.0482177734375, -0.04254150390625, -0.036865234375, -0.03118896484375, -0.0255126953125, -0.01983642578125, -0.01416015625, -0.00848388671875, -0.0028076171875, 0.00286865234375, 0.008544921875, 0.01422119140625, 0.0198974609375, 0.02557373046875, 0.03125, 0.03692626953125, 0.0426025390625, 0.04827880859375, 0.053955078125, 0.05963134765625, 0.0653076171875, 0.07098388671875, 0.07666015625, 0.08233642578125, 0.0880126953125, 0.09368896484375, 0.099365234375, 0.10504150390625, 0.1107177734375, 0.11639404296875, 0.1220703125, 0.12774658203125, 0.1334228515625, 0.13909912109375, 0.144775390625, 0.15045166015625, 0.1561279296875, 0.16180419921875, 0.16748046875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 8.0, 11.0, 18.0, 27.0, 36.0, 49.0, 59.0, 75.0, 95.0, 150.0, 189.0, 269.0, 343.0, 497.0, 647.0, 961.0, 1322.0, 2078.0, 3387.0, 5706.0, 10186.0, 24482.0, 200317.0, 735597.0, 32601.0, 11855.0, 6432.0, 3727.0, 2344.0, 1456.0, 1006.0, 680.0, 511.0, 373.0, 249.0, 197.0, 168.0, 126.0, 94.0, 59.0, 47.0, 36.0, 23.0, 24.0, 12.0, 8.0, 5.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.16796875, -0.16304397583007812, -0.15811920166015625, -0.15319442749023438, -0.1482696533203125, -0.14334487915039062, -0.13842010498046875, -0.13349533081054688, -0.128570556640625, -0.12364578247070312, -0.11872100830078125, -0.11379623413085938, -0.1088714599609375, -0.10394668579101562, -0.09902191162109375, -0.09409713745117188, -0.08917236328125, -0.08424758911132812, -0.07932281494140625, -0.07439804077148438, -0.0694732666015625, -0.06454849243164062, -0.05962371826171875, -0.054698944091796875, -0.049774169921875, -0.044849395751953125, -0.03992462158203125, -0.034999847412109375, -0.0300750732421875, -0.025150299072265625, -0.02022552490234375, -0.015300750732421875, -0.0103759765625, -0.005451202392578125, -0.00052642822265625, 0.004398345947265625, 0.0093231201171875, 0.014247894287109375, 0.01917266845703125, 0.024097442626953125, 0.029022216796875, 0.033946990966796875, 0.03887176513671875, 0.043796539306640625, 0.0487213134765625, 0.053646087646484375, 0.05857086181640625, 0.06349563598632812, 0.06842041015625, 0.07334518432617188, 0.07826995849609375, 0.08319473266601562, 0.0881195068359375, 0.09304428100585938, 0.09796905517578125, 0.10289382934570312, 0.107818603515625, 0.11274337768554688, 0.11766815185546875, 0.12259292602539062, 0.1275177001953125, 0.13244247436523438, 0.13736724853515625, 0.14229202270507812, 0.147216796875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 10.0, 13.0, 22.0, 63.0, 240.0, 336.0, 181.0, 63.0, 20.0, 12.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3909759521484375e-06, -7.1106478571891785e-06, -6.8303197622299194e-06, -6.54999166727066e-06, -6.269663572311401e-06, -5.989335477352142e-06, -5.709007382392883e-06, -5.428679287433624e-06, -5.148351192474365e-06, -4.868023097515106e-06, -4.587695002555847e-06, -4.307366907596588e-06, -4.027038812637329e-06, -3.74671071767807e-06, -3.466382622718811e-06, -3.186054527759552e-06, -2.905726432800293e-06, -2.625398337841034e-06, -2.345070242881775e-06, -2.064742147922516e-06, -1.7844140529632568e-06, -1.5040859580039978e-06, -1.2237578630447388e-06, -9.434297680854797e-07, -6.631016731262207e-07, -3.8277357816696167e-07, -1.0244548320770264e-07, 1.778826117515564e-07, 4.5821070671081543e-07, 7.385388016700745e-07, 1.0188668966293335e-06, 1.2991949915885925e-06, 1.5795230865478516e-06, 1.8598511815071106e-06, 2.1401792764663696e-06, 2.4205073714256287e-06, 2.7008354663848877e-06, 2.9811635613441467e-06, 3.2614916563034058e-06, 3.541819751262665e-06, 3.822147846221924e-06, 4.102475941181183e-06, 4.382804036140442e-06, 4.663132131099701e-06, 4.94346022605896e-06, 5.223788321018219e-06, 5.504116415977478e-06, 5.784444510936737e-06, 6.064772605895996e-06, 6.345100700855255e-06, 6.625428795814514e-06, 6.905756890773773e-06, 7.186084985733032e-06, 7.466413080692291e-06, 7.74674117565155e-06, 8.02706927061081e-06, 8.307397365570068e-06, 8.587725460529327e-06, 8.868053555488586e-06, 9.148381650447845e-06, 9.428709745407104e-06, 9.709037840366364e-06, 9.989365935325623e-06, 1.0269694030284882e-05, 1.055002212524414e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 18.0, 15.0, 20.0, 35.0, 44.0, 63.0, 83.0, 129.0, 173.0, 257.0, 381.0, 557.0, 804.0, 1159.0, 1949.0, 3045.0, 5226.0, 9927.0, 23532.0, 110721.0, 805117.0, 50206.0, 15976.0, 7609.0, 4193.0, 2514.0, 1561.0, 994.0, 671.0, 509.0, 307.0, 240.0, 155.0, 98.0, 69.0, 61.0, 40.0, 29.0, 15.0, 11.0, 10.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1739501953125, -0.16887855529785156, -0.16380691528320312, -0.1587352752685547, -0.15366363525390625, -0.1485919952392578, -0.14352035522460938, -0.13844871520996094, -0.1333770751953125, -0.12830543518066406, -0.12323379516601562, -0.11816215515136719, -0.11309051513671875, -0.10801887512207031, -0.10294723510742188, -0.09787559509277344, -0.092803955078125, -0.08773231506347656, -0.08266067504882812, -0.07758903503417969, -0.07251739501953125, -0.06744575500488281, -0.062374114990234375, -0.05730247497558594, -0.0522308349609375, -0.04715919494628906, -0.042087554931640625, -0.03701591491699219, -0.03194427490234375, -0.026872634887695312, -0.021800994873046875, -0.016729354858398438, -0.01165771484375, -0.0065860748291015625, -0.001514434814453125, 0.0035572052001953125, 0.00862884521484375, 0.013700485229492188, 0.018772125244140625, 0.023843765258789062, 0.0289154052734375, 0.03398704528808594, 0.039058685302734375, 0.04413032531738281, 0.04920196533203125, 0.05427360534667969, 0.059345245361328125, 0.06441688537597656, 0.069488525390625, 0.07456016540527344, 0.07963180541992188, 0.08470344543457031, 0.08977508544921875, 0.09484672546386719, 0.09991836547851562, 0.10499000549316406, 0.1100616455078125, 0.11513328552246094, 0.12020492553710938, 0.1252765655517578, 0.13034820556640625, 0.1354198455810547, 0.14049148559570312, 0.14556312561035156, 0.150634765625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 5.0, 7.0, 7.0, 6.0, 17.0, 16.0, 36.0, 67.0, 164.0, 421.0, 96.0, 46.0, 28.0, 12.0, 13.0, 14.0, 8.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038970947265625, -0.03754091262817383, -0.036110877990722656, -0.034680843353271484, -0.03325080871582031, -0.03182077407836914, -0.03039073944091797, -0.028960704803466797, -0.027530670166015625, -0.026100635528564453, -0.02467060089111328, -0.02324056625366211, -0.021810531616210938, -0.020380496978759766, -0.018950462341308594, -0.017520427703857422, -0.01609039306640625, -0.014660358428955078, -0.013230323791503906, -0.011800289154052734, -0.010370254516601562, -0.00894021987915039, -0.007510185241699219, -0.006080150604248047, -0.004650115966796875, -0.003220081329345703, -0.0017900466918945312, -0.0003600120544433594, 0.0010700225830078125, 0.0025000572204589844, 0.003930091857910156, 0.005360126495361328, 0.0067901611328125, 0.008220195770263672, 0.009650230407714844, 0.011080265045166016, 0.012510299682617188, 0.01394033432006836, 0.015370368957519531, 0.016800403594970703, 0.018230438232421875, 0.019660472869873047, 0.02109050750732422, 0.02252054214477539, 0.023950576782226562, 0.025380611419677734, 0.026810646057128906, 0.028240680694580078, 0.02967071533203125, 0.031100749969482422, 0.032530784606933594, 0.033960819244384766, 0.03539085388183594, 0.03682088851928711, 0.03825092315673828, 0.03968095779418945, 0.041110992431640625, 0.0425410270690918, 0.04397106170654297, 0.04540109634399414, 0.04683113098144531, 0.048261165618896484, 0.049691200256347656, 0.05112123489379883, 0.05255126953125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 4.0, 8.0, 15.0, 19.0, 17.0, 32.0, 45.0, 41.0, 54.0, 58.0, 88.0, 109.0, 103.0, 72.0, 80.0, 55.0, 36.0, 34.0, 18.0, 23.0, 14.0, 8.0, 15.0, 6.0, 8.0, 3.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.483429491519928, -0.46918609738349915, -0.4549426734447479, -0.4406992793083191, -0.42645585536956787, -0.41221246123313904, -0.3979690372943878, -0.383725643157959, -0.36948221921920776, -0.35523882508277893, -0.3409954011440277, -0.3267520070075989, -0.31250858306884766, -0.2982651889324188, -0.2840217649936676, -0.26977837085723877, -0.25553494691848755, -0.24129153788089752, -0.2270481288433075, -0.21280471980571747, -0.19856131076812744, -0.1843179166316986, -0.1700744926929474, -0.15583109855651855, -0.14158770442008972, -0.1273442953824997, -0.11310088634490967, -0.09885747730731964, -0.08461406826972961, -0.07037066668272018, -0.05612725764513016, -0.04188384860754013, -0.027640432119369507, -0.013397024013102055, 0.0008463840931653976, 0.015089791268110275, 0.029333200305700302, 0.04357660561800003, 0.05782001465559006, 0.07206342369318008, 0.08630683273077011, 0.10055024176836014, 0.11479365080595016, 0.1290370523929596, 0.14328046143054962, 0.15752387046813965, 0.17176727950572968, 0.1860106885433197, 0.20025409758090973, 0.21449750661849976, 0.22874091565608978, 0.2429843246936798, 0.25722771883010864, 0.27147114276885986, 0.2857145369052887, 0.2999579608440399, 0.31420135498046875, 0.3284447491168976, 0.3426881730556488, 0.35693156719207764, 0.37117499113082886, 0.3854183852672577, 0.3996618092060089, 0.41390520334243774, 0.42814862728118896]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 3.0, 12.0, 11.0, 7.0, 14.0, 16.0, 10.0, 19.0, 13.0, 17.0, 19.0, 21.0, 34.0, 34.0, 40.0, 34.0, 29.0, 40.0, 38.0, 37.0, 39.0, 46.0, 44.0, 30.0, 43.0, 37.0, 40.0, 25.0, 28.0, 33.0, 23.0, 26.0, 22.0, 17.0, 7.0, 15.0, 13.0, 10.0, 11.0, 8.0, 6.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2655802369117737, -0.2566578984260559, -0.24773554503917694, -0.23881320655345917, -0.2298908531665802, -0.22096851468086243, -0.21204617619514465, -0.20312383770942688, -0.1942014843225479, -0.18527914583683014, -0.17635679244995117, -0.1674344539642334, -0.15851211547851562, -0.14958976209163666, -0.14066742360591888, -0.13174507021903992, -0.12282273173332214, -0.11390038579702377, -0.1049780398607254, -0.09605570137500763, -0.08713335543870926, -0.07821100950241089, -0.06928867101669312, -0.060366325080394745, -0.051443979144096375, -0.042521633207798004, -0.03359929099678993, -0.02467694692313671, -0.01575460284948349, -0.00683225691318512, 0.0020900852978229523, 0.011012427508831024, 0.019934773445129395, 0.028857117518782616, 0.03777946159243584, 0.04670180380344391, 0.05562414973974228, 0.06454649567604065, 0.07346883416175842, 0.0823911800980568, 0.09131352603435516, 0.10023587197065353, 0.1091582179069519, 0.11808055639266968, 0.12700289487838745, 0.13592524826526642, 0.1448475867509842, 0.15376994013786316, 0.16269227862358093, 0.1716146171092987, 0.18053697049617767, 0.18945930898189545, 0.19838166236877441, 0.2073040008544922, 0.21622633934020996, 0.22514867782592773, 0.2340710312128067, 0.24299336969852448, 0.25191572308540344, 0.2608380615711212, 0.269760400056839, 0.27868276834487915, 0.2876051068305969, 0.2965274453163147, 0.30544978380203247]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 8.0, 8.0, 11.0, 13.0, 32.0, 33.0, 63.0, 92.0, 141.0, 246.0, 390.0, 612.0, 919.0, 1518.0, 2320.0, 3680.0, 5761.0, 9368.0, 15275.0, 25670.0, 43602.0, 77197.0, 150713.0, 364201.0, 1332599.0, 1420079.0, 379576.0, 157903.0, 82369.0, 46809.0, 27651.0, 16735.0, 10460.0, 6623.0, 4280.0, 2590.0, 1731.0, 1083.0, 740.0, 428.0, 293.0, 153.0, 113.0, 66.0, 55.0, 21.0, 23.0, 13.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.435546875, -0.42236328125, -0.4091796875, -0.39599609375, -0.3828125, -0.36962890625, -0.3564453125, -0.34326171875, -0.330078125, -0.31689453125, -0.3037109375, -0.29052734375, -0.27734375, -0.26416015625, -0.2509765625, -0.23779296875, -0.224609375, -0.21142578125, -0.1982421875, -0.18505859375, -0.171875, -0.15869140625, -0.1455078125, -0.13232421875, -0.119140625, -0.10595703125, -0.0927734375, -0.07958984375, -0.06640625, -0.05322265625, -0.0400390625, -0.02685546875, -0.013671875, -0.00048828125, 0.0126953125, 0.02587890625, 0.0390625, 0.05224609375, 0.0654296875, 0.07861328125, 0.091796875, 0.10498046875, 0.1181640625, 0.13134765625, 0.14453125, 0.15771484375, 0.1708984375, 0.18408203125, 0.197265625, 0.21044921875, 0.2236328125, 0.23681640625, 0.25, 0.26318359375, 0.2763671875, 0.28955078125, 0.302734375, 0.31591796875, 0.3291015625, 0.34228515625, 0.35546875, 0.36865234375, 0.3818359375, 0.39501953125, 0.408203125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 6.0, 6.0, 8.0, 11.0, 13.0, 15.0, 20.0, 17.0, 16.0, 16.0, 22.0, 41.0, 28.0, 37.0, 31.0, 30.0, 44.0, 45.0, 37.0, 42.0, 39.0, 43.0, 36.0, 42.0, 35.0, 35.0, 34.0, 26.0, 35.0, 24.0, 20.0, 20.0, 14.0, 17.0, 15.0, 7.0, 12.0, 9.0, 9.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.16015625, -0.1547832489013672, -0.14941024780273438, -0.14403724670410156, -0.13866424560546875, -0.13329124450683594, -0.12791824340820312, -0.12254524230957031, -0.1171722412109375, -0.11179924011230469, -0.10642623901367188, -0.10105323791503906, -0.09568023681640625, -0.09030723571777344, -0.08493423461914062, -0.07956123352050781, -0.074188232421875, -0.06881523132324219, -0.06344223022460938, -0.05806922912597656, -0.05269622802734375, -0.04732322692871094, -0.041950225830078125, -0.03657722473144531, -0.0312042236328125, -0.025831222534179688, -0.020458221435546875, -0.015085220336914062, -0.00971221923828125, -0.0043392181396484375, 0.001033782958984375, 0.0064067840576171875, 0.01177978515625, 0.017152786254882812, 0.022525787353515625, 0.027898788452148438, 0.03327178955078125, 0.03864479064941406, 0.044017791748046875, 0.04939079284667969, 0.0547637939453125, 0.06013679504394531, 0.06550979614257812, 0.07088279724121094, 0.07625579833984375, 0.08162879943847656, 0.08700180053710938, 0.09237480163574219, 0.097747802734375, 0.10312080383300781, 0.10849380493164062, 0.11386680603027344, 0.11923980712890625, 0.12461280822753906, 0.12998580932617188, 0.1353588104248047, 0.1407318115234375, 0.1461048126220703, 0.15147781372070312, 0.15685081481933594, 0.16222381591796875, 0.16759681701660156, 0.17296981811523438, 0.1783428192138672, 0.1837158203125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 7.0, 9.0, 14.0, 14.0, 32.0, 44.0, 66.0, 97.0, 139.0, 233.0, 292.0, 488.0, 717.0, 1063.0, 1503.0, 2335.0, 3659.0, 5644.0, 8469.0, 13648.0, 21430.0, 34786.0, 58319.0, 100834.0, 182678.0, 363169.0, 860958.0, 1353386.0, 573142.0, 264982.0, 139396.0, 78829.0, 46173.0, 28446.0, 17702.0, 10980.0, 7057.0, 4500.0, 3069.0, 2030.0, 1289.0, 879.0, 562.0, 378.0, 300.0, 190.0, 107.0, 86.0, 54.0, 44.0, 23.0, 26.0, 9.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.268798828125, -0.2599220275878906, -0.25104522705078125, -0.24216842651367188, -0.2332916259765625, -0.22441482543945312, -0.21553802490234375, -0.20666122436523438, -0.197784423828125, -0.18890762329101562, -0.18003082275390625, -0.17115402221679688, -0.1622772216796875, -0.15340042114257812, -0.14452362060546875, -0.13564682006835938, -0.12677001953125, -0.11789321899414062, -0.10901641845703125, -0.10013961791992188, -0.0912628173828125, -0.08238601684570312, -0.07350921630859375, -0.06463241577148438, -0.055755615234375, -0.046878814697265625, -0.03800201416015625, -0.029125213623046875, -0.0202484130859375, -0.011371612548828125, -0.00249481201171875, 0.006381988525390625, 0.0152587890625, 0.024135589599609375, 0.03301239013671875, 0.041889190673828125, 0.0507659912109375, 0.059642791748046875, 0.06851959228515625, 0.07739639282226562, 0.086273193359375, 0.09514999389648438, 0.10402679443359375, 0.11290359497070312, 0.1217803955078125, 0.13065719604492188, 0.13953399658203125, 0.14841079711914062, 0.15728759765625, 0.16616439819335938, 0.17504119873046875, 0.18391799926757812, 0.1927947998046875, 0.20167160034179688, 0.21054840087890625, 0.21942520141601562, 0.228302001953125, 0.23717880249023438, 0.24605560302734375, 0.2549324035644531, 0.2638092041015625, 0.2726860046386719, 0.28156280517578125, 0.2904396057128906, 0.29931640625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 15.0, 10.0, 11.0, 19.0, 28.0, 31.0, 36.0, 43.0, 50.0, 61.0, 86.0, 100.0, 124.0, 126.0, 164.0, 192.0, 240.0, 258.0, 316.0, 305.0, 274.0, 263.0, 225.0, 178.0, 181.0, 138.0, 117.0, 91.0, 89.0, 69.0, 57.0, 39.0, 32.0, 25.0, 18.0, 16.0, 12.0, 11.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.11798095703125, -0.11475372314453125, -0.1115264892578125, -0.10829925537109375, -0.105072021484375, -0.10184478759765625, -0.0986175537109375, -0.09539031982421875, -0.0921630859375, -0.08893585205078125, -0.0857086181640625, -0.08248138427734375, -0.079254150390625, -0.07602691650390625, -0.0727996826171875, -0.06957244873046875, -0.06634521484375, -0.06311798095703125, -0.0598907470703125, -0.05666351318359375, -0.053436279296875, -0.05020904541015625, -0.0469818115234375, -0.04375457763671875, -0.04052734375, -0.03730010986328125, -0.0340728759765625, -0.03084564208984375, -0.027618408203125, -0.02439117431640625, -0.0211639404296875, -0.01793670654296875, -0.01470947265625, -0.01148223876953125, -0.0082550048828125, -0.00502777099609375, -0.001800537109375, 0.00142669677734375, 0.0046539306640625, 0.00788116455078125, 0.0111083984375, 0.01433563232421875, 0.0175628662109375, 0.02079010009765625, 0.024017333984375, 0.02724456787109375, 0.0304718017578125, 0.03369903564453125, 0.03692626953125, 0.04015350341796875, 0.0433807373046875, 0.04660797119140625, 0.049835205078125, 0.05306243896484375, 0.0562896728515625, 0.05951690673828125, 0.062744140625, 0.06597137451171875, 0.0691986083984375, 0.07242584228515625, 0.075653076171875, 0.07888031005859375, 0.0821075439453125, 0.08533477783203125, 0.08856201171875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 5.0, 10.0, 8.0, 9.0, 11.0, 16.0, 18.0, 30.0, 29.0, 41.0, 71.0, 56.0, 76.0, 98.0, 102.0, 85.0, 68.0, 53.0, 45.0, 37.0, 29.0, 21.0, 16.0, 9.0, 12.0, 10.0, 9.0, 7.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.26908209919929504, -0.25990164279937744, -0.25072118639945984, -0.24154074490070343, -0.23236030340194702, -0.22317984700202942, -0.21399939060211182, -0.2048189342021942, -0.1956384927034378, -0.1864580363035202, -0.1772775948047638, -0.1680971384048462, -0.1589166820049286, -0.14973624050617218, -0.14055578410625458, -0.13137534260749817, -0.12219488620758057, -0.11301443725824356, -0.10383398830890656, -0.09465353190898895, -0.08547308295965195, -0.07629263401031494, -0.06711217761039734, -0.05793172866106033, -0.04875127971172333, -0.03957083076238632, -0.030390378087759018, -0.021209927275776863, -0.012029476463794708, -0.0028490275144577026, 0.0063314251601696014, 0.015511877834796906, 0.024692296981811523, 0.03387274593114853, 0.04305319860577583, 0.05223365128040314, 0.06141410022974014, 0.07059454917907715, 0.07977500557899475, 0.08895545452833176, 0.09813590347766876, 0.10731635242700577, 0.11649680137634277, 0.12567725777626038, 0.13485771417617798, 0.1440381556749344, 0.153218612074852, 0.1623990535736084, 0.171579509973526, 0.1807599663734436, 0.1899404078722, 0.19912086427211761, 0.20830130577087402, 0.21748176217079163, 0.22666221857070923, 0.23584267497062683, 0.24502311646938324, 0.25420355796813965, 0.26338401436805725, 0.27256447076797485, 0.28174492716789246, 0.29092538356781006, 0.3001058101654053, 0.3092862665653229, 0.3184667229652405]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 8.0, 7.0, 2.0, 10.0, 9.0, 7.0, 14.0, 11.0, 27.0, 22.0, 16.0, 23.0, 32.0, 22.0, 35.0, 29.0, 31.0, 42.0, 37.0, 35.0, 37.0, 46.0, 47.0, 35.0, 43.0, 39.0, 38.0, 26.0, 33.0, 33.0, 25.0, 27.0, 19.0, 27.0, 19.0, 16.0, 11.0, 8.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.18095916509628296, -0.1750214397907257, -0.16908372938632965, -0.1631460040807724, -0.15720829367637634, -0.1512705683708191, -0.14533284306526184, -0.13939513266086578, -0.13345742225646973, -0.12751969695091248, -0.12158198654651642, -0.11564426124095917, -0.10970655083656311, -0.10376882553100586, -0.0978311076760292, -0.09189338982105255, -0.0859556645154953, -0.08001794666051865, -0.07408022880554199, -0.06814250349998474, -0.062204789370298386, -0.05626707151532173, -0.05032934993505478, -0.044391632080078125, -0.03845391422510147, -0.03251619637012482, -0.026578476652503014, -0.02064075693488121, -0.014703039079904556, -0.008765321224927902, -0.0028275996446609497, 0.0031101182103157043, 0.009047836065292358, 0.014985554851591587, 0.020923273637890816, 0.02686099335551262, 0.03279871121048927, 0.03873642906546593, 0.04467415064573288, 0.050611868500709534, 0.05654958635568619, 0.06248730421066284, 0.0684250220656395, 0.07436273992061615, 0.0803004652261734, 0.08623817563056946, 0.09217590093612671, 0.09811361879110336, 0.10405133664608002, 0.10998905450105667, 0.11592677235603333, 0.12186449766159058, 0.12780220806598663, 0.13373993337154388, 0.13967764377593994, 0.1456153690814972, 0.15155309438705444, 0.1574908196926117, 0.16342853009700775, 0.169366255402565, 0.17530396580696106, 0.1812416911125183, 0.18717941641807556, 0.19311712682247162, 0.19905483722686768]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 8.0, 12.0, 16.0, 28.0, 37.0, 68.0, 96.0, 162.0, 215.0, 373.0, 560.0, 951.0, 1379.0, 2167.0, 3310.0, 4963.0, 8021.0, 12609.0, 19973.0, 32739.0, 54652.0, 96429.0, 183490.0, 272100.0, 150001.0, 81301.0, 46859.0, 28109.0, 17364.0, 10909.0, 7050.0, 4332.0, 2889.0, 1864.0, 1299.0, 785.0, 533.0, 325.0, 196.0, 133.0, 110.0, 62.0, 26.0, 29.0, 11.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10037517547607422, -0.09717369079589844, -0.09397220611572266, -0.09077072143554688, -0.0875692367553711, -0.08436775207519531, -0.08116626739501953, -0.07796478271484375, -0.07476329803466797, -0.07156181335449219, -0.0683603286743164, -0.06515884399414062, -0.061957359313964844, -0.05875587463378906, -0.05555438995361328, -0.0523529052734375, -0.04915142059326172, -0.04594993591308594, -0.042748451232910156, -0.039546966552734375, -0.036345481872558594, -0.03314399719238281, -0.02994251251220703, -0.02674102783203125, -0.02353954315185547, -0.020338058471679688, -0.017136573791503906, -0.013935089111328125, -0.010733604431152344, -0.0075321197509765625, -0.004330635070800781, -0.001129150390625, 0.0020723342895507812, 0.0052738189697265625, 0.008475303649902344, 0.011676788330078125, 0.014878273010253906, 0.018079757690429688, 0.02128124237060547, 0.02448272705078125, 0.02768421173095703, 0.030885696411132812, 0.034087181091308594, 0.037288665771484375, 0.040490150451660156, 0.04369163513183594, 0.04689311981201172, 0.0500946044921875, 0.05329608917236328, 0.05649757385253906, 0.059699058532714844, 0.06290054321289062, 0.0661020278930664, 0.06930351257324219, 0.07250499725341797, 0.07570648193359375, 0.07890796661376953, 0.08210945129394531, 0.0853109359741211, 0.08851242065429688, 0.09171390533447266, 0.09491539001464844, 0.09811687469482422, 0.101318359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 8.0, 8.0, 8.0, 5.0, 8.0, 4.0, 12.0, 15.0, 24.0, 26.0, 12.0, 26.0, 32.0, 31.0, 35.0, 21.0, 25.0, 42.0, 42.0, 30.0, 50.0, 54.0, 49.0, 32.0, 48.0, 37.0, 35.0, 36.0, 32.0, 30.0, 21.0, 27.0, 24.0, 19.0, 14.0, 12.0, 11.0, 9.0, 16.0, 5.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.195068359375, -0.1888141632080078, -0.18255996704101562, -0.17630577087402344, -0.17005157470703125, -0.16379737854003906, -0.15754318237304688, -0.1512889862060547, -0.1450347900390625, -0.1387805938720703, -0.13252639770507812, -0.12627220153808594, -0.12001800537109375, -0.11376380920410156, -0.10750961303710938, -0.10125541687011719, -0.095001220703125, -0.08874702453613281, -0.08249282836914062, -0.07623863220214844, -0.06998443603515625, -0.06373023986816406, -0.057476043701171875, -0.05122184753417969, -0.0449676513671875, -0.03871345520019531, -0.032459259033203125, -0.026205062866210938, -0.01995086669921875, -0.013696670532226562, -0.007442474365234375, -0.0011882781982421875, 0.00506591796875, 0.011320114135742188, 0.017574310302734375, 0.023828506469726562, 0.03008270263671875, 0.03633689880371094, 0.042591094970703125, 0.04884529113769531, 0.0550994873046875, 0.06135368347167969, 0.06760787963867188, 0.07386207580566406, 0.08011627197265625, 0.08637046813964844, 0.09262466430664062, 0.09887886047363281, 0.105133056640625, 0.11138725280761719, 0.11764144897460938, 0.12389564514160156, 0.13014984130859375, 0.13640403747558594, 0.14265823364257812, 0.1489124298095703, 0.1551666259765625, 0.1614208221435547, 0.16767501831054688, 0.17392921447753906, 0.18018341064453125, 0.18643760681152344, 0.19269180297851562, 0.1989459991455078, 0.2052001953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 12.0, 20.0, 29.0, 33.0, 57.0, 79.0, 111.0, 170.0, 254.0, 424.0, 645.0, 1011.0, 1642.0, 2684.0, 4261.0, 7371.0, 14620.0, 35127.0, 116040.0, 554173.0, 213257.0, 53313.0, 19954.0, 9549.0, 5256.0, 3103.0, 1933.0, 1091.0, 797.0, 515.0, 324.0, 183.0, 155.0, 107.0, 63.0, 51.0, 31.0, 26.0, 18.0, 11.0, 12.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19921875, -0.19272804260253906, -0.18623733520507812, -0.1797466278076172, -0.17325592041015625, -0.1667652130126953, -0.16027450561523438, -0.15378379821777344, -0.1472930908203125, -0.14080238342285156, -0.13431167602539062, -0.1278209686279297, -0.12133026123046875, -0.11483955383300781, -0.10834884643554688, -0.10185813903808594, -0.095367431640625, -0.08887672424316406, -0.08238601684570312, -0.07589530944824219, -0.06940460205078125, -0.06291389465332031, -0.056423187255859375, -0.04993247985839844, -0.0434417724609375, -0.03695106506347656, -0.030460357666015625, -0.023969650268554688, -0.01747894287109375, -0.010988235473632812, -0.004497528076171875, 0.0019931793212890625, 0.00848388671875, 0.014974594116210938, 0.021465301513671875, 0.027956008911132812, 0.03444671630859375, 0.04093742370605469, 0.047428131103515625, 0.05391883850097656, 0.0604095458984375, 0.06690025329589844, 0.07339096069335938, 0.07988166809082031, 0.08637237548828125, 0.09286308288574219, 0.09935379028320312, 0.10584449768066406, 0.112335205078125, 0.11882591247558594, 0.12531661987304688, 0.1318073272705078, 0.13829803466796875, 0.1447887420654297, 0.15127944946289062, 0.15777015686035156, 0.1642608642578125, 0.17075157165527344, 0.17724227905273438, 0.1837329864501953, 0.19022369384765625, 0.1967144012451172, 0.20320510864257812, 0.20969581604003906, 0.2161865234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 19.0, 9.0, 19.0, 21.0, 27.0, 19.0, 18.0, 24.0, 31.0, 37.0, 37.0, 42.0, 33.0, 30.0, 39.0, 40.0, 31.0, 32.0, 49.0, 30.0, 30.0, 33.0, 33.0, 29.0, 31.0, 27.0, 19.0, 23.0, 19.0, 22.0, 13.0, 11.0, 17.0, 10.0, 10.0, 15.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1123046875, -0.10864448547363281, -0.10498428344726562, -0.10132408142089844, -0.09766387939453125, -0.09400367736816406, -0.09034347534179688, -0.08668327331542969, -0.0830230712890625, -0.07936286926269531, -0.07570266723632812, -0.07204246520996094, -0.06838226318359375, -0.06472206115722656, -0.061061859130859375, -0.05740165710449219, -0.053741455078125, -0.05008125305175781, -0.046421051025390625, -0.04276084899902344, -0.03910064697265625, -0.03544044494628906, -0.031780242919921875, -0.028120040893554688, -0.0244598388671875, -0.020799636840820312, -0.017139434814453125, -0.013479232788085938, -0.00981903076171875, -0.0061588287353515625, -0.002498626708984375, 0.0011615753173828125, 0.00482177734375, 0.008481979370117188, 0.012142181396484375, 0.015802383422851562, 0.01946258544921875, 0.023122787475585938, 0.026782989501953125, 0.030443191528320312, 0.0341033935546875, 0.03776359558105469, 0.041423797607421875, 0.04508399963378906, 0.04874420166015625, 0.05240440368652344, 0.056064605712890625, 0.05972480773925781, 0.063385009765625, 0.06704521179199219, 0.07070541381835938, 0.07436561584472656, 0.07802581787109375, 0.08168601989746094, 0.08534622192382812, 0.08900642395019531, 0.0926666259765625, 0.09632682800292969, 0.09998703002929688, 0.10364723205566406, 0.10730743408203125, 0.11096763610839844, 0.11462783813476562, 0.11828804016113281, 0.1219482421875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 11.0, 6.0, 14.0, 27.0, 30.0, 45.0, 59.0, 81.0, 107.0, 157.0, 210.0, 292.0, 442.0, 590.0, 882.0, 1366.0, 2116.0, 3660.0, 6859.0, 14435.0, 38052.0, 205499.0, 658569.0, 71717.0, 21062.0, 9150.0, 4895.0, 2807.0, 1827.0, 1152.0, 754.0, 484.0, 372.0, 222.0, 152.0, 100.0, 88.0, 69.0, 49.0, 30.0, 33.0, 19.0, 15.0, 3.0, 8.0, 8.0, 2.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01264190673828125, -0.01222372055053711, -0.011805534362792969, -0.011387348175048828, -0.010969161987304688, -0.010550975799560547, -0.010132789611816406, -0.009714603424072266, -0.009296417236328125, -0.008878231048583984, -0.008460044860839844, -0.008041858673095703, -0.0076236724853515625, -0.007205486297607422, -0.006787300109863281, -0.006369113922119141, -0.005950927734375, -0.005532741546630859, -0.005114555358886719, -0.004696369171142578, -0.0042781829833984375, -0.003859996795654297, -0.0034418106079101562, -0.0030236244201660156, -0.002605438232421875, -0.0021872520446777344, -0.0017690658569335938, -0.0013508796691894531, -0.0009326934814453125, -0.0005145072937011719, -9.632110595703125e-05, 0.0003218650817871094, 0.00074005126953125, 0.0011582374572753906, 0.0015764236450195312, 0.001994609832763672, 0.0024127960205078125, 0.002830982208251953, 0.0032491683959960938, 0.0036673545837402344, 0.004085540771484375, 0.004503726959228516, 0.004921913146972656, 0.005340099334716797, 0.0057582855224609375, 0.006176471710205078, 0.006594657897949219, 0.007012844085693359, 0.0074310302734375, 0.00784921646118164, 0.008267402648925781, 0.008685588836669922, 0.009103775024414062, 0.009521961212158203, 0.009940147399902344, 0.010358333587646484, 0.010776519775390625, 0.011194705963134766, 0.011612892150878906, 0.012031078338623047, 0.012449264526367188, 0.012867450714111328, 0.013285636901855469, 0.01370382308959961, 0.01412200927734375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 3.0, 11.0, 0.0, 10.0, 13.0, 13.0, 22.0, 0.0, 20.0, 26.0, 36.0, 0.0, 57.0, 67.0, 76.0, 93.0, 0.0, 87.0, 111.0, 80.0, 0.0, 63.0, 46.0, 40.0, 23.0, 0.0, 21.0, 19.0, 10.0, 8.0, 0.0, 4.0, 13.0, 7.0, 0.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3113021850585938e-06, -1.2647360563278198e-06, -1.218169927597046e-06, -1.171603798866272e-06, -1.125037670135498e-06, -1.0784715414047241e-06, -1.0319054126739502e-06, -9.853392839431763e-07, -9.387731552124023e-07, -8.922070264816284e-07, -8.456408977508545e-07, -7.990747690200806e-07, -7.525086402893066e-07, -7.059425115585327e-07, -6.593763828277588e-07, -6.128102540969849e-07, -5.662441253662109e-07, -5.19677996635437e-07, -4.731118679046631e-07, -4.2654573917388916e-07, -3.7997961044311523e-07, -3.334134817123413e-07, -2.868473529815674e-07, -2.4028122425079346e-07, -1.9371509552001953e-07, -1.471489667892456e-07, -1.0058283805847168e-07, -5.4016709327697754e-08, -7.450580596923828e-09, 3.91155481338501e-08, 8.568167686462402e-08, 1.3224780559539795e-07, 1.7881393432617188e-07, 2.253800630569458e-07, 2.7194619178771973e-07, 3.1851232051849365e-07, 3.650784492492676e-07, 4.116445779800415e-07, 4.5821070671081543e-07, 5.047768354415894e-07, 5.513429641723633e-07, 5.979090929031372e-07, 6.444752216339111e-07, 6.910413503646851e-07, 7.37607479095459e-07, 7.841736078262329e-07, 8.307397365570068e-07, 8.773058652877808e-07, 9.238719940185547e-07, 9.704381227493286e-07, 1.0170042514801025e-06, 1.0635703802108765e-06, 1.1101365089416504e-06, 1.1567026376724243e-06, 1.2032687664031982e-06, 1.2498348951339722e-06, 1.296401023864746e-06, 1.34296715259552e-06, 1.389533281326294e-06, 1.4360994100570679e-06, 1.4826655387878418e-06, 1.5292316675186157e-06, 1.5757977962493896e-06, 1.6223639249801636e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 12.0, 18.0, 32.0, 31.0, 59.0, 74.0, 89.0, 171.0, 206.0, 347.0, 450.0, 669.0, 892.0, 1436.0, 2101.0, 3330.0, 5088.0, 8627.0, 14683.0, 26843.0, 56767.0, 147458.0, 462323.0, 180236.0, 64559.0, 30314.0, 16210.0, 9329.0, 5567.0, 3553.0, 2295.0, 1519.0, 1004.0, 700.0, 485.0, 293.0, 193.0, 163.0, 135.0, 87.0, 55.0, 35.0, 28.0, 27.0, 19.0, 11.0, 9.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.01110076904296875, -0.010760068893432617, -0.010419368743896484, -0.010078668594360352, -0.009737968444824219, -0.009397268295288086, -0.009056568145751953, -0.00871586799621582, -0.008375167846679688, -0.008034467697143555, -0.007693767547607422, -0.007353067398071289, -0.007012367248535156, -0.0066716670989990234, -0.006330966949462891, -0.005990266799926758, -0.005649566650390625, -0.005308866500854492, -0.004968166351318359, -0.0046274662017822266, -0.004286766052246094, -0.003946065902709961, -0.003605365753173828, -0.0032646656036376953, -0.0029239654541015625, -0.0025832653045654297, -0.002242565155029297, -0.001901865005493164, -0.0015611648559570312, -0.0012204647064208984, -0.0008797645568847656, -0.0005390644073486328, -0.0001983642578125, 0.0001423358917236328, 0.0004830360412597656, 0.0008237361907958984, 0.0011644363403320312, 0.001505136489868164, 0.0018458366394042969, 0.0021865367889404297, 0.0025272369384765625, 0.0028679370880126953, 0.003208637237548828, 0.003549337387084961, 0.0038900375366210938, 0.0042307376861572266, 0.004571437835693359, 0.004912137985229492, 0.005252838134765625, 0.005593538284301758, 0.005934238433837891, 0.0062749385833740234, 0.006615638732910156, 0.006956338882446289, 0.007297039031982422, 0.007637739181518555, 0.007978439331054688, 0.00831913948059082, 0.008659839630126953, 0.009000539779663086, 0.009341239929199219, 0.009681940078735352, 0.010022640228271484, 0.010363340377807617, 0.01070404052734375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 6.0, 8.0, 7.0, 8.0, 9.0, 13.0, 14.0, 13.0, 26.0, 29.0, 34.0, 34.0, 51.0, 63.0, 95.0, 154.0, 103.0, 63.0, 47.0, 46.0, 44.0, 28.0, 19.0, 24.0, 7.0, 13.0, 13.0, 6.0, 6.0, 7.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0035858154296875, -0.0034759044647216797, -0.0033659934997558594, -0.003256082534790039, -0.0031461715698242188, -0.0030362606048583984, -0.002926349639892578, -0.002816438674926758, -0.0027065277099609375, -0.002596616744995117, -0.002486705780029297, -0.0023767948150634766, -0.0022668838500976562, -0.002156972885131836, -0.0020470619201660156, -0.0019371509552001953, -0.001827239990234375, -0.0017173290252685547, -0.0016074180603027344, -0.001497507095336914, -0.0013875961303710938, -0.0012776851654052734, -0.0011677742004394531, -0.0010578632354736328, -0.0009479522705078125, -0.0008380413055419922, -0.0007281303405761719, -0.0006182193756103516, -0.0005083084106445312, -0.00039839744567871094, -0.0002884864807128906, -0.0001785755157470703, -6.866455078125e-05, 4.124641418457031e-05, 0.00015115737915039062, 0.00026106834411621094, 0.00037097930908203125, 0.00048089027404785156, 0.0005908012390136719, 0.0007007122039794922, 0.0008106231689453125, 0.0009205341339111328, 0.0010304450988769531, 0.0011403560638427734, 0.0012502670288085938, 0.001360177993774414, 0.0014700889587402344, 0.0015799999237060547, 0.001689910888671875, 0.0017998218536376953, 0.0019097328186035156, 0.002019643783569336, 0.0021295547485351562, 0.0022394657135009766, 0.002349376678466797, 0.002459287643432617, 0.0025691986083984375, 0.002679109573364258, 0.002789020538330078, 0.0028989315032958984, 0.0030088424682617188, 0.003118753433227539, 0.0032286643981933594, 0.0033385753631591797, 0.003448486328125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 8.0, 9.0, 10.0, 15.0, 24.0, 21.0, 25.0, 34.0, 60.0, 62.0, 67.0, 83.0, 109.0, 95.0, 66.0, 60.0, 46.0, 43.0, 31.0, 26.0, 21.0, 10.0, 10.0, 8.0, 13.0, 6.0, 7.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.25644850730895996, -0.24750417470932007, -0.23855982720851898, -0.2296154946088791, -0.220671147108078, -0.2117268145084381, -0.20278248190879822, -0.19383814930915833, -0.18489380180835724, -0.17594946920871735, -0.16700512170791626, -0.15806078910827637, -0.14911645650863647, -0.1401721090078354, -0.1312277764081955, -0.122283436357975, -0.11333909630775452, -0.10439475625753403, -0.09545041620731354, -0.08650608360767365, -0.07756174355745316, -0.06861740350723267, -0.059673067182302475, -0.050728730857372284, -0.041784390807151794, -0.032840050756931305, -0.023895714432001114, -0.014951376244425774, -0.006007038056850433, 0.002937301993370056, 0.011881638318300247, 0.020825974643230438, 0.02977028489112854, 0.03871462494134903, 0.04765896126627922, 0.05660329759120941, 0.0655476376414299, 0.07449197769165039, 0.08343631029129028, 0.09238065034151077, 0.10132499039173126, 0.11026933044195175, 0.11921367049217224, 0.12815800309181213, 0.13710233569145203, 0.1460466831922531, 0.154991015791893, 0.1639353632926941, 0.17287969589233398, 0.18182402849197388, 0.19076837599277496, 0.19971270859241486, 0.20865705609321594, 0.21760138869285583, 0.22654572129249573, 0.23549005389213562, 0.2444344013929367, 0.2533787488937378, 0.2623230814933777, 0.2712674140930176, 0.28021174669265747, 0.28915607929229736, 0.29810044169425964, 0.30704477429389954, 0.31598910689353943]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 6.0, 9.0, 6.0, 6.0, 9.0, 10.0, 11.0, 11.0, 26.0, 26.0, 16.0, 28.0, 26.0, 24.0, 31.0, 34.0, 31.0, 38.0, 41.0, 33.0, 39.0, 48.0, 44.0, 36.0, 45.0, 37.0, 36.0, 33.0, 29.0, 31.0, 26.0, 25.0, 22.0, 23.0, 19.0, 15.0, 11.0, 8.0, 10.0, 10.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.17870250344276428, -0.17279301583766937, -0.16688351333141327, -0.16097402572631836, -0.15506453812122345, -0.14915505051612854, -0.14324554800987244, -0.13733606040477753, -0.13142657279968262, -0.1255170851945877, -0.1196075901389122, -0.1136980950832367, -0.10778860747814178, -0.10187911242246628, -0.09596961736679077, -0.09006012976169586, -0.08415062725543976, -0.07824113219976425, -0.07233164459466934, -0.06642214953899384, -0.06051265820860863, -0.05460316687822342, -0.04869367182254791, -0.042784180492162704, -0.036874689161777496, -0.030965197831392288, -0.02505570463836193, -0.019146211445331573, -0.013236720114946365, -0.007327228784561157, -0.0014177337288856506, 0.0044917576014995575, 0.010401248931884766, 0.016310740262269974, 0.02222023345530033, 0.02812972664833069, 0.0340392179787159, 0.039948709309101105, 0.04585820436477661, 0.05176769569516182, 0.05767718702554703, 0.06358668208122253, 0.06949616968631744, 0.07540566474199295, 0.08131515979766846, 0.08722464740276337, 0.09313414245843887, 0.09904363751411438, 0.10495312511920929, 0.1108626201748848, 0.1167721077799797, 0.12268160283565521, 0.12859109044075012, 0.13450059294700623, 0.14041008055210114, 0.14631956815719604, 0.15222907066345215, 0.15813855826854706, 0.16404806077480316, 0.16995754837989807, 0.17586703598499298, 0.1817765235900879, 0.187686026096344, 0.1935955137014389, 0.1995050013065338]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 9.0, 15.0, 16.0, 32.0, 41.0, 76.0, 97.0, 194.0, 302.0, 462.0, 805.0, 1195.0, 1902.0, 3264.0, 5415.0, 9061.0, 15462.0, 27477.0, 50441.0, 95087.0, 197395.0, 309848.0, 154951.0, 77434.0, 41861.0, 23169.0, 13066.0, 7716.0, 4512.0, 2802.0, 1661.0, 1035.0, 643.0, 394.0, 250.0, 166.0, 118.0, 58.0, 42.0, 31.0, 19.0, 13.0, 9.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.486083984375, -0.4723320007324219, -0.45858001708984375, -0.4448280334472656, -0.4310760498046875, -0.4173240661621094, -0.40357208251953125, -0.3898200988769531, -0.376068115234375, -0.3623161315917969, -0.34856414794921875, -0.3348121643066406, -0.3210601806640625, -0.3073081970214844, -0.29355621337890625, -0.2798042297363281, -0.26605224609375, -0.2523002624511719, -0.23854827880859375, -0.22479629516601562, -0.2110443115234375, -0.19729232788085938, -0.18354034423828125, -0.16978836059570312, -0.156036376953125, -0.14228439331054688, -0.12853240966796875, -0.11478042602539062, -0.1010284423828125, -0.08727645874023438, -0.07352447509765625, -0.059772491455078125, -0.0460205078125, -0.032268524169921875, -0.01851654052734375, -0.004764556884765625, 0.0089874267578125, 0.022739410400390625, 0.03649139404296875, 0.050243377685546875, 0.063995361328125, 0.07774734497070312, 0.09149932861328125, 0.10525131225585938, 0.1190032958984375, 0.13275527954101562, 0.14650726318359375, 0.16025924682617188, 0.17401123046875, 0.18776321411132812, 0.20151519775390625, 0.21526718139648438, 0.2290191650390625, 0.24277114868164062, 0.25652313232421875, 0.2702751159667969, 0.284027099609375, 0.2977790832519531, 0.31153106689453125, 0.3252830505371094, 0.3390350341796875, 0.3527870178222656, 0.36653900146484375, 0.3802909851074219, 0.39404296875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 6.0, 8.0, 7.0, 14.0, 16.0, 18.0, 16.0, 25.0, 27.0, 30.0, 35.0, 23.0, 34.0, 47.0, 43.0, 46.0, 25.0, 39.0, 50.0, 56.0, 38.0, 33.0, 45.0, 35.0, 44.0, 32.0, 26.0, 24.0, 26.0, 23.0, 18.0, 17.0, 8.0, 16.0, 8.0, 5.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171875, -0.16617774963378906, -0.16048049926757812, -0.1547832489013672, -0.14908599853515625, -0.1433887481689453, -0.13769149780273438, -0.13199424743652344, -0.1262969970703125, -0.12059974670410156, -0.11490249633789062, -0.10920524597167969, -0.10350799560546875, -0.09781074523925781, -0.09211349487304688, -0.08641624450683594, -0.080718994140625, -0.07502174377441406, -0.06932449340820312, -0.06362724304199219, -0.05792999267578125, -0.05223274230957031, -0.046535491943359375, -0.04083824157714844, -0.0351409912109375, -0.029443740844726562, -0.023746490478515625, -0.018049240112304688, -0.01235198974609375, -0.0066547393798828125, -0.000957489013671875, 0.0047397613525390625, 0.01043701171875, 0.016134262084960938, 0.021831512451171875, 0.027528762817382812, 0.03322601318359375, 0.03892326354980469, 0.044620513916015625, 0.05031776428222656, 0.0560150146484375, 0.06171226501464844, 0.06740951538085938, 0.07310676574707031, 0.07880401611328125, 0.08450126647949219, 0.09019851684570312, 0.09589576721191406, 0.101593017578125, 0.10729026794433594, 0.11298751831054688, 0.11868476867675781, 0.12438201904296875, 0.1300792694091797, 0.13577651977539062, 0.14147377014160156, 0.1471710205078125, 0.15286827087402344, 0.15856552124023438, 0.1642627716064453, 0.16996002197265625, 0.1756572723388672, 0.18135452270507812, 0.18705177307128906, 0.1927490234375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 2.0, 6.0, 14.0, 13.0, 19.0, 37.0, 56.0, 72.0, 102.0, 152.0, 239.0, 351.0, 482.0, 778.0, 1133.0, 1694.0, 2541.0, 3741.0, 5730.0, 8848.0, 13538.0, 20961.0, 33553.0, 54898.0, 94006.0, 175073.0, 264356.0, 150041.0, 82668.0, 48709.0, 29843.0, 18967.0, 12236.0, 7888.0, 5331.0, 3551.0, 2324.0, 1505.0, 1013.0, 699.0, 421.0, 301.0, 198.0, 156.0, 97.0, 76.0, 46.0, 32.0, 22.0, 10.0, 10.0, 12.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.353515625, -0.342926025390625, -0.33233642578125, -0.321746826171875, -0.3111572265625, -0.300567626953125, -0.28997802734375, -0.279388427734375, -0.268798828125, -0.258209228515625, -0.24761962890625, -0.237030029296875, -0.2264404296875, -0.215850830078125, -0.20526123046875, -0.194671630859375, -0.18408203125, -0.173492431640625, -0.16290283203125, -0.152313232421875, -0.1417236328125, -0.131134033203125, -0.12054443359375, -0.109954833984375, -0.099365234375, -0.088775634765625, -0.07818603515625, -0.067596435546875, -0.0570068359375, -0.046417236328125, -0.03582763671875, -0.025238037109375, -0.0146484375, -0.004058837890625, 0.00653076171875, 0.017120361328125, 0.0277099609375, 0.038299560546875, 0.04888916015625, 0.059478759765625, 0.070068359375, 0.080657958984375, 0.09124755859375, 0.101837158203125, 0.1124267578125, 0.123016357421875, 0.13360595703125, 0.144195556640625, 0.15478515625, 0.165374755859375, 0.17596435546875, 0.186553955078125, 0.1971435546875, 0.207733154296875, 0.21832275390625, 0.228912353515625, 0.239501953125, 0.250091552734375, 0.26068115234375, 0.271270751953125, 0.2818603515625, 0.292449951171875, 0.30303955078125, 0.313629150390625, 0.32421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 7.0, 7.0, 18.0, 13.0, 16.0, 15.0, 17.0, 22.0, 25.0, 22.0, 35.0, 40.0, 35.0, 34.0, 35.0, 40.0, 34.0, 33.0, 38.0, 37.0, 42.0, 27.0, 36.0, 41.0, 32.0, 30.0, 36.0, 23.0, 24.0, 26.0, 22.0, 26.0, 8.0, 14.0, 9.0, 7.0, 9.0, 7.0, 5.0, 8.0, 3.0, 2.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.10430908203125, -0.10111808776855469, -0.09792709350585938, -0.09473609924316406, -0.09154510498046875, -0.08835411071777344, -0.08516311645507812, -0.08197212219238281, -0.0787811279296875, -0.07559013366699219, -0.07239913940429688, -0.06920814514160156, -0.06601715087890625, -0.06282615661621094, -0.059635162353515625, -0.05644416809082031, -0.053253173828125, -0.05006217956542969, -0.046871185302734375, -0.04368019104003906, -0.04048919677734375, -0.03729820251464844, -0.034107208251953125, -0.030916213989257812, -0.0277252197265625, -0.024534225463867188, -0.021343231201171875, -0.018152236938476562, -0.01496124267578125, -0.011770248413085938, -0.008579254150390625, -0.0053882598876953125, -0.002197265625, 0.0009937286376953125, 0.004184722900390625, 0.0073757171630859375, 0.01056671142578125, 0.013757705688476562, 0.016948699951171875, 0.020139694213867188, 0.0233306884765625, 0.026521682739257812, 0.029712677001953125, 0.03290367126464844, 0.03609466552734375, 0.03928565979003906, 0.042476654052734375, 0.04566764831542969, 0.048858642578125, 0.05204963684082031, 0.055240631103515625, 0.05843162536621094, 0.06162261962890625, 0.06481361389160156, 0.06800460815429688, 0.07119560241699219, 0.0743865966796875, 0.07757759094238281, 0.08076858520507812, 0.08395957946777344, 0.08715057373046875, 0.09034156799316406, 0.09353256225585938, 0.09672355651855469, 0.09991455078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 9.0, 14.0, 14.0, 27.0, 34.0, 53.0, 70.0, 90.0, 151.0, 222.0, 299.0, 473.0, 769.0, 1172.0, 1771.0, 2744.0, 4374.0, 7097.0, 12541.0, 24299.0, 75115.0, 791979.0, 70319.0, 24001.0, 11894.0, 6956.0, 4183.0, 2766.0, 1794.0, 1090.0, 709.0, 510.0, 332.0, 222.0, 143.0, 92.0, 75.0, 41.0, 37.0, 22.0, 9.0, 13.0, 9.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03497314453125, -0.033786773681640625, -0.03260040283203125, -0.031414031982421875, -0.0302276611328125, -0.029041290283203125, -0.02785491943359375, -0.026668548583984375, -0.025482177734375, -0.024295806884765625, -0.02310943603515625, -0.021923065185546875, -0.0207366943359375, -0.019550323486328125, -0.01836395263671875, -0.017177581787109375, -0.0159912109375, -0.014804840087890625, -0.01361846923828125, -0.012432098388671875, -0.0112457275390625, -0.010059356689453125, -0.00887298583984375, -0.007686614990234375, -0.006500244140625, -0.005313873291015625, -0.00412750244140625, -0.002941131591796875, -0.0017547607421875, -0.000568389892578125, 0.00061798095703125, 0.001804351806640625, 0.00299072265625, 0.004177093505859375, 0.00536346435546875, 0.006549835205078125, 0.0077362060546875, 0.008922576904296875, 0.01010894775390625, 0.011295318603515625, 0.012481689453125, 0.013668060302734375, 0.01485443115234375, 0.016040802001953125, 0.0172271728515625, 0.018413543701171875, 0.01959991455078125, 0.020786285400390625, 0.02197265625, 0.023159027099609375, 0.02434539794921875, 0.025531768798828125, 0.0267181396484375, 0.027904510498046875, 0.02909088134765625, 0.030277252197265625, 0.031463623046875, 0.032649993896484375, 0.03383636474609375, 0.035022735595703125, 0.0362091064453125, 0.037395477294921875, 0.03858184814453125, 0.039768218994140625, 0.04095458984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 10.0, 13.0, 30.0, 43.0, 52.0, 83.0, 83.0, 107.0, 94.0, 100.0, 98.0, 60.0, 41.0, 42.0, 35.0, 18.0, 14.0, 9.0, 11.0, 7.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.3245811462402344e-06, -2.2640451788902283e-06, -2.203509211540222e-06, -2.142973244190216e-06, -2.08243727684021e-06, -2.021901309490204e-06, -1.9613653421401978e-06, -1.9008293747901917e-06, -1.8402934074401855e-06, -1.7797574400901794e-06, -1.7192214727401733e-06, -1.6586855053901672e-06, -1.5981495380401611e-06, -1.537613570690155e-06, -1.477077603340149e-06, -1.4165416359901428e-06, -1.3560056686401367e-06, -1.2954697012901306e-06, -1.2349337339401245e-06, -1.1743977665901184e-06, -1.1138617992401123e-06, -1.0533258318901062e-06, -9.927898645401e-07, -9.32253897190094e-07, -8.717179298400879e-07, -8.111819624900818e-07, -7.506459951400757e-07, -6.901100277900696e-07, -6.295740604400635e-07, -5.690380930900574e-07, -5.085021257400513e-07, -4.4796615839004517e-07, -3.8743019104003906e-07, -3.2689422369003296e-07, -2.6635825634002686e-07, -2.0582228899002075e-07, -1.4528632164001465e-07, -8.475035429000854e-08, -2.421438694000244e-08, 3.632158041000366e-08, 9.685754776000977e-08, 1.5739351511001587e-07, 2.1792948246002197e-07, 2.784654498100281e-07, 3.390014171600342e-07, 3.995373845100403e-07, 4.600733518600464e-07, 5.206093192100525e-07, 5.811452865600586e-07, 6.416812539100647e-07, 7.022172212600708e-07, 7.627531886100769e-07, 8.23289155960083e-07, 8.838251233100891e-07, 9.443610906600952e-07, 1.0048970580101013e-06, 1.0654330253601074e-06, 1.1259689927101135e-06, 1.1865049600601196e-06, 1.2470409274101257e-06, 1.3075768947601318e-06, 1.368112862110138e-06, 1.428648829460144e-06, 1.4891847968101501e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 10.0, 12.0, 15.0, 31.0, 37.0, 59.0, 77.0, 127.0, 171.0, 259.0, 342.0, 491.0, 749.0, 1062.0, 1648.0, 2420.0, 3836.0, 6522.0, 12297.0, 27174.0, 111428.0, 790013.0, 47951.0, 18217.0, 9181.0, 5120.0, 3132.0, 2015.0, 1342.0, 818.0, 583.0, 432.0, 300.0, 190.0, 143.0, 105.0, 70.0, 46.0, 39.0, 17.0, 17.0, 12.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.03875732421875, -0.03743314743041992, -0.036108970642089844, -0.034784793853759766, -0.03346061706542969, -0.03213644027709961, -0.03081226348876953, -0.029488086700439453, -0.028163909912109375, -0.026839733123779297, -0.02551555633544922, -0.02419137954711914, -0.022867202758789062, -0.021543025970458984, -0.020218849182128906, -0.018894672393798828, -0.01757049560546875, -0.016246318817138672, -0.014922142028808594, -0.013597965240478516, -0.012273788452148438, -0.01094961166381836, -0.009625434875488281, -0.008301258087158203, -0.006977081298828125, -0.005652904510498047, -0.004328727722167969, -0.0030045509338378906, -0.0016803741455078125, -0.0003561973571777344, 0.0009679794311523438, 0.002292156219482422, 0.0036163330078125, 0.004940509796142578, 0.006264686584472656, 0.007588863372802734, 0.008913040161132812, 0.01023721694946289, 0.011561393737792969, 0.012885570526123047, 0.014209747314453125, 0.015533924102783203, 0.01685810089111328, 0.01818227767944336, 0.019506454467773438, 0.020830631256103516, 0.022154808044433594, 0.023478984832763672, 0.02480316162109375, 0.026127338409423828, 0.027451515197753906, 0.028775691986083984, 0.030099868774414062, 0.03142404556274414, 0.03274822235107422, 0.0340723991394043, 0.035396575927734375, 0.03672075271606445, 0.03804492950439453, 0.03936910629272461, 0.04069328308105469, 0.042017459869384766, 0.043341636657714844, 0.04466581344604492, 0.045989990234375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 3.0, 3.0, 6.0, 5.0, 10.0, 15.0, 18.0, 16.0, 20.0, 48.0, 191.0, 418.0, 76.0, 29.0, 21.0, 16.0, 14.0, 11.0, 13.0, 9.0, 9.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0112152099609375, -0.01088714599609375, -0.01055908203125, -0.01023101806640625, -0.0099029541015625, -0.00957489013671875, -0.009246826171875, -0.00891876220703125, -0.0085906982421875, -0.00826263427734375, -0.0079345703125, -0.00760650634765625, -0.0072784423828125, -0.00695037841796875, -0.006622314453125, -0.00629425048828125, -0.0059661865234375, -0.00563812255859375, -0.00531005859375, -0.00498199462890625, -0.0046539306640625, -0.00432586669921875, -0.003997802734375, -0.00366973876953125, -0.0033416748046875, -0.00301361083984375, -0.002685546875, -0.00235748291015625, -0.0020294189453125, -0.00170135498046875, -0.001373291015625, -0.00104522705078125, -0.0007171630859375, -0.00038909912109375, -6.103515625e-05, 0.00026702880859375, 0.0005950927734375, 0.00092315673828125, 0.001251220703125, 0.00157928466796875, 0.0019073486328125, 0.00223541259765625, 0.0025634765625, 0.00289154052734375, 0.0032196044921875, 0.00354766845703125, 0.003875732421875, 0.00420379638671875, 0.0045318603515625, 0.00485992431640625, 0.00518798828125, 0.00551605224609375, 0.0058441162109375, 0.00617218017578125, 0.006500244140625, 0.00682830810546875, 0.0071563720703125, 0.00748443603515625, 0.0078125, 0.00814056396484375, 0.0084686279296875, 0.00879669189453125, 0.009124755859375, 0.00945281982421875, 0.0097808837890625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 12.0, 13.0, 16.0, 16.0, 26.0, 29.0, 33.0, 36.0, 42.0, 73.0, 83.0, 110.0, 95.0, 70.0, 60.0, 50.0, 44.0, 26.0, 24.0, 25.0, 11.0, 16.0, 12.0, 11.0, 7.0, 12.0, 9.0, 7.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.21030063927173615, -0.20282134413719177, -0.1953420490026474, -0.18786275386810303, -0.18038344383239746, -0.17290416359901428, -0.16542485356330872, -0.15794555842876434, -0.15046626329421997, -0.1429869681596756, -0.13550767302513123, -0.12802837789058685, -0.12054907530546188, -0.11306978017091751, -0.10559047758579254, -0.09811118245124817, -0.0906318873167038, -0.08315259218215942, -0.07567329704761505, -0.06819399446249008, -0.06071469932794571, -0.05323540419340134, -0.045756105333566666, -0.038276806473731995, -0.030797511339187622, -0.0233182143419981, -0.01583891734480858, -0.008359620347619057, -0.0008803233504295349, 0.006598971784114838, 0.014078270643949509, 0.02155756950378418, 0.029036879539489746, 0.03651617467403412, 0.04399547353386879, 0.05147477239370346, 0.05895406752824783, 0.0664333626627922, 0.07391266524791718, 0.08139196038246155, 0.08887125551700592, 0.09635055065155029, 0.10382984578609467, 0.11130914837121964, 0.11878844350576401, 0.12626773118972778, 0.13374704122543335, 0.14122633635997772, 0.1487056314945221, 0.15618492662906647, 0.16366422176361084, 0.1711435168981552, 0.17862281203269958, 0.18610212206840515, 0.19358141720294952, 0.2010607123374939, 0.20854000747203827, 0.21601930260658264, 0.22349859774112701, 0.2309778928756714, 0.23845720291137695, 0.24593648314476013, 0.2534157931804657, 0.2608950734138489, 0.26837438344955444]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 10.0, 7.0, 21.0, 14.0, 15.0, 15.0, 20.0, 21.0, 19.0, 20.0, 28.0, 26.0, 30.0, 39.0, 24.0, 37.0, 40.0, 33.0, 33.0, 42.0, 58.0, 34.0, 39.0, 37.0, 43.0, 29.0, 33.0, 28.0, 38.0, 25.0, 23.0, 17.0, 15.0, 20.0, 12.0, 8.0, 6.0, 8.0, 8.0, 5.0, 1.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16520121693611145, -0.15962985157966614, -0.15405847132205963, -0.14848710596561432, -0.1429157257080078, -0.1373443603515625, -0.131772980093956, -0.12620161473751068, -0.12063023447990417, -0.11505886167287827, -0.10948748886585236, -0.10391611605882645, -0.09834474325180054, -0.09277337044477463, -0.08720199763774872, -0.0816306322813034, -0.0760592594742775, -0.07048788666725159, -0.06491651386022568, -0.05934514105319977, -0.05377376824617386, -0.04820239543914795, -0.04263102635741234, -0.03705965355038643, -0.03148828074336052, -0.02591690793633461, -0.0203455351293087, -0.01477416418492794, -0.009202791377902031, -0.0036314185708761215, 0.0019399523735046387, 0.007511325180530548, 0.013082697987556458, 0.018654070794582367, 0.024225443601608276, 0.029796814545989037, 0.035368189215660095, 0.040939562022686005, 0.046510931104421616, 0.052082303911447525, 0.057653676718473434, 0.06322504580020905, 0.06879641860723495, 0.07436779141426086, 0.07993916422128677, 0.08551053702831268, 0.09108190983533859, 0.0966532826423645, 0.10222465544939041, 0.10779602825641632, 0.11336740106344223, 0.11893877387046814, 0.12451014667749405, 0.13008151948451996, 0.13565288484096527, 0.14122426509857178, 0.1467956304550171, 0.1523669958114624, 0.1579383760690689, 0.16350974142551422, 0.16908112168312073, 0.17465248703956604, 0.18022386729717255, 0.18579523265361786, 0.19136661291122437]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 14.0, 14.0, 20.0, 30.0, 44.0, 52.0, 88.0, 128.0, 192.0, 291.0, 461.0, 704.0, 1047.0, 1824.0, 2908.0, 4440.0, 7709.0, 12268.0, 20682.0, 35159.0, 63400.0, 119891.0, 258158.0, 924092.0, 1820082.0, 519056.0, 186088.0, 91212.0, 49929.0, 28322.0, 17177.0, 10413.0, 6638.0, 4138.0, 2679.0, 1777.0, 1099.0, 704.0, 458.0, 314.0, 215.0, 119.0, 79.0, 60.0, 35.0, 25.0, 14.0, 15.0, 8.0, 4.0, 3.0, 1.0], "bins": [-0.2919921875, -0.2839488983154297, -0.2759056091308594, -0.26786231994628906, -0.25981903076171875, -0.25177574157714844, -0.24373245239257812, -0.2356891632080078, -0.2276458740234375, -0.2196025848388672, -0.21155929565429688, -0.20351600646972656, -0.19547271728515625, -0.18742942810058594, -0.17938613891601562, -0.1713428497314453, -0.163299560546875, -0.1552562713623047, -0.14721298217773438, -0.13916969299316406, -0.13112640380859375, -0.12308311462402344, -0.11503982543945312, -0.10699653625488281, -0.0989532470703125, -0.09090995788574219, -0.08286666870117188, -0.07482337951660156, -0.06678009033203125, -0.05873680114746094, -0.050693511962890625, -0.04265022277832031, -0.03460693359375, -0.026563644409179688, -0.018520355224609375, -0.010477066040039062, -0.00243377685546875, 0.0056095123291015625, 0.013652801513671875, 0.021696090698242188, 0.0297393798828125, 0.03778266906738281, 0.045825958251953125, 0.05386924743652344, 0.06191253662109375, 0.06995582580566406, 0.07799911499023438, 0.08604240417480469, 0.094085693359375, 0.10212898254394531, 0.11017227172851562, 0.11821556091308594, 0.12625885009765625, 0.13430213928222656, 0.14234542846679688, 0.1503887176513672, 0.1584320068359375, 0.1664752960205078, 0.17451858520507812, 0.18256187438964844, 0.19060516357421875, 0.19864845275878906, 0.20669174194335938, 0.2147350311279297, 0.2227783203125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 9.0, 10.0, 16.0, 11.0, 15.0, 17.0, 10.0, 16.0, 33.0, 21.0, 31.0, 19.0, 38.0, 23.0, 37.0, 29.0, 45.0, 32.0, 50.0, 46.0, 47.0, 41.0, 37.0, 37.0, 44.0, 22.0, 38.0, 20.0, 30.0, 26.0, 22.0, 29.0, 23.0, 11.0, 13.0, 8.0, 6.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.09662437438964844, -0.09333419799804688, -0.09004402160644531, -0.08675384521484375, -0.08346366882324219, -0.08017349243164062, -0.07688331604003906, -0.0735931396484375, -0.07030296325683594, -0.06701278686523438, -0.06372261047363281, -0.06043243408203125, -0.05714225769042969, -0.053852081298828125, -0.05056190490722656, -0.047271728515625, -0.04398155212402344, -0.040691375732421875, -0.03740119934082031, -0.03411102294921875, -0.030820846557617188, -0.027530670166015625, -0.024240493774414062, -0.0209503173828125, -0.017660140991210938, -0.014369964599609375, -0.011079788208007812, -0.00778961181640625, -0.0044994354248046875, -0.001209259033203125, 0.0020809173583984375, 0.00537109375, 0.008661270141601562, 0.011951446533203125, 0.015241622924804688, 0.01853179931640625, 0.021821975708007812, 0.025112152099609375, 0.028402328491210938, 0.0316925048828125, 0.03498268127441406, 0.038272857666015625, 0.04156303405761719, 0.04485321044921875, 0.04814338684082031, 0.051433563232421875, 0.05472373962402344, 0.058013916015625, 0.06130409240722656, 0.06459426879882812, 0.06788444519042969, 0.07117462158203125, 0.07446479797363281, 0.07775497436523438, 0.08104515075683594, 0.0843353271484375, 0.08762550354003906, 0.09091567993164062, 0.09420585632324219, 0.09749603271484375, 0.10078620910644531, 0.10407638549804688, 0.10736656188964844, 0.11065673828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 3.0, 6.0, 8.0, 18.0, 30.0, 36.0, 50.0, 70.0, 123.0, 165.0, 226.0, 375.0, 493.0, 721.0, 1124.0, 1635.0, 2436.0, 3841.0, 5855.0, 9025.0, 14116.0, 22492.0, 35978.0, 59552.0, 101015.0, 181951.0, 356384.0, 834348.0, 1367530.0, 573243.0, 267659.0, 142767.0, 80928.0, 48271.0, 29373.0, 18603.0, 11785.0, 7522.0, 4809.0, 3200.0, 2168.0, 1422.0, 903.0, 662.0, 438.0, 319.0, 192.0, 130.0, 91.0, 58.0, 52.0, 29.0, 20.0, 13.0, 11.0, 3.0, 7.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.1602783203125, -0.15515708923339844, -0.15003585815429688, -0.1449146270751953, -0.13979339599609375, -0.1346721649169922, -0.12955093383789062, -0.12442970275878906, -0.1193084716796875, -0.11418724060058594, -0.10906600952148438, -0.10394477844238281, -0.09882354736328125, -0.09370231628417969, -0.08858108520507812, -0.08345985412597656, -0.078338623046875, -0.07321739196777344, -0.06809616088867188, -0.06297492980957031, -0.05785369873046875, -0.05273246765136719, -0.047611236572265625, -0.04249000549316406, -0.0373687744140625, -0.03224754333496094, -0.027126312255859375, -0.022005081176757812, -0.01688385009765625, -0.011762619018554688, -0.006641387939453125, -0.0015201568603515625, 0.00360107421875, 0.008722305297851562, 0.013843536376953125, 0.018964767456054688, 0.02408599853515625, 0.029207229614257812, 0.034328460693359375, 0.03944969177246094, 0.0445709228515625, 0.04969215393066406, 0.054813385009765625, 0.05993461608886719, 0.06505584716796875, 0.07017707824707031, 0.07529830932617188, 0.08041954040527344, 0.085540771484375, 0.09066200256347656, 0.09578323364257812, 0.10090446472167969, 0.10602569580078125, 0.11114692687988281, 0.11626815795898438, 0.12138938903808594, 0.1265106201171875, 0.13163185119628906, 0.13675308227539062, 0.1418743133544922, 0.14699554443359375, 0.1521167755126953, 0.15723800659179688, 0.16235923767089844, 0.16748046875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 24.0, 34.0, 21.0, 36.0, 76.0, 80.0, 98.0, 109.0, 134.0, 181.0, 214.0, 277.0, 316.0, 431.0, 386.0, 319.0, 284.0, 202.0, 180.0, 161.0, 93.0, 119.0, 65.0, 51.0, 40.0, 34.0, 24.0, 19.0, 17.0, 8.0, 8.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.09442138671875, -0.09212255477905273, -0.08982372283935547, -0.0875248908996582, -0.08522605895996094, -0.08292722702026367, -0.0806283950805664, -0.07832956314086914, -0.07603073120117188, -0.07373189926147461, -0.07143306732177734, -0.06913423538208008, -0.06683540344238281, -0.06453657150268555, -0.06223773956298828, -0.059938907623291016, -0.05764007568359375, -0.055341243743896484, -0.05304241180419922, -0.05074357986450195, -0.04844474792480469, -0.04614591598510742, -0.043847084045410156, -0.04154825210571289, -0.039249420166015625, -0.03695058822631836, -0.034651756286621094, -0.03235292434692383, -0.030054092407226562, -0.027755260467529297, -0.02545642852783203, -0.023157596588134766, -0.0208587646484375, -0.018559932708740234, -0.01626110076904297, -0.013962268829345703, -0.011663436889648438, -0.009364604949951172, -0.007065773010253906, -0.004766941070556641, -0.002468109130859375, -0.00016927719116210938, 0.0021295547485351562, 0.004428386688232422, 0.0067272186279296875, 0.009026050567626953, 0.011324882507324219, 0.013623714447021484, 0.01592254638671875, 0.018221378326416016, 0.02052021026611328, 0.022819042205810547, 0.025117874145507812, 0.027416706085205078, 0.029715538024902344, 0.03201436996459961, 0.034313201904296875, 0.03661203384399414, 0.038910865783691406, 0.04120969772338867, 0.04350852966308594, 0.0458073616027832, 0.04810619354248047, 0.050405025482177734, 0.052703857421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 7.0, 6.0, 6.0, 11.0, 10.0, 11.0, 19.0, 28.0, 31.0, 21.0, 33.0, 55.0, 73.0, 75.0, 87.0, 100.0, 84.0, 72.0, 62.0, 30.0, 43.0, 24.0, 26.0, 18.0, 14.0, 10.0, 8.0, 4.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15568487346172333, -0.15036946535110474, -0.14505407214164734, -0.13973866403102875, -0.13442327082157135, -0.12910786271095276, -0.12379246950149536, -0.11847706139087677, -0.11316166818141937, -0.10784626752138138, -0.10253086686134338, -0.09721546620130539, -0.0919000655412674, -0.0865846648812294, -0.0812692642211914, -0.07595385611057281, -0.07063845545053482, -0.06532305479049683, -0.06000765413045883, -0.05469225347042084, -0.04937685281038284, -0.04406145215034485, -0.038746047765016556, -0.03343064710497856, -0.028115246444940567, -0.022799845784902573, -0.017484445124864578, -0.012169042602181435, -0.00685364194214344, -0.0015382412821054459, 0.0037771612405776978, 0.009092561900615692, 0.014407962560653687, 0.01972336322069168, 0.025038763880729675, 0.03035416640341282, 0.035669565200805664, 0.04098496586084366, 0.04630037024617195, 0.051615770906209946, 0.05693117156624794, 0.062246572226285934, 0.06756197661161423, 0.07287737727165222, 0.07819277793169022, 0.08350817859172821, 0.0888235792517662, 0.0941389799118042, 0.0994543805718422, 0.10476978123188019, 0.11008518189191818, 0.11540058255195618, 0.12071598321199417, 0.12603138387203217, 0.13134679198265076, 0.13666218519210815, 0.14197759330272675, 0.14729300141334534, 0.15260839462280273, 0.15792380273342133, 0.16323919594287872, 0.16855460405349731, 0.1738699972629547, 0.1791854053735733, 0.1845007985830307]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 3.0, 9.0, 10.0, 6.0, 6.0, 14.0, 16.0, 18.0, 22.0, 21.0, 24.0, 25.0, 34.0, 30.0, 20.0, 32.0, 32.0, 42.0, 36.0, 41.0, 38.0, 26.0, 50.0, 35.0, 37.0, 36.0, 34.0, 44.0, 26.0, 21.0, 25.0, 30.0, 32.0, 19.0, 12.0, 17.0, 9.0, 14.0, 11.0, 9.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.11413748562335968, -0.11069007962942123, -0.10724266618490219, -0.10379526019096375, -0.1003478467464447, -0.09690044075250626, -0.09345303475856781, -0.09000562131404877, -0.08655821532011032, -0.08311080932617188, -0.07966339588165283, -0.07621598988771439, -0.07276858389377594, -0.0693211704492569, -0.06587376445531845, -0.062426354736089706, -0.05897894501686096, -0.05553153529763222, -0.05208412557840347, -0.04863671958446503, -0.04518930986523628, -0.04174190014600754, -0.03829449415206909, -0.03484708443284035, -0.0313996747136116, -0.02795226499438286, -0.024504857137799263, -0.021057449281215668, -0.017610039561986923, -0.014162629842758179, -0.010715221986174583, -0.007267814129590988, -0.0038204044103622437, -0.00037299562245607376, 0.003074413165450096, 0.006521821953356266, 0.009969230741262436, 0.01341664046049118, 0.016864048317074776, 0.02031145617365837, 0.023758865892887115, 0.02720627561211586, 0.030653683468699455, 0.03410109132528305, 0.037548501044511795, 0.04099591076374054, 0.044443316757678986, 0.04789072647690773, 0.051338136196136475, 0.05478554591536522, 0.058232955634593964, 0.06168036162853241, 0.06512777507305145, 0.0685751810669899, 0.07202258706092834, 0.07547000050544739, 0.07891740649938583, 0.08236481249332428, 0.08581222593784332, 0.08925963193178177, 0.09270703792572021, 0.09615445137023926, 0.0996018573641777, 0.10304926335811615, 0.10649667680263519]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 8.0, 10.0, 11.0, 12.0, 10.0, 25.0, 29.0, 49.0, 58.0, 99.0, 147.0, 192.0, 258.0, 446.0, 681.0, 1008.0, 1425.0, 2251.0, 3378.0, 5337.0, 8260.0, 13285.0, 21038.0, 35632.0, 60729.0, 109340.0, 207121.0, 253064.0, 137730.0, 75317.0, 42760.0, 25401.0, 15511.0, 9832.0, 6291.0, 3963.0, 2610.0, 1726.0, 1104.0, 796.0, 507.0, 371.0, 223.0, 164.0, 113.0, 71.0, 55.0, 31.0, 32.0, 19.0, 10.0, 9.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.054840087890625, -0.053081512451171875, -0.05132293701171875, -0.049564361572265625, -0.0478057861328125, -0.046047210693359375, -0.04428863525390625, -0.042530059814453125, -0.040771484375, -0.039012908935546875, -0.03725433349609375, -0.035495758056640625, -0.0337371826171875, -0.031978607177734375, -0.03022003173828125, -0.028461456298828125, -0.026702880859375, -0.024944305419921875, -0.02318572998046875, -0.021427154541015625, -0.0196685791015625, -0.017910003662109375, -0.01615142822265625, -0.014392852783203125, -0.01263427734375, -0.010875701904296875, -0.00911712646484375, -0.007358551025390625, -0.0055999755859375, -0.003841400146484375, -0.00208282470703125, -0.000324249267578125, 0.001434326171875, 0.003192901611328125, 0.00495147705078125, 0.006710052490234375, 0.0084686279296875, 0.010227203369140625, 0.01198577880859375, 0.013744354248046875, 0.0155029296875, 0.017261505126953125, 0.01902008056640625, 0.020778656005859375, 0.0225372314453125, 0.024295806884765625, 0.02605438232421875, 0.027812957763671875, 0.029571533203125, 0.031330108642578125, 0.03308868408203125, 0.034847259521484375, 0.0366058349609375, 0.038364410400390625, 0.04012298583984375, 0.041881561279296875, 0.04364013671875, 0.045398712158203125, 0.04715728759765625, 0.048915863037109375, 0.0506744384765625, 0.052433013916015625, 0.05419158935546875, 0.055950164794921875, 0.057708740234375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 3.0, 6.0, 10.0, 6.0, 8.0, 6.0, 8.0, 16.0, 13.0, 14.0, 19.0, 20.0, 21.0, 27.0, 24.0, 39.0, 26.0, 41.0, 28.0, 36.0, 40.0, 43.0, 44.0, 36.0, 43.0, 45.0, 25.0, 48.0, 32.0, 36.0, 32.0, 26.0, 26.0, 27.0, 23.0, 20.0, 20.0, 14.0, 6.0, 9.0, 12.0, 5.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.12298583984375, -0.11935138702392578, -0.11571693420410156, -0.11208248138427734, -0.10844802856445312, -0.1048135757446289, -0.10117912292480469, -0.09754467010498047, -0.09391021728515625, -0.09027576446533203, -0.08664131164550781, -0.0830068588256836, -0.07937240600585938, -0.07573795318603516, -0.07210350036621094, -0.06846904754638672, -0.0648345947265625, -0.06120014190673828, -0.05756568908691406, -0.053931236267089844, -0.050296783447265625, -0.046662330627441406, -0.04302787780761719, -0.03939342498779297, -0.03575897216796875, -0.03212451934814453, -0.028490066528320312, -0.024855613708496094, -0.021221160888671875, -0.017586708068847656, -0.013952255249023438, -0.010317802429199219, -0.006683349609375, -0.0030488967895507812, 0.0005855560302734375, 0.004220008850097656, 0.007854461669921875, 0.011488914489746094, 0.015123367309570312, 0.01875782012939453, 0.02239227294921875, 0.02602672576904297, 0.029661178588867188, 0.033295631408691406, 0.036930084228515625, 0.040564537048339844, 0.04419898986816406, 0.04783344268798828, 0.0514678955078125, 0.05510234832763672, 0.05873680114746094, 0.062371253967285156, 0.06600570678710938, 0.0696401596069336, 0.07327461242675781, 0.07690906524658203, 0.08054351806640625, 0.08417797088623047, 0.08781242370605469, 0.0914468765258789, 0.09508132934570312, 0.09871578216552734, 0.10235023498535156, 0.10598468780517578, 0.109619140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 9.0, 16.0, 21.0, 42.0, 45.0, 81.0, 108.0, 147.0, 222.0, 332.0, 514.0, 721.0, 1066.0, 1612.0, 2425.0, 3830.0, 5951.0, 10656.0, 21539.0, 54528.0, 197127.0, 540498.0, 125659.0, 40299.0, 17346.0, 8868.0, 5142.0, 3257.0, 2091.0, 1425.0, 866.0, 639.0, 455.0, 318.0, 193.0, 152.0, 100.0, 88.0, 36.0, 44.0, 19.0, 15.0, 11.0, 9.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11822509765625, -0.11478328704833984, -0.11134147644042969, -0.10789966583251953, -0.10445785522460938, -0.10101604461669922, -0.09757423400878906, -0.0941324234008789, -0.09069061279296875, -0.0872488021850586, -0.08380699157714844, -0.08036518096923828, -0.07692337036132812, -0.07348155975341797, -0.07003974914550781, -0.06659793853759766, -0.0631561279296875, -0.059714317321777344, -0.05627250671386719, -0.05283069610595703, -0.049388885498046875, -0.04594707489013672, -0.04250526428222656, -0.039063453674316406, -0.03562164306640625, -0.032179832458496094, -0.028738021850585938, -0.02529621124267578, -0.021854400634765625, -0.01841259002685547, -0.014970779418945312, -0.011528968811035156, -0.008087158203125, -0.004645347595214844, -0.0012035369873046875, 0.0022382736206054688, 0.005680084228515625, 0.009121894836425781, 0.012563705444335938, 0.016005516052246094, 0.01944732666015625, 0.022889137268066406, 0.026330947875976562, 0.02977275848388672, 0.033214569091796875, 0.03665637969970703, 0.04009819030761719, 0.043540000915527344, 0.0469818115234375, 0.050423622131347656, 0.05386543273925781, 0.05730724334716797, 0.060749053955078125, 0.06419086456298828, 0.06763267517089844, 0.0710744857788086, 0.07451629638671875, 0.0779581069946289, 0.08139991760253906, 0.08484172821044922, 0.08828353881835938, 0.09172534942626953, 0.09516716003417969, 0.09860897064208984, 0.10205078125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 9.0, 9.0, 3.0, 9.0, 12.0, 17.0, 14.0, 20.0, 25.0, 23.0, 26.0, 30.0, 31.0, 42.0, 38.0, 40.0, 42.0, 38.0, 49.0, 43.0, 47.0, 28.0, 42.0, 49.0, 34.0, 34.0, 35.0, 42.0, 23.0, 24.0, 23.0, 18.0, 17.0, 10.0, 10.0, 8.0, 10.0, 9.0, 3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0809326171875, -0.07844257354736328, -0.07595252990722656, -0.07346248626708984, -0.07097244262695312, -0.0684823989868164, -0.06599235534667969, -0.06350231170654297, -0.06101226806640625, -0.05852222442626953, -0.05603218078613281, -0.053542137145996094, -0.051052093505859375, -0.048562049865722656, -0.04607200622558594, -0.04358196258544922, -0.0410919189453125, -0.03860187530517578, -0.03611183166503906, -0.033621788024902344, -0.031131744384765625, -0.028641700744628906, -0.026151657104492188, -0.02366161346435547, -0.02117156982421875, -0.01868152618408203, -0.016191482543945312, -0.013701438903808594, -0.011211395263671875, -0.008721351623535156, -0.0062313079833984375, -0.0037412643432617188, -0.001251220703125, 0.0012388229370117188, 0.0037288665771484375, 0.006218910217285156, 0.008708953857421875, 0.011198997497558594, 0.013689041137695312, 0.01617908477783203, 0.01866912841796875, 0.02115917205810547, 0.023649215698242188, 0.026139259338378906, 0.028629302978515625, 0.031119346618652344, 0.03360939025878906, 0.03609943389892578, 0.0385894775390625, 0.04107952117919922, 0.04356956481933594, 0.046059608459472656, 0.048549652099609375, 0.051039695739746094, 0.05352973937988281, 0.05601978302001953, 0.05850982666015625, 0.06099987030029297, 0.06348991394042969, 0.0659799575805664, 0.06847000122070312, 0.07096004486083984, 0.07345008850097656, 0.07594013214111328, 0.07843017578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 11.0, 7.0, 4.0, 3.0, 15.0, 10.0, 25.0, 25.0, 24.0, 54.0, 63.0, 108.0, 130.0, 155.0, 219.0, 311.0, 408.0, 578.0, 856.0, 1165.0, 1768.0, 2878.0, 4808.0, 8869.0, 19559.0, 65797.0, 750792.0, 134602.0, 27985.0, 11254.0, 5858.0, 3307.0, 2093.0, 1469.0, 920.0, 658.0, 485.0, 326.0, 240.0, 183.0, 144.0, 101.0, 66.0, 67.0, 44.0, 28.0, 28.0, 17.0, 15.0, 11.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01033782958984375, -0.010000824928283691, -0.009663820266723633, -0.009326815605163574, -0.008989810943603516, -0.008652806282043457, -0.008315801620483398, -0.00797879695892334, -0.007641792297363281, -0.007304787635803223, -0.006967782974243164, -0.0066307783126831055, -0.006293773651123047, -0.005956768989562988, -0.00561976432800293, -0.005282759666442871, -0.0049457550048828125, -0.004608750343322754, -0.004271745681762695, -0.003934741020202637, -0.003597736358642578, -0.0032607316970825195, -0.002923727035522461, -0.0025867223739624023, -0.0022497177124023438, -0.0019127130508422852, -0.0015757083892822266, -0.001238703727722168, -0.0009016990661621094, -0.0005646944046020508, -0.0002276897430419922, 0.0001093149185180664, 0.000446319580078125, 0.0007833242416381836, 0.0011203289031982422, 0.0014573335647583008, 0.0017943382263183594, 0.002131342887878418, 0.0024683475494384766, 0.002805352210998535, 0.0031423568725585938, 0.0034793615341186523, 0.003816366195678711, 0.0041533708572387695, 0.004490375518798828, 0.004827380180358887, 0.005164384841918945, 0.005501389503479004, 0.0058383941650390625, 0.006175398826599121, 0.00651240348815918, 0.006849408149719238, 0.007186412811279297, 0.0075234174728393555, 0.007860422134399414, 0.008197426795959473, 0.008534431457519531, 0.00887143611907959, 0.009208440780639648, 0.009545445442199707, 0.009882450103759766, 0.010219454765319824, 0.010556459426879883, 0.010893464088439941, 0.01123046875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 9.0, 0.0, 10.0, 14.0, 0.0, 17.0, 31.0, 0.0, 39.0, 0.0, 51.0, 69.0, 0.0, 78.0, 122.0, 0.0, 116.0, 101.0, 0.0, 105.0, 61.0, 0.0, 48.0, 24.0, 0.0, 30.0, 21.0, 0.0, 23.0, 11.0, 0.0, 6.0, 8.0, 0.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.4901161193847656e-06, -1.4510005712509155e-06, -1.4118850231170654e-06, -1.3727694749832153e-06, -1.3336539268493652e-06, -1.2945383787155151e-06, -1.255422830581665e-06, -1.216307282447815e-06, -1.1771917343139648e-06, -1.1380761861801147e-06, -1.0989606380462646e-06, -1.0598450899124146e-06, -1.0207295417785645e-06, -9.816139936447144e-07, -9.424984455108643e-07, -9.033828973770142e-07, -8.642673492431641e-07, -8.25151801109314e-07, -7.860362529754639e-07, -7.469207048416138e-07, -7.078051567077637e-07, -6.686896085739136e-07, -6.295740604400635e-07, -5.904585123062134e-07, -5.513429641723633e-07, -5.122274160385132e-07, -4.731118679046631e-07, -4.33996319770813e-07, -3.948807716369629e-07, -3.557652235031128e-07, -3.166496753692627e-07, -2.775341272354126e-07, -2.384185791015625e-07, -1.993030309677124e-07, -1.601874828338623e-07, -1.210719347000122e-07, -8.195638656616211e-08, -4.284083843231201e-08, -3.725290298461914e-09, 3.5390257835388184e-08, 7.450580596923828e-08, 1.1362135410308838e-07, 1.5273690223693848e-07, 1.9185245037078857e-07, 2.3096799850463867e-07, 2.7008354663848877e-07, 3.0919909477233887e-07, 3.4831464290618896e-07, 3.8743019104003906e-07, 4.2654573917388916e-07, 4.6566128730773926e-07, 5.047768354415894e-07, 5.438923835754395e-07, 5.830079317092896e-07, 6.221234798431396e-07, 6.612390279769897e-07, 7.003545761108398e-07, 7.394701242446899e-07, 7.7858567237854e-07, 8.177012205123901e-07, 8.568167686462402e-07, 8.959323167800903e-07, 9.350478649139404e-07, 9.741634130477905e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 3.0, 12.0, 15.0, 19.0, 33.0, 44.0, 39.0, 82.0, 117.0, 144.0, 218.0, 285.0, 413.0, 588.0, 851.0, 1152.0, 1756.0, 2886.0, 4605.0, 8050.0, 14497.0, 29322.0, 71138.0, 303502.0, 448549.0, 86873.0, 33804.0, 16244.0, 8814.0, 4998.0, 3134.0, 2015.0, 1313.0, 888.0, 638.0, 467.0, 310.0, 192.0, 167.0, 108.0, 71.0, 58.0, 38.0, 27.0, 22.0, 16.0, 8.0, 8.0, 10.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0083465576171875, -0.008094310760498047, -0.007842063903808594, -0.007589817047119141, -0.0073375701904296875, -0.007085323333740234, -0.006833076477050781, -0.006580829620361328, -0.006328582763671875, -0.006076335906982422, -0.005824089050292969, -0.005571842193603516, -0.0053195953369140625, -0.005067348480224609, -0.004815101623535156, -0.004562854766845703, -0.00431060791015625, -0.004058361053466797, -0.0038061141967773438, -0.0035538673400878906, -0.0033016204833984375, -0.0030493736267089844, -0.0027971267700195312, -0.002544879913330078, -0.002292633056640625, -0.002040386199951172, -0.0017881393432617188, -0.0015358924865722656, -0.0012836456298828125, -0.0010313987731933594, -0.0007791519165039062, -0.0005269050598144531, -0.000274658203125, -2.2411346435546875e-05, 0.00022983551025390625, 0.0004820823669433594, 0.0007343292236328125, 0.0009865760803222656, 0.0012388229370117188, 0.0014910697937011719, 0.001743316650390625, 0.001995563507080078, 0.0022478103637695312, 0.0025000572204589844, 0.0027523040771484375, 0.0030045509338378906, 0.0032567977905273438, 0.003509044647216797, 0.00376129150390625, 0.004013538360595703, 0.004265785217285156, 0.004518032073974609, 0.0047702789306640625, 0.005022525787353516, 0.005274772644042969, 0.005527019500732422, 0.005779266357421875, 0.006031513214111328, 0.006283760070800781, 0.006536006927490234, 0.0067882537841796875, 0.007040500640869141, 0.007292747497558594, 0.007544994354248047, 0.0077972412109375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 9.0, 16.0, 22.0, 23.0, 47.0, 77.0, 109.0, 210.0, 201.0, 94.0, 58.0, 30.0, 24.0, 16.0, 11.0, 6.0, 13.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003520965576171875, -0.0033950209617614746, -0.0032690763473510742, -0.003143131732940674, -0.0030171871185302734, -0.002891242504119873, -0.0027652978897094727, -0.0026393532752990723, -0.002513408660888672, -0.0023874640464782715, -0.002261519432067871, -0.0021355748176574707, -0.0020096302032470703, -0.00188368558883667, -0.0017577409744262695, -0.0016317963600158691, -0.0015058517456054688, -0.0013799071311950684, -0.001253962516784668, -0.0011280179023742676, -0.0010020732879638672, -0.0008761286735534668, -0.0007501840591430664, -0.000624239444732666, -0.0004982948303222656, -0.00037235021591186523, -0.00024640560150146484, -0.00012046098709106445, 5.4836273193359375e-06, 0.00013142824172973633, 0.0002573728561401367, 0.0003833174705505371, 0.0005092620849609375, 0.0006352066993713379, 0.0007611513137817383, 0.0008870959281921387, 0.001013040542602539, 0.0011389851570129395, 0.0012649297714233398, 0.0013908743858337402, 0.0015168190002441406, 0.001642763614654541, 0.0017687082290649414, 0.0018946528434753418, 0.002020597457885742, 0.0021465420722961426, 0.002272486686706543, 0.0023984313011169434, 0.0025243759155273438, 0.002650320529937744, 0.0027762651443481445, 0.002902209758758545, 0.0030281543731689453, 0.0031540989875793457, 0.003280043601989746, 0.0034059882164001465, 0.003531932830810547, 0.0036578774452209473, 0.0037838220596313477, 0.003909766674041748, 0.0040357112884521484, 0.004161655902862549, 0.004287600517272949, 0.00441354513168335, 0.00453948974609375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 3.0, 7.0, 6.0, 10.0, 11.0, 11.0, 19.0, 24.0, 30.0, 32.0, 27.0, 55.0, 66.0, 80.0, 93.0, 99.0, 85.0, 64.0, 57.0, 45.0, 31.0, 28.0, 35.0, 12.0, 15.0, 11.0, 7.0, 9.0, 5.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14991508424282074, -0.14460378885269165, -0.13929247856140137, -0.13398116827011108, -0.128669872879982, -0.12335857003927231, -0.11804726719856262, -0.11273596435785294, -0.10742466151714325, -0.10211335867643356, -0.09680205583572388, -0.09149075299501419, -0.0861794501543045, -0.08086814731359482, -0.07555684447288513, -0.07024554163217545, -0.06493423879146576, -0.05962293595075607, -0.05431163311004639, -0.0490003302693367, -0.043689027428627014, -0.03837772458791733, -0.03306642174720764, -0.027755118906497955, -0.02244381606578827, -0.017132513225078583, -0.011821210384368896, -0.00650990754365921, -0.001198604702949524, 0.004112698137760162, 0.009424000978469849, 0.014735303819179535, 0.020046621561050415, 0.0253579244017601, 0.030669227242469788, 0.035980530083179474, 0.04129183292388916, 0.046603135764598846, 0.05191443860530853, 0.05722574144601822, 0.0625370442867279, 0.06784834712743759, 0.07315964996814728, 0.07847095280885696, 0.08378225564956665, 0.08909355849027634, 0.09440486133098602, 0.09971616417169571, 0.1050274670124054, 0.11033876985311508, 0.11565007269382477, 0.12096137553453445, 0.12627267837524414, 0.13158398866653442, 0.1368952840566635, 0.1422065794467926, 0.14751788973808289, 0.15282920002937317, 0.15814049541950226, 0.16345179080963135, 0.16876310110092163, 0.17407441139221191, 0.179385706782341, 0.1846970021724701, 0.19000831246376038]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 5.0, 5.0, 7.0, 11.0, 6.0, 8.0, 15.0, 14.0, 22.0, 19.0, 22.0, 27.0, 24.0, 31.0, 28.0, 24.0, 32.0, 30.0, 47.0, 34.0, 40.0, 37.0, 33.0, 42.0, 37.0, 35.0, 39.0, 38.0, 38.0, 28.0, 21.0, 23.0, 31.0, 30.0, 19.0, 12.0, 15.0, 10.0, 14.0, 12.0, 6.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.11247317492961884, -0.10905071347951889, -0.10562824457883835, -0.1022057831287384, -0.09878331422805786, -0.09536085277795792, -0.09193839132785797, -0.08851592242717743, -0.08509346097707748, -0.08167099952697754, -0.078248530626297, -0.07482606917619705, -0.07140360027551651, -0.06798113882541656, -0.06455866992473602, -0.06113620847463608, -0.057713743299245834, -0.05429127812385559, -0.05086881294846535, -0.047446347773075104, -0.04402388632297516, -0.040601421147584915, -0.03717895597219467, -0.03375649452209473, -0.030334027484059334, -0.02691156230866909, -0.023489098995923996, -0.020066633820533752, -0.01664416864514351, -0.013221705332398415, -0.009799240157008171, -0.006376776844263077, -0.0029543116688728333, 0.0004681528080254793, 0.003890617284923792, 0.007313081994652748, 0.010735546238720417, 0.014158010482788086, 0.01758047565817833, 0.021002938970923424, 0.024425404146313667, 0.02784786932170391, 0.031270332634449005, 0.03469279780983925, 0.03811526298522949, 0.04153772443532944, 0.04496019333600998, 0.048382654786109924, 0.05180511996150017, 0.05522758513689041, 0.058650050312280655, 0.0620725154876709, 0.06549497693777084, 0.06891743838787079, 0.07233990728855133, 0.07576236873865128, 0.07918483763933182, 0.08260729908943176, 0.0860297679901123, 0.08945222944021225, 0.09287469834089279, 0.09629715979099274, 0.09971962869167328, 0.10314209014177322, 0.10656455159187317]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 7.0, 10.0, 14.0, 18.0, 21.0, 38.0, 48.0, 90.0, 119.0, 161.0, 254.0, 377.0, 549.0, 780.0, 1080.0, 1620.0, 2315.0, 3427.0, 4877.0, 6968.0, 10225.0, 15002.0, 22849.0, 35456.0, 58475.0, 102147.0, 192440.0, 247898.0, 135835.0, 75231.0, 44618.0, 27885.0, 18175.0, 12361.0, 8396.0, 5810.0, 4037.0, 2747.0, 1889.0, 1354.0, 924.0, 624.0, 442.0, 312.0, 201.0, 153.0, 102.0, 60.0, 44.0, 35.0, 31.0, 13.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18835067749023438, -0.18212127685546875, -0.17589187622070312, -0.1696624755859375, -0.16343307495117188, -0.15720367431640625, -0.15097427368164062, -0.144744873046875, -0.13851547241210938, -0.13228607177734375, -0.12605667114257812, -0.1198272705078125, -0.11359786987304688, -0.10736846923828125, -0.10113906860351562, -0.09490966796875, -0.08868026733398438, -0.08245086669921875, -0.07622146606445312, -0.0699920654296875, -0.06376266479492188, -0.05753326416015625, -0.051303863525390625, -0.045074462890625, -0.038845062255859375, -0.03261566162109375, -0.026386260986328125, -0.0201568603515625, -0.013927459716796875, -0.00769805908203125, -0.001468658447265625, 0.0047607421875, 0.010990142822265625, 0.01721954345703125, 0.023448944091796875, 0.0296783447265625, 0.035907745361328125, 0.04213714599609375, 0.048366546630859375, 0.054595947265625, 0.060825347900390625, 0.06705474853515625, 0.07328414916992188, 0.0795135498046875, 0.08574295043945312, 0.09197235107421875, 0.09820175170898438, 0.10443115234375, 0.11066055297851562, 0.11688995361328125, 0.12311935424804688, 0.1293487548828125, 0.13557815551757812, 0.14180755615234375, 0.14803695678710938, 0.154266357421875, 0.16049575805664062, 0.16672515869140625, 0.17295455932617188, 0.1791839599609375, 0.18541336059570312, 0.19164276123046875, 0.19787216186523438, 0.2041015625]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 6.0, 5.0, 7.0, 5.0, 7.0, 11.0, 9.0, 13.0, 16.0, 14.0, 23.0, 22.0, 18.0, 36.0, 25.0, 22.0, 35.0, 31.0, 36.0, 48.0, 45.0, 36.0, 39.0, 34.0, 30.0, 48.0, 46.0, 37.0, 35.0, 29.0, 29.0, 23.0, 24.0, 26.0, 23.0, 19.0, 22.0, 15.0, 11.0, 10.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10137939453125, -0.09828662872314453, -0.09519386291503906, -0.0921010971069336, -0.08900833129882812, -0.08591556549072266, -0.08282279968261719, -0.07973003387451172, -0.07663726806640625, -0.07354450225830078, -0.07045173645019531, -0.06735897064208984, -0.06426620483398438, -0.061173439025878906, -0.05808067321777344, -0.05498790740966797, -0.0518951416015625, -0.04880237579345703, -0.04570960998535156, -0.042616844177246094, -0.039524078369140625, -0.036431312561035156, -0.03333854675292969, -0.03024578094482422, -0.02715301513671875, -0.02406024932861328, -0.020967483520507812, -0.017874717712402344, -0.014781951904296875, -0.011689186096191406, -0.008596420288085938, -0.005503654479980469, -0.002410888671875, 0.0006818771362304688, 0.0037746429443359375, 0.006867408752441406, 0.009960174560546875, 0.013052940368652344, 0.016145706176757812, 0.01923847198486328, 0.02233123779296875, 0.02542400360107422, 0.028516769409179688, 0.031609535217285156, 0.034702301025390625, 0.037795066833496094, 0.04088783264160156, 0.04398059844970703, 0.0470733642578125, 0.05016613006591797, 0.05325889587402344, 0.056351661682128906, 0.059444427490234375, 0.06253719329833984, 0.06562995910644531, 0.06872272491455078, 0.07181549072265625, 0.07490825653076172, 0.07800102233886719, 0.08109378814697266, 0.08418655395507812, 0.0872793197631836, 0.09037208557128906, 0.09346485137939453, 0.0965576171875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 10.0, 19.0, 29.0, 25.0, 38.0, 48.0, 70.0, 127.0, 165.0, 234.0, 350.0, 437.0, 696.0, 972.0, 1490.0, 2141.0, 3256.0, 4848.0, 7139.0, 10680.0, 16643.0, 25007.0, 39247.0, 62833.0, 105524.0, 205162.0, 241392.0, 122210.0, 71284.0, 43806.0, 28197.0, 18069.0, 12080.0, 7894.0, 5321.0, 3569.0, 2438.0, 1570.0, 1076.0, 747.0, 511.0, 366.0, 274.0, 174.0, 116.0, 86.0, 49.0, 41.0, 31.0, 22.0, 16.0, 12.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.18367385864257812, -0.17777252197265625, -0.17187118530273438, -0.1659698486328125, -0.16006851196289062, -0.15416717529296875, -0.14826583862304688, -0.142364501953125, -0.13646316528320312, -0.13056182861328125, -0.12466049194335938, -0.1187591552734375, -0.11285781860351562, -0.10695648193359375, -0.10105514526367188, -0.09515380859375, -0.08925247192382812, -0.08335113525390625, -0.07744979858398438, -0.0715484619140625, -0.06564712524414062, -0.05974578857421875, -0.053844451904296875, -0.047943115234375, -0.042041778564453125, -0.03614044189453125, -0.030239105224609375, -0.0243377685546875, -0.018436431884765625, -0.01253509521484375, -0.006633758544921875, -0.000732421875, 0.005168914794921875, 0.01107025146484375, 0.016971588134765625, 0.0228729248046875, 0.028774261474609375, 0.03467559814453125, 0.040576934814453125, 0.046478271484375, 0.052379608154296875, 0.05828094482421875, 0.06418228149414062, 0.0700836181640625, 0.07598495483398438, 0.08188629150390625, 0.08778762817382812, 0.09368896484375, 0.09959030151367188, 0.10549163818359375, 0.11139297485351562, 0.1172943115234375, 0.12319564819335938, 0.12909698486328125, 0.13499832153320312, 0.140899658203125, 0.14680099487304688, 0.15270233154296875, 0.15860366821289062, 0.1645050048828125, 0.17040634155273438, 0.17630767822265625, 0.18220901489257812, 0.1881103515625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 20.0, 9.0, 10.0, 15.0, 14.0, 16.0, 17.0, 29.0, 36.0, 27.0, 37.0, 32.0, 42.0, 44.0, 37.0, 39.0, 34.0, 44.0, 27.0, 46.0, 40.0, 41.0, 30.0, 40.0, 32.0, 20.0, 22.0, 28.0, 24.0, 18.0, 22.0, 21.0, 13.0, 11.0, 10.0, 6.0, 10.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06451416015625, -0.06258249282836914, -0.06065082550048828, -0.05871915817260742, -0.05678749084472656, -0.0548558235168457, -0.052924156188964844, -0.050992488861083984, -0.049060821533203125, -0.047129154205322266, -0.045197486877441406, -0.04326581954956055, -0.04133415222167969, -0.03940248489379883, -0.03747081756591797, -0.03553915023803711, -0.03360748291015625, -0.03167581558227539, -0.02974414825439453, -0.027812480926513672, -0.025880813598632812, -0.023949146270751953, -0.022017478942871094, -0.020085811614990234, -0.018154144287109375, -0.016222476959228516, -0.014290809631347656, -0.012359142303466797, -0.010427474975585938, -0.008495807647705078, -0.006564140319824219, -0.004632472991943359, -0.0027008056640625, -0.0007691383361816406, 0.0011625289916992188, 0.003094196319580078, 0.0050258636474609375, 0.006957530975341797, 0.008889198303222656, 0.010820865631103516, 0.012752532958984375, 0.014684200286865234, 0.016615867614746094, 0.018547534942626953, 0.020479202270507812, 0.022410869598388672, 0.02434253692626953, 0.02627420425415039, 0.02820587158203125, 0.03013753890991211, 0.03206920623779297, 0.03400087356567383, 0.03593254089355469, 0.03786420822143555, 0.039795875549316406, 0.041727542877197266, 0.043659210205078125, 0.045590877532958984, 0.047522544860839844, 0.0494542121887207, 0.05138587951660156, 0.05331754684448242, 0.05524921417236328, 0.05718088150024414, 0.059112548828125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 9.0, 7.0, 9.0, 15.0, 19.0, 40.0, 59.0, 77.0, 71.0, 130.0, 137.0, 197.0, 271.0, 378.0, 515.0, 743.0, 1075.0, 1560.0, 2309.0, 3587.0, 7691.0, 52042.0, 943559.0, 18996.0, 5516.0, 3014.0, 1887.0, 1328.0, 929.0, 623.0, 476.0, 339.0, 239.0, 174.0, 131.0, 98.0, 73.0, 73.0, 41.0, 36.0, 19.0, 13.0, 16.0, 5.0, 6.0, 8.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0631103515625, -0.06109428405761719, -0.059078216552734375, -0.05706214904785156, -0.05504608154296875, -0.05303001403808594, -0.051013946533203125, -0.04899787902832031, -0.0469818115234375, -0.04496574401855469, -0.042949676513671875, -0.04093360900878906, -0.03891754150390625, -0.03690147399902344, -0.034885406494140625, -0.03286933898925781, -0.030853271484375, -0.028837203979492188, -0.026821136474609375, -0.024805068969726562, -0.02278900146484375, -0.020772933959960938, -0.018756866455078125, -0.016740798950195312, -0.0147247314453125, -0.012708663940429688, -0.010692596435546875, -0.008676528930664062, -0.00666046142578125, -0.0046443939208984375, -0.002628326416015625, -0.0006122589111328125, 0.00140380859375, 0.0034198760986328125, 0.005435943603515625, 0.0074520111083984375, 0.00946807861328125, 0.011484146118164062, 0.013500213623046875, 0.015516281127929688, 0.0175323486328125, 0.019548416137695312, 0.021564483642578125, 0.023580551147460938, 0.02559661865234375, 0.027612686157226562, 0.029628753662109375, 0.03164482116699219, 0.033660888671875, 0.03567695617675781, 0.037693023681640625, 0.03970909118652344, 0.04172515869140625, 0.04374122619628906, 0.045757293701171875, 0.04777336120605469, 0.0497894287109375, 0.05180549621582031, 0.053821563720703125, 0.05583763122558594, 0.05785369873046875, 0.05986976623535156, 0.061885833740234375, 0.06390190124511719, 0.06591796875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 8.0, 13.0, 20.0, 60.0, 182.0, 293.0, 235.0, 127.0, 24.0, 22.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.3934990167617798e-06, -2.2836029529571533e-06, -2.173706889152527e-06, -2.0638108253479004e-06, -1.953914761543274e-06, -1.8440186977386475e-06, -1.734122633934021e-06, -1.6242265701293945e-06, -1.514330506324768e-06, -1.4044344425201416e-06, -1.2945383787155151e-06, -1.1846423149108887e-06, -1.0747462511062622e-06, -9.648501873016357e-07, -8.549541234970093e-07, -7.450580596923828e-07, -6.351619958877563e-07, -5.252659320831299e-07, -4.153698682785034e-07, -3.0547380447387695e-07, -1.955777406692505e-07, -8.568167686462402e-08, 2.421438694000244e-08, 1.341104507446289e-07, 2.4400651454925537e-07, 3.5390257835388184e-07, 4.637986421585083e-07, 5.736947059631348e-07, 6.835907697677612e-07, 7.934868335723877e-07, 9.033828973770142e-07, 1.0132789611816406e-06, 1.123175024986267e-06, 1.2330710887908936e-06, 1.34296715259552e-06, 1.4528632164001465e-06, 1.562759280204773e-06, 1.6726553440093994e-06, 1.7825514078140259e-06, 1.8924474716186523e-06, 2.002343535423279e-06, 2.1122395992279053e-06, 2.2221356630325317e-06, 2.332031726837158e-06, 2.4419277906417847e-06, 2.551823854446411e-06, 2.6617199182510376e-06, 2.771615982055664e-06, 2.8815120458602905e-06, 2.991408109664917e-06, 3.1013041734695435e-06, 3.21120023727417e-06, 3.3210963010787964e-06, 3.430992364883423e-06, 3.5408884286880493e-06, 3.6507844924926758e-06, 3.7606805562973022e-06, 3.870576620101929e-06, 3.980472683906555e-06, 4.090368747711182e-06, 4.200264811515808e-06, 4.3101608753204346e-06, 4.420056939125061e-06, 4.5299530029296875e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 11.0, 3.0, 11.0, 18.0, 31.0, 28.0, 45.0, 77.0, 112.0, 145.0, 234.0, 368.0, 567.0, 869.0, 1298.0, 1985.0, 3242.0, 7069.0, 47270.0, 956945.0, 15889.0, 4853.0, 2625.0, 1652.0, 1116.0, 717.0, 473.0, 290.0, 188.0, 126.0, 90.0, 74.0, 31.0, 28.0, 22.0, 20.0, 10.0, 4.0, 7.0, 7.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0770263671875, -0.07471275329589844, -0.07239913940429688, -0.07008552551269531, -0.06777191162109375, -0.06545829772949219, -0.06314468383789062, -0.06083106994628906, -0.0585174560546875, -0.05620384216308594, -0.053890228271484375, -0.05157661437988281, -0.04926300048828125, -0.04694938659667969, -0.044635772705078125, -0.04232215881347656, -0.040008544921875, -0.03769493103027344, -0.035381317138671875, -0.03306770324707031, -0.03075408935546875, -0.028440475463867188, -0.026126861572265625, -0.023813247680664062, -0.0214996337890625, -0.019186019897460938, -0.016872406005859375, -0.014558792114257812, -0.01224517822265625, -0.009931564331054688, -0.007617950439453125, -0.0053043365478515625, -0.00299072265625, -0.0006771087646484375, 0.001636505126953125, 0.0039501190185546875, 0.00626373291015625, 0.008577346801757812, 0.010890960693359375, 0.013204574584960938, 0.0155181884765625, 0.017831802368164062, 0.020145416259765625, 0.022459030151367188, 0.02477264404296875, 0.027086257934570312, 0.029399871826171875, 0.03171348571777344, 0.034027099609375, 0.03634071350097656, 0.038654327392578125, 0.04096794128417969, 0.04328155517578125, 0.04559516906738281, 0.047908782958984375, 0.05022239685058594, 0.0525360107421875, 0.05484962463378906, 0.057163238525390625, 0.05947685241699219, 0.06179046630859375, 0.06410408020019531, 0.06641769409179688, 0.06873130798339844, 0.071044921875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 8.0, 7.0, 12.0, 30.0, 132.0, 669.0, 85.0, 21.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015960693359375, -0.015449762344360352, -0.014938831329345703, -0.014427900314331055, -0.013916969299316406, -0.013406038284301758, -0.01289510726928711, -0.012384176254272461, -0.011873245239257812, -0.011362314224243164, -0.010851383209228516, -0.010340452194213867, -0.009829521179199219, -0.00931859016418457, -0.008807659149169922, -0.008296728134155273, -0.007785797119140625, -0.0072748661041259766, -0.006763935089111328, -0.00625300407409668, -0.005742073059082031, -0.005231142044067383, -0.004720211029052734, -0.004209280014038086, -0.0036983489990234375, -0.003187417984008789, -0.0026764869689941406, -0.002165555953979492, -0.0016546249389648438, -0.0011436939239501953, -0.0006327629089355469, -0.00012183189392089844, 0.00038909912109375, 0.0009000301361083984, 0.0014109611511230469, 0.0019218921661376953, 0.0024328231811523438, 0.002943754196166992, 0.0034546852111816406, 0.003965616226196289, 0.0044765472412109375, 0.004987478256225586, 0.005498409271240234, 0.006009340286254883, 0.006520271301269531, 0.00703120231628418, 0.007542133331298828, 0.008053064346313477, 0.008563995361328125, 0.009074926376342773, 0.009585857391357422, 0.01009678840637207, 0.010607719421386719, 0.011118650436401367, 0.011629581451416016, 0.012140512466430664, 0.012651443481445312, 0.013162374496459961, 0.01367330551147461, 0.014184236526489258, 0.014695167541503906, 0.015206098556518555, 0.015717029571533203, 0.01622796058654785, 0.0167388916015625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 9.0, 19.0, 18.0, 19.0, 24.0, 29.0, 50.0, 70.0, 85.0, 110.0, 115.0, 112.0, 83.0, 51.0, 40.0, 33.0, 35.0, 16.0, 14.0, 22.0, 6.0, 8.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19458512961864471, -0.18875442445278168, -0.18292370438575745, -0.1770929992198944, -0.17126227915287018, -0.16543157398700714, -0.1596008539199829, -0.15377014875411987, -0.14793944358825684, -0.1421087384223938, -0.13627801835536957, -0.13044731318950653, -0.1246165931224823, -0.11878588795661926, -0.11295517534017563, -0.107124462723732, -0.10129374265670776, -0.09546303004026413, -0.0896323174238205, -0.08380161225795746, -0.07797089219093323, -0.07214018702507019, -0.06630947440862656, -0.06047876179218292, -0.05464804917573929, -0.048817336559295654, -0.04298662394285202, -0.037155915051698685, -0.03132520243525505, -0.025494489818811417, -0.01966378092765808, -0.013833068311214447, -0.008002355694770813, -0.0021716440096497536, 0.003659067675471306, 0.00948977842926979, 0.015320491045713425, 0.02115120366215706, 0.026981912553310394, 0.03281262516975403, 0.03864333778619766, 0.044474050402641296, 0.05030476301908493, 0.056135471910238266, 0.0619661845266819, 0.06779690086841583, 0.07362760603427887, 0.0794583186507225, 0.08528903126716614, 0.09111974388360977, 0.0969504565000534, 0.10278116166591644, 0.10861188173294067, 0.11444258689880371, 0.12027329951524734, 0.12610401213169098, 0.1319347321987152, 0.13776543736457825, 0.14359615743160248, 0.14942686259746552, 0.15525758266448975, 0.16108828783035278, 0.16691899299621582, 0.17274971306324005, 0.1785804182291031]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 6.0, 4.0, 3.0, 6.0, 5.0, 10.0, 13.0, 6.0, 11.0, 16.0, 14.0, 13.0, 14.0, 21.0, 25.0, 28.0, 27.0, 37.0, 21.0, 29.0, 24.0, 37.0, 26.0, 31.0, 23.0, 47.0, 45.0, 39.0, 31.0, 44.0, 35.0, 33.0, 19.0, 31.0, 28.0, 30.0, 23.0, 21.0, 10.0, 16.0, 14.0, 13.0, 22.0, 8.0, 7.0, 11.0, 8.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.09476493299007416, -0.09184814244508743, -0.08893135190010071, -0.08601456135511398, -0.08309777081012726, -0.08018098026514053, -0.07726418972015381, -0.07434739917516708, -0.07143060863018036, -0.06851381808519363, -0.06559702754020691, -0.06268023699522018, -0.05976344645023346, -0.056846655905246735, -0.05392986536026001, -0.051013074815273285, -0.04809628054499626, -0.04517949000000954, -0.04226269945502281, -0.03934590891003609, -0.03642911836504936, -0.03351232782006264, -0.030595535412430763, -0.02767874486744404, -0.024761954322457314, -0.02184516377747059, -0.018928373232483864, -0.01601158082485199, -0.01309479121118784, -0.010178000666201115, -0.007261209189891815, -0.00434441864490509, -0.0014276280999183655, 0.001489162677899003, 0.0044059534557163715, 0.007322744466364384, 0.010239535011351109, 0.013156325556337833, 0.016073117032647133, 0.018989907577633858, 0.021906698122620583, 0.024823488667607307, 0.027740279212594032, 0.030657071620225906, 0.03357386216521263, 0.036490652710199356, 0.03940744325518608, 0.042324233800172806, 0.04524102434515953, 0.048157814890146255, 0.05107460543513298, 0.053991395980119705, 0.05690818652510643, 0.059824977070093155, 0.06274177134037018, 0.0656585618853569, 0.06857535243034363, 0.07149214297533035, 0.07440893352031708, 0.0773257240653038, 0.08024251461029053, 0.08315930515527725, 0.08607609570026398, 0.0889928862452507, 0.09190967679023743]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 9.0, 10.0, 14.0, 18.0, 14.0, 31.0, 51.0, 68.0, 109.0, 149.0, 211.0, 313.0, 492.0, 722.0, 1198.0, 1818.0, 2714.0, 4350.0, 6961.0, 10902.0, 17796.0, 29025.0, 50218.0, 87553.0, 169937.0, 427329.0, 1471892.0, 1231350.0, 338303.0, 146190.0, 77743.0, 43786.0, 26151.0, 16534.0, 10160.0, 6692.0, 4447.0, 2960.0, 1910.0, 1270.0, 860.0, 678.0, 426.0, 302.0, 175.0, 135.0, 115.0, 69.0, 51.0, 32.0, 22.0, 9.0, 6.0, 6.0, 3.0, 5.0, 2.0], "bins": [-0.1461181640625, -0.14180946350097656, -0.13750076293945312, -0.1331920623779297, -0.12888336181640625, -0.12457466125488281, -0.12026596069335938, -0.11595726013183594, -0.1116485595703125, -0.10733985900878906, -0.10303115844726562, -0.09872245788574219, -0.09441375732421875, -0.09010505676269531, -0.08579635620117188, -0.08148765563964844, -0.077178955078125, -0.07287025451660156, -0.06856155395507812, -0.06425285339355469, -0.05994415283203125, -0.05563545227050781, -0.051326751708984375, -0.04701805114746094, -0.0427093505859375, -0.03840065002441406, -0.034091949462890625, -0.029783248901367188, -0.02547454833984375, -0.021165847778320312, -0.016857147216796875, -0.012548446655273438, -0.00823974609375, -0.0039310455322265625, 0.000377655029296875, 0.0046863555908203125, 0.00899505615234375, 0.013303756713867188, 0.017612457275390625, 0.021921157836914062, 0.0262298583984375, 0.030538558959960938, 0.034847259521484375, 0.03915596008300781, 0.04346466064453125, 0.04777336120605469, 0.052082061767578125, 0.05639076232910156, 0.060699462890625, 0.06500816345214844, 0.06931686401367188, 0.07362556457519531, 0.07793426513671875, 0.08224296569824219, 0.08655166625976562, 0.09086036682128906, 0.0951690673828125, 0.09947776794433594, 0.10378646850585938, 0.10809516906738281, 0.11240386962890625, 0.11671257019042969, 0.12102127075195312, 0.12532997131347656, 0.129638671875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 6.0, 11.0, 8.0, 20.0, 14.0, 8.0, 8.0, 15.0, 27.0, 25.0, 28.0, 31.0, 22.0, 35.0, 17.0, 29.0, 33.0, 37.0, 38.0, 43.0, 33.0, 45.0, 33.0, 48.0, 38.0, 35.0, 25.0, 31.0, 39.0, 25.0, 21.0, 32.0, 15.0, 13.0, 19.0, 17.0, 11.0, 13.0, 13.0, 7.0, 8.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.062103271484375, -0.06027650833129883, -0.058449745178222656, -0.056622982025146484, -0.05479621887207031, -0.05296945571899414, -0.05114269256591797, -0.0493159294128418, -0.047489166259765625, -0.04566240310668945, -0.04383563995361328, -0.04200887680053711, -0.04018211364746094, -0.038355350494384766, -0.036528587341308594, -0.03470182418823242, -0.03287506103515625, -0.031048297882080078, -0.029221534729003906, -0.027394771575927734, -0.025568008422851562, -0.02374124526977539, -0.02191448211669922, -0.020087718963623047, -0.018260955810546875, -0.016434192657470703, -0.014607429504394531, -0.01278066635131836, -0.010953903198242188, -0.009127140045166016, -0.007300376892089844, -0.005473613739013672, -0.0036468505859375, -0.0018200874328613281, 6.67572021484375e-06, 0.0018334388732910156, 0.0036602020263671875, 0.005486965179443359, 0.007313728332519531, 0.009140491485595703, 0.010967254638671875, 0.012794017791748047, 0.014620780944824219, 0.01644754409790039, 0.018274307250976562, 0.020101070404052734, 0.021927833557128906, 0.023754596710205078, 0.02558135986328125, 0.027408123016357422, 0.029234886169433594, 0.031061649322509766, 0.03288841247558594, 0.03471517562866211, 0.03654193878173828, 0.03836870193481445, 0.040195465087890625, 0.0420222282409668, 0.04384899139404297, 0.04567575454711914, 0.04750251770019531, 0.049329280853271484, 0.051156044006347656, 0.05298280715942383, 0.0548095703125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 12.0, 10.0, 30.0, 36.0, 78.0, 103.0, 173.0, 240.0, 415.0, 586.0, 941.0, 1542.0, 2517.0, 4161.0, 6543.0, 11222.0, 18891.0, 32929.0, 59792.0, 114914.0, 237376.0, 562145.0, 1543254.0, 910008.0, 344584.0, 158712.0, 80042.0, 43009.0, 24377.0, 13850.0, 8288.0, 5080.0, 3124.0, 1910.0, 1262.0, 770.0, 461.0, 329.0, 195.0, 118.0, 91.0, 59.0, 34.0, 23.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1141357421875, -0.11053848266601562, -0.10694122314453125, -0.10334396362304688, -0.0997467041015625, -0.09614944458007812, -0.09255218505859375, -0.08895492553710938, -0.085357666015625, -0.08176040649414062, -0.07816314697265625, -0.07456588745117188, -0.0709686279296875, -0.06737136840820312, -0.06377410888671875, -0.060176849365234375, -0.05657958984375, -0.052982330322265625, -0.04938507080078125, -0.045787811279296875, -0.0421905517578125, -0.038593292236328125, -0.03499603271484375, -0.031398773193359375, -0.027801513671875, -0.024204254150390625, -0.02060699462890625, -0.017009735107421875, -0.0134124755859375, -0.009815216064453125, -0.00621795654296875, -0.002620697021484375, 0.0009765625, 0.004573822021484375, 0.00817108154296875, 0.011768341064453125, 0.0153656005859375, 0.018962860107421875, 0.02256011962890625, 0.026157379150390625, 0.029754638671875, 0.033351898193359375, 0.03694915771484375, 0.040546417236328125, 0.0441436767578125, 0.047740936279296875, 0.05133819580078125, 0.054935455322265625, 0.05853271484375, 0.062129974365234375, 0.06572723388671875, 0.06932449340820312, 0.0729217529296875, 0.07651901245117188, 0.08011627197265625, 0.08371353149414062, 0.087310791015625, 0.09090805053710938, 0.09450531005859375, 0.09810256958007812, 0.1016998291015625, 0.10529708862304688, 0.10889434814453125, 0.11249160766601562, 0.1160888671875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 11.0, 7.0, 11.0, 11.0, 25.0, 33.0, 38.0, 48.0, 69.0, 70.0, 113.0, 114.0, 180.0, 182.0, 214.0, 252.0, 298.0, 352.0, 351.0, 296.0, 275.0, 217.0, 180.0, 143.0, 125.0, 87.0, 70.0, 64.0, 56.0, 45.0, 34.0, 33.0, 19.0, 11.0, 12.0, 10.0, 10.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034942626953125, -0.03374147415161133, -0.032540321350097656, -0.031339168548583984, -0.030138015747070312, -0.02893686294555664, -0.02773571014404297, -0.026534557342529297, -0.025333404541015625, -0.024132251739501953, -0.02293109893798828, -0.02172994613647461, -0.020528793334960938, -0.019327640533447266, -0.018126487731933594, -0.016925334930419922, -0.01572418212890625, -0.014523029327392578, -0.013321876525878906, -0.012120723724365234, -0.010919570922851562, -0.00971841812133789, -0.008517265319824219, -0.007316112518310547, -0.006114959716796875, -0.004913806915283203, -0.0037126541137695312, -0.0025115013122558594, -0.0013103485107421875, -0.00010919570922851562, 0.0010919570922851562, 0.002293109893798828, 0.0034942626953125, 0.004695415496826172, 0.005896568298339844, 0.007097721099853516, 0.008298873901367188, 0.00950002670288086, 0.010701179504394531, 0.011902332305908203, 0.013103485107421875, 0.014304637908935547, 0.015505790710449219, 0.01670694351196289, 0.017908096313476562, 0.019109249114990234, 0.020310401916503906, 0.021511554718017578, 0.02271270751953125, 0.023913860321044922, 0.025115013122558594, 0.026316165924072266, 0.027517318725585938, 0.02871847152709961, 0.02991962432861328, 0.031120777130126953, 0.032321929931640625, 0.0335230827331543, 0.03472423553466797, 0.03592538833618164, 0.03712654113769531, 0.038327693939208984, 0.039528846740722656, 0.04072999954223633, 0.04193115234375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 15.0, 12.0, 25.0, 24.0, 42.0, 33.0, 57.0, 62.0, 86.0, 91.0, 109.0, 80.0, 66.0, 61.0, 41.0, 35.0, 25.0, 18.0, 20.0, 19.0, 15.0, 10.0, 9.0, 7.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.086305171251297, -0.08304010331630707, -0.07977503538131714, -0.07650996744632721, -0.07324489951133728, -0.06997983157634735, -0.06671475619077682, -0.0634496882557869, -0.06018462032079697, -0.05691955238580704, -0.05365448445081711, -0.05038941279053688, -0.04712434485554695, -0.04385927692055702, -0.040594205260276794, -0.037329137325286865, -0.034064069390296936, -0.030799001455307007, -0.02753393165767193, -0.02426886186003685, -0.02100379392504692, -0.01773872599005699, -0.014473656192421913, -0.011208586394786835, -0.007943518459796906, -0.004678449593484402, -0.0014133807271718979, 0.001851688139140606, 0.00511675700545311, 0.008381824940443039, 0.011646894738078117, 0.014911964535713196, 0.018177025020122528, 0.021442092955112457, 0.024707162752747536, 0.027972232550382614, 0.031237300485372543, 0.03450236842036247, 0.0377674400806427, 0.04103250801563263, 0.04429757595062256, 0.04756264388561249, 0.05082771182060242, 0.054092783480882645, 0.057357851415872574, 0.0606229193508625, 0.06388799101114273, 0.06715305894613266, 0.07041812688112259, 0.07368319481611252, 0.07694826275110245, 0.08021333068609238, 0.0834784060716629, 0.08674347400665283, 0.09000854194164276, 0.09327360987663269, 0.09653867781162262, 0.09980374574661255, 0.10306881368160248, 0.10633388161659241, 0.10959894955158234, 0.11286401748657227, 0.11612909287214279, 0.11939416080713272, 0.12265922874212265]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 11.0, 7.0, 10.0, 9.0, 13.0, 15.0, 19.0, 22.0, 17.0, 18.0, 24.0, 26.0, 27.0, 31.0, 35.0, 48.0, 28.0, 37.0, 40.0, 42.0, 42.0, 50.0, 41.0, 32.0, 39.0, 27.0, 31.0, 25.0, 28.0, 32.0, 21.0, 26.0, 21.0, 16.0, 14.0, 12.0, 10.0, 11.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06868283450603485, -0.06658975034952164, -0.06449666619300842, -0.06240358203649521, -0.060310497879981995, -0.05821741372346878, -0.056124329566955566, -0.05403124541044235, -0.05193816125392914, -0.049845077097415924, -0.04775199294090271, -0.045658908784389496, -0.04356582462787628, -0.04147274047136307, -0.039379656314849854, -0.03728657215833664, -0.035193488001823425, -0.03310040384531021, -0.031007319688796997, -0.028914235532283783, -0.02682115137577057, -0.024728067219257355, -0.02263498306274414, -0.020541898906230927, -0.018448814749717712, -0.0163557305932045, -0.014262646436691284, -0.01216956228017807, -0.010076478123664856, -0.007983393967151642, -0.005890309810638428, -0.0037972256541252136, -0.0017041414976119995, 0.0003889426589012146, 0.0024820268154144287, 0.004575110971927643, 0.006668195128440857, 0.008761279284954071, 0.010854363441467285, 0.0129474475979805, 0.015040531754493713, 0.017133615911006927, 0.01922670006752014, 0.021319784224033356, 0.02341286838054657, 0.025505952537059784, 0.027599036693572998, 0.029692120850086212, 0.031785205006599426, 0.03387828916311264, 0.035971373319625854, 0.03806445747613907, 0.04015754163265228, 0.0422506257891655, 0.04434370994567871, 0.046436794102191925, 0.04852987825870514, 0.05062296241521835, 0.05271604657173157, 0.05480913072824478, 0.056902214884757996, 0.05899529904127121, 0.061088383197784424, 0.06318146735429764, 0.06527455151081085]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 9.0, 18.0, 28.0, 25.0, 38.0, 78.0, 93.0, 106.0, 206.0, 283.0, 402.0, 536.0, 804.0, 1090.0, 1622.0, 2261.0, 3385.0, 4984.0, 7233.0, 11082.0, 17042.0, 26491.0, 43420.0, 72172.0, 125765.0, 221339.0, 207079.0, 118364.0, 68098.0, 40430.0, 25205.0, 16043.0, 10506.0, 7091.0, 4683.0, 3167.0, 2266.0, 1492.0, 1091.0, 780.0, 494.0, 362.0, 278.0, 202.0, 126.0, 86.0, 58.0, 44.0, 37.0, 24.0, 15.0, 11.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.029266357421875, -0.028350114822387695, -0.02743387222290039, -0.026517629623413086, -0.02560138702392578, -0.024685144424438477, -0.023768901824951172, -0.022852659225463867, -0.021936416625976562, -0.021020174026489258, -0.020103931427001953, -0.01918768882751465, -0.018271446228027344, -0.01735520362854004, -0.016438961029052734, -0.01552271842956543, -0.014606475830078125, -0.01369023323059082, -0.012773990631103516, -0.011857748031616211, -0.010941505432128906, -0.010025262832641602, -0.009109020233154297, -0.008192777633666992, -0.0072765350341796875, -0.006360292434692383, -0.005444049835205078, -0.0045278072357177734, -0.0036115646362304688, -0.002695322036743164, -0.0017790794372558594, -0.0008628368377685547, 5.340576171875e-05, 0.0009696483612060547, 0.0018858909606933594, 0.002802133560180664, 0.0037183761596679688, 0.0046346187591552734, 0.005550861358642578, 0.006467103958129883, 0.0073833465576171875, 0.008299589157104492, 0.009215831756591797, 0.010132074356079102, 0.011048316955566406, 0.011964559555053711, 0.012880802154541016, 0.01379704475402832, 0.014713287353515625, 0.01562952995300293, 0.016545772552490234, 0.01746201515197754, 0.018378257751464844, 0.01929450035095215, 0.020210742950439453, 0.021126985549926758, 0.022043228149414062, 0.022959470748901367, 0.023875713348388672, 0.024791955947875977, 0.02570819854736328, 0.026624441146850586, 0.02754068374633789, 0.028456926345825195, 0.0293731689453125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 8.0, 7.0, 8.0, 9.0, 9.0, 17.0, 17.0, 20.0, 16.0, 22.0, 21.0, 30.0, 33.0, 36.0, 29.0, 37.0, 42.0, 51.0, 40.0, 51.0, 47.0, 46.0, 36.0, 38.0, 42.0, 36.0, 26.0, 29.0, 41.0, 24.0, 21.0, 25.0, 17.0, 12.0, 8.0, 6.0, 11.0, 7.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0811767578125, -0.0788259506225586, -0.07647514343261719, -0.07412433624267578, -0.07177352905273438, -0.06942272186279297, -0.06707191467285156, -0.06472110748291016, -0.06237030029296875, -0.060019493103027344, -0.05766868591308594, -0.05531787872314453, -0.052967071533203125, -0.05061626434326172, -0.04826545715332031, -0.045914649963378906, -0.0435638427734375, -0.041213035583496094, -0.03886222839355469, -0.03651142120361328, -0.034160614013671875, -0.03180980682373047, -0.029458999633789062, -0.027108192443847656, -0.02475738525390625, -0.022406578063964844, -0.020055770874023438, -0.01770496368408203, -0.015354156494140625, -0.013003349304199219, -0.010652542114257812, -0.008301734924316406, -0.005950927734375, -0.0036001205444335938, -0.0012493133544921875, 0.0011014938354492188, 0.003452301025390625, 0.005803108215332031, 0.008153915405273438, 0.010504722595214844, 0.01285552978515625, 0.015206336975097656, 0.017557144165039062, 0.01990795135498047, 0.022258758544921875, 0.02460956573486328, 0.026960372924804688, 0.029311180114746094, 0.0316619873046875, 0.034012794494628906, 0.03636360168457031, 0.03871440887451172, 0.041065216064453125, 0.04341602325439453, 0.04576683044433594, 0.048117637634277344, 0.05046844482421875, 0.052819252014160156, 0.05517005920410156, 0.05752086639404297, 0.059871673583984375, 0.06222248077392578, 0.06457328796386719, 0.0669240951538086, 0.06927490234375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 2.0, 7.0, 8.0, 11.0, 29.0, 31.0, 44.0, 72.0, 104.0, 115.0, 195.0, 278.0, 369.0, 544.0, 783.0, 1261.0, 1794.0, 2770.0, 4448.0, 7504.0, 13715.0, 29816.0, 81579.0, 366639.0, 387322.0, 83997.0, 30423.0, 13984.0, 7717.0, 4471.0, 2855.0, 1772.0, 1264.0, 812.0, 547.0, 387.0, 258.0, 189.0, 113.0, 95.0, 67.0, 46.0, 33.0, 26.0, 19.0, 11.0, 7.0, 5.0, 9.0, 5.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.0626220703125, -0.060781002044677734, -0.05893993377685547, -0.0570988655090332, -0.05525779724121094, -0.05341672897338867, -0.051575660705566406, -0.04973459243774414, -0.047893524169921875, -0.04605245590209961, -0.044211387634277344, -0.04237031936645508, -0.04052925109863281, -0.03868818283081055, -0.03684711456298828, -0.035006046295166016, -0.03316497802734375, -0.031323909759521484, -0.02948284149169922, -0.027641773223876953, -0.025800704956054688, -0.023959636688232422, -0.022118568420410156, -0.02027750015258789, -0.018436431884765625, -0.01659536361694336, -0.014754295349121094, -0.012913227081298828, -0.011072158813476562, -0.009231090545654297, -0.007390022277832031, -0.005548954010009766, -0.0037078857421875, -0.0018668174743652344, -2.574920654296875e-05, 0.0018153190612792969, 0.0036563873291015625, 0.005497455596923828, 0.007338523864746094, 0.00917959213256836, 0.011020660400390625, 0.01286172866821289, 0.014702796936035156, 0.016543865203857422, 0.018384933471679688, 0.020226001739501953, 0.02206707000732422, 0.023908138275146484, 0.02574920654296875, 0.027590274810791016, 0.02943134307861328, 0.03127241134643555, 0.03311347961425781, 0.03495454788208008, 0.036795616149902344, 0.03863668441772461, 0.040477752685546875, 0.04231882095336914, 0.044159889221191406, 0.04600095748901367, 0.04784202575683594, 0.0496830940246582, 0.05152416229248047, 0.053365230560302734, 0.055206298828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 6.0, 8.0, 14.0, 16.0, 20.0, 20.0, 17.0, 21.0, 33.0, 29.0, 28.0, 36.0, 39.0, 47.0, 38.0, 44.0, 45.0, 44.0, 53.0, 47.0, 40.0, 26.0, 36.0, 34.0, 31.0, 33.0, 34.0, 20.0, 22.0, 17.0, 17.0, 13.0, 14.0, 10.0, 10.0, 6.0, 9.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04766845703125, -0.046236515045166016, -0.04480457305908203, -0.04337263107299805, -0.04194068908691406, -0.04050874710083008, -0.039076805114746094, -0.03764486312866211, -0.036212921142578125, -0.03478097915649414, -0.033349037170410156, -0.03191709518432617, -0.030485153198242188, -0.029053211212158203, -0.02762126922607422, -0.026189327239990234, -0.02475738525390625, -0.023325443267822266, -0.02189350128173828, -0.020461559295654297, -0.019029617309570312, -0.017597675323486328, -0.016165733337402344, -0.01473379135131836, -0.013301849365234375, -0.01186990737915039, -0.010437965393066406, -0.009006023406982422, -0.0075740814208984375, -0.006142139434814453, -0.004710197448730469, -0.0032782554626464844, -0.0018463134765625, -0.0004143714904785156, 0.0010175704956054688, 0.002449512481689453, 0.0038814544677734375, 0.005313396453857422, 0.006745338439941406, 0.00817728042602539, 0.009609222412109375, 0.01104116439819336, 0.012473106384277344, 0.013905048370361328, 0.015336990356445312, 0.016768932342529297, 0.01820087432861328, 0.019632816314697266, 0.02106475830078125, 0.022496700286865234, 0.02392864227294922, 0.025360584259033203, 0.026792526245117188, 0.028224468231201172, 0.029656410217285156, 0.03108835220336914, 0.032520294189453125, 0.03395223617553711, 0.035384178161621094, 0.03681612014770508, 0.03824806213378906, 0.03968000411987305, 0.04111194610595703, 0.042543888092041016, 0.043975830078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 1.0, 10.0, 20.0, 26.0, 23.0, 37.0, 53.0, 45.0, 68.0, 100.0, 118.0, 160.0, 238.0, 306.0, 375.0, 527.0, 767.0, 1303.0, 2018.0, 3596.0, 6929.0, 14292.0, 44657.0, 653457.0, 259433.0, 33353.0, 11943.0, 5769.0, 3149.0, 1756.0, 1145.0, 787.0, 513.0, 413.0, 289.0, 238.0, 162.0, 129.0, 80.0, 65.0, 60.0, 41.0, 30.0, 17.0, 10.0, 7.0, 8.0, 11.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0], "bins": [-0.006061553955078125, -0.005865335464477539, -0.005669116973876953, -0.005472898483276367, -0.005276679992675781, -0.005080461502075195, -0.004884243011474609, -0.0046880245208740234, -0.0044918060302734375, -0.0042955875396728516, -0.004099369049072266, -0.0039031505584716797, -0.0037069320678710938, -0.003510713577270508, -0.003314495086669922, -0.003118276596069336, -0.00292205810546875, -0.002725839614868164, -0.002529621124267578, -0.002333402633666992, -0.0021371841430664062, -0.0019409656524658203, -0.0017447471618652344, -0.0015485286712646484, -0.0013523101806640625, -0.0011560916900634766, -0.0009598731994628906, -0.0007636547088623047, -0.0005674362182617188, -0.0003712177276611328, -0.00017499923706054688, 2.1219253540039062e-05, 0.000217437744140625, 0.00041365623474121094, 0.0006098747253417969, 0.0008060932159423828, 0.0010023117065429688, 0.0011985301971435547, 0.0013947486877441406, 0.0015909671783447266, 0.0017871856689453125, 0.0019834041595458984, 0.0021796226501464844, 0.0023758411407470703, 0.0025720596313476562, 0.002768278121948242, 0.002964496612548828, 0.003160715103149414, 0.00335693359375, 0.003553152084350586, 0.003749370574951172, 0.003945589065551758, 0.004141807556152344, 0.00433802604675293, 0.004534244537353516, 0.0047304630279541016, 0.0049266815185546875, 0.0051229000091552734, 0.005319118499755859, 0.005515336990356445, 0.005711555480957031, 0.005907773971557617, 0.006103992462158203, 0.006300210952758789, 0.006496429443359375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 2.0, 6.0, 0.0, 8.0, 17.0, 0.0, 18.0, 20.0, 32.0, 0.0, 28.0, 53.0, 0.0, 71.0, 84.0, 0.0, 107.0, 102.0, 0.0, 106.0, 94.0, 0.0, 71.0, 58.0, 42.0, 0.0, 25.0, 13.0, 0.0, 8.0, 12.0, 0.0, 7.0, 6.0, 0.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.0915100574493408e-06, -1.0505318641662598e-06, -1.0095536708831787e-06, -9.685754776000977e-07, -9.275972843170166e-07, -8.866190910339355e-07, -8.456408977508545e-07, -8.046627044677734e-07, -7.636845111846924e-07, -7.227063179016113e-07, -6.817281246185303e-07, -6.407499313354492e-07, -5.997717380523682e-07, -5.587935447692871e-07, -5.178153514862061e-07, -4.76837158203125e-07, -4.3585896492004395e-07, -3.948807716369629e-07, -3.5390257835388184e-07, -3.129243850708008e-07, -2.7194619178771973e-07, -2.3096799850463867e-07, -1.8998980522155762e-07, -1.4901161193847656e-07, -1.0803341865539551e-07, -6.705522537231445e-08, -2.60770320892334e-08, 1.4901161193847656e-08, 5.587935447692871e-08, 9.685754776000977e-08, 1.3783574104309082e-07, 1.7881393432617188e-07, 2.1979212760925293e-07, 2.60770320892334e-07, 3.0174851417541504e-07, 3.427267074584961e-07, 3.8370490074157715e-07, 4.246830940246582e-07, 4.6566128730773926e-07, 5.066394805908203e-07, 5.476176738739014e-07, 5.885958671569824e-07, 6.295740604400635e-07, 6.705522537231445e-07, 7.115304470062256e-07, 7.525086402893066e-07, 7.934868335723877e-07, 8.344650268554688e-07, 8.754432201385498e-07, 9.164214134216309e-07, 9.57399606704712e-07, 9.98377799987793e-07, 1.039355993270874e-06, 1.080334186553955e-06, 1.1213123798370361e-06, 1.1622905731201172e-06, 1.2032687664031982e-06, 1.2442469596862793e-06, 1.2852251529693604e-06, 1.3262033462524414e-06, 1.3671815395355225e-06, 1.4081597328186035e-06, 1.4491379261016846e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 13.0, 7.0, 18.0, 14.0, 35.0, 43.0, 49.0, 66.0, 96.0, 132.0, 203.0, 261.0, 391.0, 583.0, 885.0, 1322.0, 2296.0, 3679.0, 6525.0, 12645.0, 28151.0, 89381.0, 633147.0, 187936.0, 42851.0, 17004.0, 8453.0, 4680.0, 2722.0, 1670.0, 1028.0, 673.0, 453.0, 328.0, 215.0, 165.0, 109.0, 78.0, 65.0, 45.0, 31.0, 30.0, 14.0, 22.0, 8.0, 6.0, 7.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005931854248046875, -0.005738675594329834, -0.005545496940612793, -0.005352318286895752, -0.005159139633178711, -0.00496596097946167, -0.004772782325744629, -0.004579603672027588, -0.004386425018310547, -0.004193246364593506, -0.004000067710876465, -0.003806889057159424, -0.003613710403442383, -0.003420531749725342, -0.0032273530960083008, -0.0030341744422912598, -0.0028409957885742188, -0.0026478171348571777, -0.0024546384811401367, -0.0022614598274230957, -0.0020682811737060547, -0.0018751025199890137, -0.0016819238662719727, -0.0014887452125549316, -0.0012955665588378906, -0.0011023879051208496, -0.0009092092514038086, -0.0007160305976867676, -0.0005228519439697266, -0.00032967329025268555, -0.00013649463653564453, 5.6684017181396484e-05, 0.0002498626708984375, 0.0004430413246154785, 0.0006362199783325195, 0.0008293986320495605, 0.0010225772857666016, 0.0012157559394836426, 0.0014089345932006836, 0.0016021132469177246, 0.0017952919006347656, 0.0019884705543518066, 0.0021816492080688477, 0.0023748278617858887, 0.0025680065155029297, 0.0027611851692199707, 0.0029543638229370117, 0.0031475424766540527, 0.0033407211303710938, 0.0035338997840881348, 0.0037270784378051758, 0.003920257091522217, 0.004113435745239258, 0.004306614398956299, 0.00449979305267334, 0.004692971706390381, 0.004886150360107422, 0.005079329013824463, 0.005272507667541504, 0.005465686321258545, 0.005658864974975586, 0.005852043628692627, 0.006045222282409668, 0.006238400936126709, 0.00643157958984375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 8.0, 20.0, 22.0, 35.0, 40.0, 46.0, 89.0, 114.0, 137.0, 118.0, 84.0, 61.0, 49.0, 32.0, 32.0, 20.0, 13.0, 10.0, 12.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012331008911132812, -0.001196354627609253, -0.0011596083641052246, -0.0011228621006011963, -0.001086115837097168, -0.0010493695735931396, -0.0010126233100891113, -0.000975877046585083, -0.0009391307830810547, -0.0009023845195770264, -0.000865638256072998, -0.0008288919925689697, -0.0007921457290649414, -0.0007553994655609131, -0.0007186532020568848, -0.0006819069385528564, -0.0006451606750488281, -0.0006084144115447998, -0.0005716681480407715, -0.0005349218845367432, -0.0004981756210327148, -0.0004614293575286865, -0.0004246830940246582, -0.0003879368305206299, -0.00035119056701660156, -0.00031444430351257324, -0.0002776980400085449, -0.0002409517765045166, -0.00020420551300048828, -0.00016745924949645996, -0.00013071298599243164, -9.396672248840332e-05, -5.7220458984375e-05, -2.047419548034668e-05, 1.627206802368164e-05, 5.301833152770996e-05, 8.976459503173828e-05, 0.0001265108585357666, 0.00016325712203979492, 0.00020000338554382324, 0.00023674964904785156, 0.0002734959125518799, 0.0003102421760559082, 0.0003469884395599365, 0.00038373470306396484, 0.00042048096656799316, 0.0004572272300720215, 0.0004939734935760498, 0.0005307197570800781, 0.0005674660205841064, 0.0006042122840881348, 0.0006409585475921631, 0.0006777048110961914, 0.0007144510746002197, 0.000751197338104248, 0.0007879436016082764, 0.0008246898651123047, 0.000861436128616333, 0.0008981823921203613, 0.0009349286556243896, 0.000971674919128418, 0.0010084211826324463, 0.0010451674461364746, 0.001081913709640503, 0.0011186599731445312]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 2.0, 8.0, 1.0, 9.0, 4.0, 6.0, 17.0, 11.0, 15.0, 33.0, 34.0, 50.0, 49.0, 63.0, 95.0, 94.0, 104.0, 83.0, 74.0, 54.0, 40.0, 33.0, 20.0, 16.0, 21.0, 18.0, 12.0, 11.0, 9.0, 8.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08681350946426392, -0.08350302278995514, -0.08019253611564636, -0.07688204944133759, -0.07357156276702881, -0.07026107609272003, -0.06695059686899185, -0.06364011019468307, -0.0603296235203743, -0.05701913684606552, -0.053708650171756744, -0.050398167222738266, -0.04708768054842949, -0.04377719387412071, -0.040466710925102234, -0.03715622425079346, -0.03384573757648468, -0.030535250902175903, -0.027224766090512276, -0.023914281278848648, -0.02060379460453987, -0.017293307930231094, -0.013982823118567467, -0.010672338306903839, -0.007361851632595062, -0.00405136588960886, -0.0007408801466226578, 0.0025696055963635445, 0.005880091339349747, 0.009190578013658524, 0.012501062825322151, 0.01581154763698578, 0.019122034311294556, 0.022432520985603333, 0.02574300579726696, 0.029053490608930588, 0.032363977283239365, 0.03567446395754814, 0.03898494690656662, 0.0422954335808754, 0.045605920255184174, 0.04891640692949295, 0.05222689360380173, 0.055537376552820206, 0.05884786322712898, 0.06215834990143776, 0.06546883285045624, 0.06877931952476501, 0.07208980619907379, 0.07540029287338257, 0.07871077954769135, 0.08202126622200012, 0.0853317528963089, 0.08864223957061768, 0.09195271879434586, 0.09526320546865463, 0.09857369214296341, 0.10188417881727219, 0.10519466549158096, 0.10850515216588974, 0.11181563138961792, 0.1151261180639267, 0.11843660473823547, 0.12174709141254425, 0.12505757808685303]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 12.0, 7.0, 9.0, 11.0, 12.0, 14.0, 18.0, 25.0, 17.0, 18.0, 24.0, 24.0, 29.0, 31.0, 33.0, 47.0, 32.0, 33.0, 42.0, 40.0, 39.0, 49.0, 43.0, 36.0, 37.0, 28.0, 29.0, 29.0, 24.0, 33.0, 24.0, 24.0, 20.0, 18.0, 14.0, 13.0, 7.0, 14.0, 7.0, 7.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06849992275238037, -0.06642637401819229, -0.06435282528400421, -0.06227928027510643, -0.06020573526620865, -0.05813218653202057, -0.05605863779783249, -0.05398508906364441, -0.05191154405474663, -0.04983799532055855, -0.04776445031166077, -0.04569090157747269, -0.04361735284328461, -0.041543807834386826, -0.039470259100198746, -0.037396714091300964, -0.035323165357112885, -0.033249616622924805, -0.031176071614027023, -0.029102522879838943, -0.027028976008296013, -0.024955429136753082, -0.022881880402565002, -0.020808333531022072, -0.01873478665947914, -0.01666123978793621, -0.014587691985070705, -0.0125141441822052, -0.01044059731066227, -0.008367050439119339, -0.006293502636253834, -0.0042199548333883286, -0.002146415412425995, -7.286807522177696e-05, 0.002000679261982441, 0.004074226599186659, 0.006147773936390877, 0.008221320807933807, 0.010294868610799313, 0.012368416413664818, 0.014441963285207748, 0.01651551015675068, 0.01858905702829361, 0.02066260576248169, 0.02273615263402462, 0.02480969950556755, 0.02688324823975563, 0.02895679511129856, 0.03103034198284149, 0.03310389071702957, 0.03517743572592735, 0.03725098446011543, 0.039324529469013214, 0.041398078203201294, 0.043471626937389374, 0.045545175671577454, 0.047618720680475235, 0.049692269414663315, 0.051765814423561096, 0.053839363157749176, 0.055912911891937256, 0.05798645690083504, 0.06006000563502312, 0.0621335506439209, 0.06420709937810898]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 9.0, 6.0, 7.0, 5.0, 21.0, 33.0, 34.0, 44.0, 66.0, 92.0, 133.0, 189.0, 275.0, 436.0, 598.0, 951.0, 1293.0, 1920.0, 2921.0, 4374.0, 6598.0, 10280.0, 16019.0, 24744.0, 39420.0, 64177.0, 113357.0, 223026.0, 236072.0, 119458.0, 67547.0, 41192.0, 25546.0, 16408.0, 10508.0, 6882.0, 4517.0, 3045.0, 2023.0, 1331.0, 926.0, 654.0, 430.0, 300.0, 201.0, 156.0, 114.0, 78.0, 49.0, 28.0, 26.0, 16.0, 18.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.129638671875, -0.1257152557373047, -0.12179183959960938, -0.11786842346191406, -0.11394500732421875, -0.11002159118652344, -0.10609817504882812, -0.10217475891113281, -0.0982513427734375, -0.09432792663574219, -0.09040451049804688, -0.08648109436035156, -0.08255767822265625, -0.07863426208496094, -0.07471084594726562, -0.07078742980957031, -0.066864013671875, -0.06294059753417969, -0.059017181396484375, -0.05509376525878906, -0.05117034912109375, -0.04724693298339844, -0.043323516845703125, -0.03940010070800781, -0.0354766845703125, -0.03155326843261719, -0.027629852294921875, -0.023706436157226562, -0.01978302001953125, -0.015859603881835938, -0.011936187744140625, -0.008012771606445312, -0.00408935546875, -0.0001659393310546875, 0.003757476806640625, 0.0076808929443359375, 0.01160430908203125, 0.015527725219726562, 0.019451141357421875, 0.023374557495117188, 0.0272979736328125, 0.031221389770507812, 0.035144805908203125, 0.03906822204589844, 0.04299163818359375, 0.04691505432128906, 0.050838470458984375, 0.05476188659667969, 0.058685302734375, 0.06260871887207031, 0.06653213500976562, 0.07045555114746094, 0.07437896728515625, 0.07830238342285156, 0.08222579956054688, 0.08614921569824219, 0.0900726318359375, 0.09399604797363281, 0.09791946411132812, 0.10184288024902344, 0.10576629638671875, 0.10968971252441406, 0.11361312866210938, 0.11753654479980469, 0.1214599609375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 6.0, 6.0, 8.0, 8.0, 9.0, 14.0, 16.0, 19.0, 18.0, 16.0, 21.0, 27.0, 32.0, 25.0, 30.0, 37.0, 40.0, 40.0, 38.0, 39.0, 45.0, 39.0, 43.0, 42.0, 34.0, 33.0, 30.0, 30.0, 24.0, 31.0, 25.0, 19.0, 24.0, 22.0, 16.0, 18.0, 12.0, 10.0, 8.0, 5.0, 11.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06292724609375, -0.061052799224853516, -0.05917835235595703, -0.05730390548706055, -0.05542945861816406, -0.05355501174926758, -0.051680564880371094, -0.04980611801147461, -0.047931671142578125, -0.04605722427368164, -0.044182777404785156, -0.04230833053588867, -0.04043388366699219, -0.0385594367980957, -0.03668498992919922, -0.034810543060302734, -0.03293609619140625, -0.031061649322509766, -0.02918720245361328, -0.027312755584716797, -0.025438308715820312, -0.023563861846923828, -0.021689414978027344, -0.01981496810913086, -0.017940521240234375, -0.01606607437133789, -0.014191627502441406, -0.012317180633544922, -0.010442733764648438, -0.008568286895751953, -0.006693840026855469, -0.004819393157958984, -0.0029449462890625, -0.0010704994201660156, 0.0008039474487304688, 0.002678394317626953, 0.0045528411865234375, 0.006427288055419922, 0.008301734924316406, 0.01017618179321289, 0.012050628662109375, 0.01392507553100586, 0.015799522399902344, 0.017673969268798828, 0.019548416137695312, 0.021422863006591797, 0.02329730987548828, 0.025171756744384766, 0.02704620361328125, 0.028920650482177734, 0.03079509735107422, 0.0326695442199707, 0.03454399108886719, 0.03641843795776367, 0.038292884826660156, 0.04016733169555664, 0.042041778564453125, 0.04391622543334961, 0.045790672302246094, 0.04766511917114258, 0.04953956604003906, 0.05141401290893555, 0.05328845977783203, 0.055162906646728516, 0.057037353515625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 8.0, 9.0, 13.0, 20.0, 43.0, 42.0, 54.0, 86.0, 114.0, 179.0, 257.0, 390.0, 584.0, 805.0, 1172.0, 1713.0, 2523.0, 3546.0, 5270.0, 7820.0, 11853.0, 17781.0, 27658.0, 43965.0, 72938.0, 129126.0, 245594.0, 200765.0, 104615.0, 61041.0, 37493.0, 23653.0, 15647.0, 10124.0, 6854.0, 4647.0, 3189.0, 2161.0, 1458.0, 1043.0, 734.0, 469.0, 358.0, 241.0, 163.0, 113.0, 69.0, 49.0, 49.0, 25.0, 16.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.11895751953125, -0.1152200698852539, -0.11148262023925781, -0.10774517059326172, -0.10400772094726562, -0.10027027130126953, -0.09653282165527344, -0.09279537200927734, -0.08905792236328125, -0.08532047271728516, -0.08158302307128906, -0.07784557342529297, -0.07410812377929688, -0.07037067413330078, -0.06663322448730469, -0.0628957748413086, -0.0591583251953125, -0.055420875549316406, -0.05168342590332031, -0.04794597625732422, -0.044208526611328125, -0.04047107696533203, -0.03673362731933594, -0.032996177673339844, -0.02925872802734375, -0.025521278381347656, -0.021783828735351562, -0.01804637908935547, -0.014308929443359375, -0.010571479797363281, -0.0068340301513671875, -0.0030965805053710938, 0.000640869140625, 0.004378318786621094, 0.008115768432617188, 0.011853218078613281, 0.015590667724609375, 0.01932811737060547, 0.023065567016601562, 0.026803016662597656, 0.03054046630859375, 0.034277915954589844, 0.03801536560058594, 0.04175281524658203, 0.045490264892578125, 0.04922771453857422, 0.05296516418457031, 0.056702613830566406, 0.0604400634765625, 0.0641775131225586, 0.06791496276855469, 0.07165241241455078, 0.07538986206054688, 0.07912731170654297, 0.08286476135253906, 0.08660221099853516, 0.09033966064453125, 0.09407711029052734, 0.09781455993652344, 0.10155200958251953, 0.10528945922851562, 0.10902690887451172, 0.11276435852050781, 0.1165018081665039, 0.1202392578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 11.0, 4.0, 4.0, 3.0, 8.0, 9.0, 13.0, 14.0, 12.0, 10.0, 21.0, 25.0, 21.0, 23.0, 35.0, 38.0, 27.0, 32.0, 22.0, 32.0, 36.0, 36.0, 40.0, 30.0, 31.0, 36.0, 38.0, 42.0, 39.0, 31.0, 27.0, 28.0, 31.0, 31.0, 20.0, 17.0, 19.0, 9.0, 13.0, 19.0, 12.0, 8.0, 7.0, 9.0, 8.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0], "bins": [-0.038970947265625, -0.037804603576660156, -0.03663825988769531, -0.03547191619873047, -0.034305572509765625, -0.03313922882080078, -0.03197288513183594, -0.030806541442871094, -0.02964019775390625, -0.028473854064941406, -0.027307510375976562, -0.02614116668701172, -0.024974822998046875, -0.02380847930908203, -0.022642135620117188, -0.021475791931152344, -0.0203094482421875, -0.019143104553222656, -0.017976760864257812, -0.01681041717529297, -0.015644073486328125, -0.014477729797363281, -0.013311386108398438, -0.012145042419433594, -0.01097869873046875, -0.009812355041503906, -0.008646011352539062, -0.007479667663574219, -0.006313323974609375, -0.005146980285644531, -0.0039806365966796875, -0.0028142929077148438, -0.00164794921875, -0.00048160552978515625, 0.0006847381591796875, 0.0018510818481445312, 0.003017425537109375, 0.004183769226074219, 0.0053501129150390625, 0.006516456604003906, 0.00768280029296875, 0.008849143981933594, 0.010015487670898438, 0.011181831359863281, 0.012348175048828125, 0.013514518737792969, 0.014680862426757812, 0.015847206115722656, 0.0170135498046875, 0.018179893493652344, 0.019346237182617188, 0.02051258087158203, 0.021678924560546875, 0.02284526824951172, 0.024011611938476562, 0.025177955627441406, 0.02634429931640625, 0.027510643005371094, 0.028676986694335938, 0.02984333038330078, 0.031009674072265625, 0.03217601776123047, 0.03334236145019531, 0.034508705139160156, 0.035675048828125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 8.0, 12.0, 17.0, 26.0, 33.0, 44.0, 65.0, 81.0, 137.0, 210.0, 324.0, 532.0, 827.0, 1385.0, 2377.0, 4083.0, 7680.0, 16380.0, 37906.0, 133574.0, 721019.0, 69963.0, 26196.0, 11617.0, 5983.0, 3193.0, 1847.0, 1158.0, 638.0, 407.0, 267.0, 181.0, 130.0, 75.0, 50.0, 52.0, 23.0, 13.0, 7.0, 9.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.02789306640625, -0.02707958221435547, -0.026266098022460938, -0.025452613830566406, -0.024639129638671875, -0.023825645446777344, -0.023012161254882812, -0.02219867706298828, -0.02138519287109375, -0.02057170867919922, -0.019758224487304688, -0.018944740295410156, -0.018131256103515625, -0.017317771911621094, -0.016504287719726562, -0.01569080352783203, -0.0148773193359375, -0.014063835144042969, -0.013250350952148438, -0.012436866760253906, -0.011623382568359375, -0.010809898376464844, -0.009996414184570312, -0.009182929992675781, -0.00836944580078125, -0.007555961608886719, -0.0067424774169921875, -0.005928993225097656, -0.005115509033203125, -0.004302024841308594, -0.0034885406494140625, -0.0026750564575195312, -0.001861572265625, -0.0010480880737304688, -0.0002346038818359375, 0.0005788803100585938, 0.001392364501953125, 0.0022058486938476562, 0.0030193328857421875, 0.0038328170776367188, 0.00464630126953125, 0.005459785461425781, 0.0062732696533203125, 0.007086753845214844, 0.007900238037109375, 0.008713722229003906, 0.009527206420898438, 0.010340690612792969, 0.0111541748046875, 0.011967658996582031, 0.012781143188476562, 0.013594627380371094, 0.014408111572265625, 0.015221595764160156, 0.016035079956054688, 0.01684856414794922, 0.01766204833984375, 0.01847553253173828, 0.019289016723632812, 0.020102500915527344, 0.020915985107421875, 0.021729469299316406, 0.022542953491210938, 0.02335643768310547, 0.024169921875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 7.0, 0.0, 10.0, 16.0, 0.0, 52.0, 73.0, 0.0, 104.0, 151.0, 0.0, 152.0, 147.0, 0.0, 117.0, 70.0, 0.0, 44.0, 0.0, 19.0, 18.0, 0.0, 4.0, 5.0, 0.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.145587682723999e-07, -8.754432201385498e-07, -8.363276720046997e-07, -7.972121238708496e-07, -7.580965757369995e-07, -7.189810276031494e-07, -6.798654794692993e-07, -6.407499313354492e-07, -6.016343832015991e-07, -5.62518835067749e-07, -5.234032869338989e-07, -4.842877388000488e-07, -4.4517219066619873e-07, -4.0605664253234863e-07, -3.6694109439849854e-07, -3.2782554626464844e-07, -2.8870999813079834e-07, -2.4959444999694824e-07, -2.1047890186309814e-07, -1.7136335372924805e-07, -1.3224780559539795e-07, -9.313225746154785e-08, -5.4016709327697754e-08, -1.4901161193847656e-08, 2.421438694000244e-08, 6.332993507385254e-08, 1.0244548320770264e-07, 1.4156103134155273e-07, 1.8067657947540283e-07, 2.1979212760925293e-07, 2.5890767574310303e-07, 2.980232238769531e-07, 3.371387720108032e-07, 3.762543201446533e-07, 4.153698682785034e-07, 4.544854164123535e-07, 4.936009645462036e-07, 5.327165126800537e-07, 5.718320608139038e-07, 6.109476089477539e-07, 6.50063157081604e-07, 6.891787052154541e-07, 7.282942533493042e-07, 7.674098014831543e-07, 8.065253496170044e-07, 8.456408977508545e-07, 8.847564458847046e-07, 9.238719940185547e-07, 9.629875421524048e-07, 1.0021030902862549e-06, 1.041218638420105e-06, 1.080334186553955e-06, 1.1194497346878052e-06, 1.1585652828216553e-06, 1.1976808309555054e-06, 1.2367963790893555e-06, 1.2759119272232056e-06, 1.3150274753570557e-06, 1.3541430234909058e-06, 1.3932585716247559e-06, 1.432374119758606e-06, 1.471489667892456e-06, 1.5106052160263062e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 17.0, 17.0, 24.0, 46.0, 61.0, 89.0, 116.0, 172.0, 272.0, 374.0, 609.0, 923.0, 1428.0, 2205.0, 3608.0, 6051.0, 11145.0, 22729.0, 56162.0, 650821.0, 203439.0, 45142.0, 19079.0, 9647.0, 5356.0, 3229.0, 1974.0, 1211.0, 864.0, 570.0, 355.0, 242.0, 171.0, 119.0, 75.0, 67.0, 39.0, 30.0, 14.0, 14.0, 9.0, 9.0, 4.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.030120849609375, -0.029257535934448242, -0.028394222259521484, -0.027530908584594727, -0.02666759490966797, -0.02580428123474121, -0.024940967559814453, -0.024077653884887695, -0.023214340209960938, -0.02235102653503418, -0.021487712860107422, -0.020624399185180664, -0.019761085510253906, -0.01889777183532715, -0.01803445816040039, -0.017171144485473633, -0.016307830810546875, -0.015444517135620117, -0.01458120346069336, -0.013717889785766602, -0.012854576110839844, -0.011991262435913086, -0.011127948760986328, -0.01026463508605957, -0.009401321411132812, -0.008538007736206055, -0.007674694061279297, -0.006811380386352539, -0.005948066711425781, -0.0050847530364990234, -0.004221439361572266, -0.003358125686645508, -0.00249481201171875, -0.0016314983367919922, -0.0007681846618652344, 9.512901306152344e-05, 0.0009584426879882812, 0.001821756362915039, 0.002685070037841797, 0.0035483837127685547, 0.0044116973876953125, 0.00527501106262207, 0.006138324737548828, 0.007001638412475586, 0.007864952087402344, 0.008728265762329102, 0.00959157943725586, 0.010454893112182617, 0.011318206787109375, 0.012181520462036133, 0.01304483413696289, 0.013908147811889648, 0.014771461486816406, 0.015634775161743164, 0.016498088836669922, 0.01736140251159668, 0.018224716186523438, 0.019088029861450195, 0.019951343536376953, 0.02081465721130371, 0.02167797088623047, 0.022541284561157227, 0.023404598236083984, 0.024267911911010742, 0.0251312255859375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 6.0, 7.0, 16.0, 20.0, 22.0, 28.0, 23.0, 33.0, 61.0, 222.0, 292.0, 56.0, 40.0, 39.0, 25.0, 20.0, 14.0, 12.0, 8.0, 3.0, 10.0, 3.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.008697509765625, -0.00845634937286377, -0.008215188980102539, -0.007974028587341309, -0.007732868194580078, -0.007491707801818848, -0.007250547409057617, -0.007009387016296387, -0.006768226623535156, -0.006527066230773926, -0.006285905838012695, -0.006044745445251465, -0.005803585052490234, -0.005562424659729004, -0.0053212642669677734, -0.005080103874206543, -0.0048389434814453125, -0.004597783088684082, -0.0043566226959228516, -0.004115462303161621, -0.0038743019104003906, -0.00363314151763916, -0.0033919811248779297, -0.0031508207321166992, -0.0029096603393554688, -0.0026684999465942383, -0.002427339553833008, -0.0021861791610717773, -0.0019450187683105469, -0.0017038583755493164, -0.001462697982788086, -0.0012215375900268555, -0.000980377197265625, -0.0007392168045043945, -0.0004980564117431641, -0.0002568960189819336, -1.5735626220703125e-05, 0.00022542476654052734, 0.0004665851593017578, 0.0007077455520629883, 0.0009489059448242188, 0.0011900663375854492, 0.0014312267303466797, 0.0016723871231079102, 0.0019135475158691406, 0.002154707908630371, 0.0023958683013916016, 0.002637028694152832, 0.0028781890869140625, 0.003119349479675293, 0.0033605098724365234, 0.003601670265197754, 0.0038428306579589844, 0.004083991050720215, 0.004325151443481445, 0.004566311836242676, 0.004807472229003906, 0.005048632621765137, 0.005289793014526367, 0.005530953407287598, 0.005772113800048828, 0.006013274192810059, 0.006254434585571289, 0.0064955949783325195, 0.00673675537109375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 15.0, 14.0, 12.0, 22.0, 25.0, 46.0, 48.0, 55.0, 59.0, 94.0, 117.0, 103.0, 76.0, 56.0, 33.0, 30.0, 37.0, 29.0, 28.0, 17.0, 14.0, 11.0, 5.0, 8.0, 6.0, 8.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09528848528862, -0.09230369329452515, -0.0893189013004303, -0.08633410930633545, -0.0833493247628212, -0.08036453276872635, -0.0773797407746315, -0.07439494878053665, -0.0714101567864418, -0.06842536479234695, -0.0654405727982521, -0.062455784529447556, -0.05947099253535271, -0.05648620426654816, -0.05350141227245331, -0.05051662027835846, -0.04753183200955391, -0.04454704001545906, -0.04156225174665451, -0.03857745975255966, -0.03559266775846481, -0.032607875764369965, -0.029623087495565414, -0.026638295501470566, -0.023653505370020866, -0.020668715238571167, -0.01768392324447632, -0.014699133113026619, -0.011714342050254345, -0.008729550987482071, -0.0057447608560323715, -0.002759968861937523, 0.00022482126951217651, 0.003209612099453807, 0.006194402929395437, 0.009179193526506424, 0.012163984589278698, 0.015148775652050972, 0.01813356578350067, 0.02111835777759552, 0.02410314790904522, 0.02708793804049492, 0.030072730034589767, 0.03305751830339432, 0.036042310297489166, 0.039027102291584015, 0.042011894285678864, 0.04499668627977371, 0.04798147454857826, 0.05096626654267311, 0.05395105481147766, 0.05693584680557251, 0.05992063879966736, 0.06290543079376221, 0.06589022278785706, 0.0688750147819519, 0.07185979932546616, 0.074844591319561, 0.07782938331365585, 0.0808141678571701, 0.08379895985126495, 0.0867837518453598, 0.08976854383945465, 0.0927533358335495, 0.09573812782764435]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 5.0, 7.0, 9.0, 11.0, 19.0, 13.0, 11.0, 17.0, 12.0, 17.0, 26.0, 30.0, 33.0, 32.0, 35.0, 35.0, 27.0, 38.0, 42.0, 50.0, 29.0, 34.0, 40.0, 36.0, 27.0, 29.0, 33.0, 26.0, 28.0, 32.0, 24.0, 24.0, 22.0, 19.0, 17.0, 16.0, 14.0, 17.0, 15.0, 7.0, 11.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.06650801748037338, -0.06459624320268631, -0.06268447637557983, -0.06077270209789276, -0.05886092782020569, -0.056949157267808914, -0.05503738671541214, -0.05312561243772507, -0.05121384188532829, -0.04930207133293152, -0.047390297055244446, -0.04547852650284767, -0.0435667559504509, -0.041654981672763824, -0.03974321112036705, -0.037831440567970276, -0.0359196662902832, -0.03400789573788643, -0.032096121460199356, -0.030184350907802582, -0.028272578492760658, -0.026360806077718735, -0.02444903552532196, -0.022537263110280037, -0.020625490695238113, -0.01871371828019619, -0.016801945865154266, -0.014890175312757492, -0.012978402897715569, -0.011066630482673645, -0.009154858998954296, -0.007243087515234947, -0.005331315100193024, -0.0034195431508123875, -0.0015077712014317513, 0.00040400074794888496, 0.002315772697329521, 0.004227545112371445, 0.006139316596090794, 0.008051088079810143, 0.009962860494852066, 0.01187463290989399, 0.013786404393613338, 0.015698175877332687, 0.01760994829237461, 0.019521720707416534, 0.02143349125981331, 0.023345263674855232, 0.025257036089897156, 0.02716880850493908, 0.029080580919981003, 0.030992351472377777, 0.03290412575006485, 0.034815896302461624, 0.0367276668548584, 0.03863944113254547, 0.040551211684942245, 0.04246298223733902, 0.04437475651502609, 0.04628652706742287, 0.04819829761981964, 0.050110071897506714, 0.05202184244990349, 0.05393361300230026, 0.055845387279987335]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 13.0, 12.0, 24.0, 22.0, 39.0, 81.0, 91.0, 142.0, 228.0, 347.0, 538.0, 827.0, 1320.0, 2127.0, 3596.0, 5813.0, 10130.0, 17307.0, 31589.0, 58312.0, 114909.0, 259830.0, 999895.0, 1850954.0, 478393.0, 173042.0, 83171.0, 43511.0, 23821.0, 13602.0, 7947.0, 4770.0, 2891.0, 1790.0, 1138.0, 690.0, 465.0, 287.0, 200.0, 130.0, 104.0, 61.0, 41.0, 27.0, 15.0, 20.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09335041046142578, -0.09026527404785156, -0.08718013763427734, -0.08409500122070312, -0.0810098648071289, -0.07792472839355469, -0.07483959197998047, -0.07175445556640625, -0.06866931915283203, -0.06558418273925781, -0.062499046325683594, -0.059413909912109375, -0.056328773498535156, -0.05324363708496094, -0.05015850067138672, -0.0470733642578125, -0.04398822784423828, -0.04090309143066406, -0.037817955017089844, -0.034732818603515625, -0.031647682189941406, -0.028562545776367188, -0.02547740936279297, -0.02239227294921875, -0.01930713653564453, -0.016222000122070312, -0.013136863708496094, -0.010051727294921875, -0.006966590881347656, -0.0038814544677734375, -0.0007963180541992188, 0.002288818359375, 0.005373954772949219, 0.008459091186523438, 0.011544227600097656, 0.014629364013671875, 0.017714500427246094, 0.020799636840820312, 0.02388477325439453, 0.02696990966796875, 0.03005504608154297, 0.03314018249511719, 0.036225318908691406, 0.039310455322265625, 0.042395591735839844, 0.04548072814941406, 0.04856586456298828, 0.0516510009765625, 0.05473613739013672, 0.05782127380371094, 0.060906410217285156, 0.06399154663085938, 0.0670766830444336, 0.07016181945800781, 0.07324695587158203, 0.07633209228515625, 0.07941722869873047, 0.08250236511230469, 0.0855875015258789, 0.08867263793945312, 0.09175777435302734, 0.09484291076660156, 0.09792804718017578, 0.10101318359375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 5.0, 4.0, 4.0, 4.0, 6.0, 6.0, 13.0, 12.0, 14.0, 18.0, 9.0, 16.0, 24.0, 23.0, 25.0, 36.0, 37.0, 35.0, 33.0, 41.0, 48.0, 48.0, 38.0, 38.0, 37.0, 41.0, 38.0, 25.0, 32.0, 39.0, 32.0, 19.0, 35.0, 19.0, 25.0, 16.0, 9.0, 20.0, 18.0, 12.0, 8.0, 15.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.041595458984375, -0.040410518646240234, -0.03922557830810547, -0.0380406379699707, -0.03685569763183594, -0.03567075729370117, -0.034485816955566406, -0.03330087661743164, -0.032115936279296875, -0.03093099594116211, -0.029746055603027344, -0.028561115264892578, -0.027376174926757812, -0.026191234588623047, -0.02500629425048828, -0.023821353912353516, -0.02263641357421875, -0.021451473236083984, -0.02026653289794922, -0.019081592559814453, -0.017896652221679688, -0.016711711883544922, -0.015526771545410156, -0.01434183120727539, -0.013156890869140625, -0.01197195053100586, -0.010787010192871094, -0.009602069854736328, -0.008417129516601562, -0.007232189178466797, -0.006047248840332031, -0.004862308502197266, -0.0036773681640625, -0.0024924278259277344, -0.0013074874877929688, -0.00012254714965820312, 0.0010623931884765625, 0.002247333526611328, 0.0034322738647460938, 0.004617214202880859, 0.005802154541015625, 0.006987094879150391, 0.008172035217285156, 0.009356975555419922, 0.010541915893554688, 0.011726856231689453, 0.012911796569824219, 0.014096736907958984, 0.01528167724609375, 0.016466617584228516, 0.01765155792236328, 0.018836498260498047, 0.020021438598632812, 0.021206378936767578, 0.022391319274902344, 0.02357625961303711, 0.024761199951171875, 0.02594614028930664, 0.027131080627441406, 0.028316020965576172, 0.029500961303710938, 0.030685901641845703, 0.03187084197998047, 0.033055782318115234, 0.03424072265625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 8.0, 9.0, 10.0, 21.0, 27.0, 45.0, 51.0, 75.0, 148.0, 185.0, 303.0, 455.0, 651.0, 1137.0, 1690.0, 2718.0, 4402.0, 7250.0, 11956.0, 20206.0, 34697.0, 60614.0, 111176.0, 213160.0, 466096.0, 1268363.0, 1128009.0, 423028.0, 197334.0, 102687.0, 56762.0, 32553.0, 18862.0, 11274.0, 6808.0, 4320.0, 2563.0, 1673.0, 1039.0, 684.0, 408.0, 261.0, 207.0, 127.0, 83.0, 55.0, 34.0, 20.0, 12.0, 18.0, 8.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.065185546875, -0.0630788803100586, -0.06097221374511719, -0.05886554718017578, -0.056758880615234375, -0.05465221405029297, -0.05254554748535156, -0.050438880920410156, -0.04833221435546875, -0.046225547790527344, -0.04411888122558594, -0.04201221466064453, -0.039905548095703125, -0.03779888153076172, -0.03569221496582031, -0.033585548400878906, -0.0314788818359375, -0.029372215270996094, -0.027265548706054688, -0.02515888214111328, -0.023052215576171875, -0.02094554901123047, -0.018838882446289062, -0.016732215881347656, -0.01462554931640625, -0.012518882751464844, -0.010412216186523438, -0.008305549621582031, -0.006198883056640625, -0.004092216491699219, -0.0019855499267578125, 0.00012111663818359375, 0.002227783203125, 0.004334449768066406, 0.0064411163330078125, 0.008547782897949219, 0.010654449462890625, 0.012761116027832031, 0.014867782592773438, 0.016974449157714844, 0.01908111572265625, 0.021187782287597656, 0.023294448852539062, 0.02540111541748047, 0.027507781982421875, 0.02961444854736328, 0.03172111511230469, 0.033827781677246094, 0.0359344482421875, 0.038041114807128906, 0.04014778137207031, 0.04225444793701172, 0.044361114501953125, 0.04646778106689453, 0.04857444763183594, 0.050681114196777344, 0.05278778076171875, 0.054894447326660156, 0.05700111389160156, 0.05910778045654297, 0.061214447021484375, 0.06332111358642578, 0.06542778015136719, 0.0675344467163086, 0.06964111328125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 10.0, 6.0, 18.0, 12.0, 15.0, 18.0, 35.0, 34.0, 44.0, 46.0, 71.0, 81.0, 96.0, 99.0, 130.0, 151.0, 171.0, 214.0, 259.0, 271.0, 290.0, 295.0, 255.0, 219.0, 198.0, 165.0, 163.0, 117.0, 103.0, 92.0, 70.0, 70.0, 53.0, 47.0, 41.0, 18.0, 15.0, 15.0, 17.0, 13.0, 10.0, 10.0, 3.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.0222015380859375, -0.02156543731689453, -0.020929336547851562, -0.020293235778808594, -0.019657135009765625, -0.019021034240722656, -0.018384933471679688, -0.01774883270263672, -0.01711273193359375, -0.01647663116455078, -0.015840530395507812, -0.015204429626464844, -0.014568328857421875, -0.013932228088378906, -0.013296127319335938, -0.012660026550292969, -0.01202392578125, -0.011387825012207031, -0.010751724243164062, -0.010115623474121094, -0.009479522705078125, -0.008843421936035156, -0.008207321166992188, -0.007571220397949219, -0.00693511962890625, -0.006299018859863281, -0.0056629180908203125, -0.005026817321777344, -0.004390716552734375, -0.0037546157836914062, -0.0031185150146484375, -0.0024824142456054688, -0.0018463134765625, -0.0012102127075195312, -0.0005741119384765625, 6.198883056640625e-05, 0.000698089599609375, 0.0013341903686523438, 0.0019702911376953125, 0.0026063919067382812, 0.00324249267578125, 0.0038785934448242188, 0.0045146942138671875, 0.005150794982910156, 0.005786895751953125, 0.006422996520996094, 0.0070590972900390625, 0.007695198059082031, 0.008331298828125, 0.008967399597167969, 0.009603500366210938, 0.010239601135253906, 0.010875701904296875, 0.011511802673339844, 0.012147903442382812, 0.012784004211425781, 0.01342010498046875, 0.014056205749511719, 0.014692306518554688, 0.015328407287597656, 0.015964508056640625, 0.016600608825683594, 0.017236709594726562, 0.01787281036376953, 0.0185089111328125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 1.0, 2.0, 11.0, 13.0, 8.0, 20.0, 16.0, 29.0, 43.0, 42.0, 63.0, 59.0, 81.0, 89.0, 94.0, 95.0, 69.0, 35.0, 52.0, 32.0, 29.0, 25.0, 17.0, 17.0, 11.0, 14.0, 7.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07154228538274765, -0.06946065276861191, -0.06737902760505676, -0.06529739499092102, -0.06321576237678528, -0.061134129762649536, -0.05905250087380409, -0.05697087198495865, -0.054889239370822906, -0.052807606756687164, -0.05072597786784172, -0.04864434897899628, -0.046562716364860535, -0.04448108375072479, -0.04239945486187935, -0.040317825973033905, -0.03823619335889816, -0.03615456074476242, -0.03407293185591698, -0.03199130296707153, -0.02990967035293579, -0.027828039601445198, -0.025746408849954605, -0.023664778098464012, -0.02158314734697342, -0.019501516595482826, -0.017419885843992233, -0.01533825509250164, -0.013256624341011047, -0.011174993589520454, -0.009093362838029861, -0.0070117320865392685, -0.0049301087856292725, -0.0028484780341386795, -0.0007668472826480865, 0.0013147834688425064, 0.0033964142203330994, 0.005478044971823692, 0.007559675723314285, 0.009641306474804878, 0.011722937226295471, 0.013804567977786064, 0.015886198729276657, 0.01796782948076725, 0.020049460232257843, 0.022131090983748436, 0.02421272173523903, 0.026294352486729622, 0.028375983238220215, 0.030457613989710808, 0.0325392447412014, 0.034620873630046844, 0.03670250624418259, 0.03878413885831833, 0.04086576774716377, 0.042947396636009216, 0.04502902925014496, 0.0471106618642807, 0.049192290753126144, 0.05127391964197159, 0.05335555225610733, 0.05543718487024307, 0.057518813759088516, 0.05960044264793396, 0.0616820752620697]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 5.0, 7.0, 5.0, 13.0, 8.0, 11.0, 11.0, 19.0, 18.0, 17.0, 26.0, 27.0, 18.0, 33.0, 25.0, 30.0, 37.0, 34.0, 50.0, 38.0, 47.0, 34.0, 41.0, 39.0, 26.0, 29.0, 37.0, 32.0, 32.0, 42.0, 28.0, 24.0, 20.0, 21.0, 21.0, 15.0, 15.0, 10.0, 11.0, 9.0, 7.0, 3.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.04233264550566673, -0.0410650372505188, -0.039797425270080566, -0.03852981701493263, -0.0372622087597847, -0.035994600504636765, -0.03472699224948883, -0.0334593802690506, -0.032191772013902664, -0.03092416375875473, -0.029656553640961647, -0.028388943523168564, -0.02712133526802063, -0.025853727012872696, -0.024586116895079613, -0.02331850677728653, -0.022050898522138596, -0.02078329026699066, -0.01951568014919758, -0.018248070031404495, -0.01698046177625656, -0.015712853521108627, -0.014445243403315544, -0.013177634216845036, -0.011910025030374527, -0.010642415843904018, -0.00937480665743351, -0.008107197470963001, -0.006839588284492493, -0.005571979098021984, -0.0043043699115514755, -0.003036760725080967, -0.0017691552639007568, -0.0005015460774302483, 0.0007660631090402603, 0.002033672295510769, 0.0033012814819812775, 0.004568890668451786, 0.005836499854922295, 0.007104109041392803, 0.008371718227863312, 0.00963932741433382, 0.010906936600804329, 0.012174545787274837, 0.013442154973745346, 0.014709764160215855, 0.015977373346686363, 0.017244983464479446, 0.01851259171962738, 0.019780199974775314, 0.021047810092568398, 0.02231542021036148, 0.023583028465509415, 0.02485063672065735, 0.026118246838450432, 0.027385856956243515, 0.02865346521139145, 0.029921073466539383, 0.031188683584332466, 0.03245629370212555, 0.03372390195727348, 0.03499151021242142, 0.03625912219285965, 0.037526730448007584, 0.03879433870315552]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 13.0, 28.0, 34.0, 51.0, 59.0, 89.0, 143.0, 197.0, 307.0, 523.0, 715.0, 1035.0, 1559.0, 2339.0, 3674.0, 5668.0, 8794.0, 13960.0, 23253.0, 38274.0, 67583.0, 123758.0, 242821.0, 232941.0, 118305.0, 64902.0, 37215.0, 22080.0, 13491.0, 8505.0, 5592.0, 3631.0, 2371.0, 1519.0, 951.0, 698.0, 471.0, 326.0, 199.0, 149.0, 96.0, 72.0, 42.0, 31.0, 24.0, 20.0, 7.0, 11.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.021881103515625, -0.02121734619140625, -0.0205535888671875, -0.01988983154296875, -0.01922607421875, -0.01856231689453125, -0.0178985595703125, -0.01723480224609375, -0.016571044921875, -0.01590728759765625, -0.0152435302734375, -0.01457977294921875, -0.013916015625, -0.01325225830078125, -0.0125885009765625, -0.01192474365234375, -0.011260986328125, -0.01059722900390625, -0.0099334716796875, -0.00926971435546875, -0.00860595703125, -0.00794219970703125, -0.0072784423828125, -0.00661468505859375, -0.005950927734375, -0.00528717041015625, -0.0046234130859375, -0.00395965576171875, -0.0032958984375, -0.00263214111328125, -0.0019683837890625, -0.00130462646484375, -0.000640869140625, 2.288818359375e-05, 0.0006866455078125, 0.00135040283203125, 0.00201416015625, 0.00267791748046875, 0.0033416748046875, 0.00400543212890625, 0.004669189453125, 0.00533294677734375, 0.0059967041015625, 0.00666046142578125, 0.00732421875, 0.00798797607421875, 0.0086517333984375, 0.00931549072265625, 0.009979248046875, 0.01064300537109375, 0.0113067626953125, 0.01197052001953125, 0.01263427734375, 0.01329803466796875, 0.0139617919921875, 0.01462554931640625, 0.015289306640625, 0.01595306396484375, 0.0166168212890625, 0.01728057861328125, 0.0179443359375, 0.01860809326171875, 0.0192718505859375, 0.01993560791015625, 0.020599365234375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 7.0, 4.0, 13.0, 6.0, 6.0, 15.0, 12.0, 9.0, 7.0, 21.0, 24.0, 19.0, 21.0, 23.0, 29.0, 23.0, 37.0, 37.0, 44.0, 35.0, 49.0, 32.0, 32.0, 39.0, 35.0, 35.0, 28.0, 38.0, 30.0, 33.0, 30.0, 33.0, 18.0, 29.0, 18.0, 14.0, 14.0, 23.0, 11.0, 11.0, 7.0, 9.0, 11.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.038909912109375, -0.037686824798583984, -0.03646373748779297, -0.03524065017700195, -0.03401756286621094, -0.03279447555541992, -0.031571388244628906, -0.03034830093383789, -0.029125213623046875, -0.02790212631225586, -0.026679039001464844, -0.025455951690673828, -0.024232864379882812, -0.023009777069091797, -0.02178668975830078, -0.020563602447509766, -0.01934051513671875, -0.018117427825927734, -0.01689434051513672, -0.015671253204345703, -0.014448165893554688, -0.013225078582763672, -0.012001991271972656, -0.01077890396118164, -0.009555816650390625, -0.00833272933959961, -0.007109642028808594, -0.005886554718017578, -0.0046634674072265625, -0.003440380096435547, -0.0022172927856445312, -0.0009942054748535156, 0.0002288818359375, 0.0014519691467285156, 0.0026750564575195312, 0.003898143768310547, 0.0051212310791015625, 0.006344318389892578, 0.007567405700683594, 0.00879049301147461, 0.010013580322265625, 0.01123666763305664, 0.012459754943847656, 0.013682842254638672, 0.014905929565429688, 0.016129016876220703, 0.01735210418701172, 0.018575191497802734, 0.01979827880859375, 0.021021366119384766, 0.02224445343017578, 0.023467540740966797, 0.024690628051757812, 0.025913715362548828, 0.027136802673339844, 0.02835988998413086, 0.029582977294921875, 0.03080606460571289, 0.032029151916503906, 0.03325223922729492, 0.03447532653808594, 0.03569841384887695, 0.03692150115966797, 0.038144588470458984, 0.03936767578125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 17.0, 16.0, 25.0, 29.0, 36.0, 75.0, 78.0, 154.0, 220.0, 267.0, 426.0, 629.0, 928.0, 1283.0, 2136.0, 3136.0, 4942.0, 8472.0, 16409.0, 39253.0, 129816.0, 563202.0, 182577.0, 49483.0, 19412.0, 9710.0, 5493.0, 3336.0, 2333.0, 1411.0, 1016.0, 733.0, 498.0, 303.0, 230.0, 156.0, 99.0, 68.0, 50.0, 31.0, 16.0, 14.0, 19.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.039642333984375, -0.03834724426269531, -0.037052154541015625, -0.03575706481933594, -0.03446197509765625, -0.03316688537597656, -0.031871795654296875, -0.030576705932617188, -0.0292816162109375, -0.027986526489257812, -0.026691436767578125, -0.025396347045898438, -0.02410125732421875, -0.022806167602539062, -0.021511077880859375, -0.020215988159179688, -0.0189208984375, -0.017625808715820312, -0.016330718994140625, -0.015035629272460938, -0.01374053955078125, -0.012445449829101562, -0.011150360107421875, -0.009855270385742188, -0.0085601806640625, -0.0072650909423828125, -0.005970001220703125, -0.0046749114990234375, -0.00337982177734375, -0.0020847320556640625, -0.000789642333984375, 0.0005054473876953125, 0.001800537109375, 0.0030956268310546875, 0.004390716552734375, 0.0056858062744140625, 0.00698089599609375, 0.008275985717773438, 0.009571075439453125, 0.010866165161132812, 0.0121612548828125, 0.013456344604492188, 0.014751434326171875, 0.016046524047851562, 0.01734161376953125, 0.018636703491210938, 0.019931793212890625, 0.021226882934570312, 0.02252197265625, 0.023817062377929688, 0.025112152099609375, 0.026407241821289062, 0.02770233154296875, 0.028997421264648438, 0.030292510986328125, 0.03158760070800781, 0.0328826904296875, 0.03417778015136719, 0.035472869873046875, 0.03676795959472656, 0.03806304931640625, 0.03935813903808594, 0.040653228759765625, 0.04194831848144531, 0.043243408203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 1.0, 5.0, 5.0, 15.0, 5.0, 6.0, 12.0, 13.0, 16.0, 16.0, 23.0, 22.0, 36.0, 37.0, 39.0, 29.0, 37.0, 42.0, 36.0, 47.0, 39.0, 45.0, 47.0, 45.0, 28.0, 36.0, 32.0, 41.0, 27.0, 30.0, 23.0, 24.0, 24.0, 17.0, 18.0, 15.0, 13.0, 12.0, 3.0, 10.0, 8.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0283660888671875, -0.027469635009765625, -0.02657318115234375, -0.025676727294921875, -0.0247802734375, -0.023883819580078125, -0.02298736572265625, -0.022090911865234375, -0.0211944580078125, -0.020298004150390625, -0.01940155029296875, -0.018505096435546875, -0.017608642578125, -0.016712188720703125, -0.01581573486328125, -0.014919281005859375, -0.0140228271484375, -0.013126373291015625, -0.01222991943359375, -0.011333465576171875, -0.01043701171875, -0.009540557861328125, -0.00864410400390625, -0.007747650146484375, -0.0068511962890625, -0.005954742431640625, -0.00505828857421875, -0.004161834716796875, -0.003265380859375, -0.002368927001953125, -0.00147247314453125, -0.000576019287109375, 0.0003204345703125, 0.001216888427734375, 0.00211334228515625, 0.003009796142578125, 0.00390625, 0.004802703857421875, 0.00569915771484375, 0.006595611572265625, 0.0074920654296875, 0.008388519287109375, 0.00928497314453125, 0.010181427001953125, 0.011077880859375, 0.011974334716796875, 0.01287078857421875, 0.013767242431640625, 0.0146636962890625, 0.015560150146484375, 0.01645660400390625, 0.017353057861328125, 0.01824951171875, 0.019145965576171875, 0.02004241943359375, 0.020938873291015625, 0.0218353271484375, 0.022731781005859375, 0.02362823486328125, 0.024524688720703125, 0.025421142578125, 0.026317596435546875, 0.02721405029296875, 0.028110504150390625, 0.0290069580078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 10.0, 8.0, 12.0, 18.0, 18.0, 17.0, 36.0, 30.0, 58.0, 70.0, 110.0, 170.0, 199.0, 310.0, 411.0, 636.0, 1080.0, 1651.0, 2899.0, 5874.0, 14271.0, 52213.0, 785359.0, 141684.0, 23305.0, 8377.0, 3803.0, 2150.0, 1248.0, 770.0, 515.0, 344.0, 231.0, 193.0, 144.0, 86.0, 84.0, 40.0, 31.0, 31.0, 26.0, 12.0, 7.0, 7.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.005084991455078125, -0.004919469356536865, -0.0047539472579956055, -0.004588425159454346, -0.004422903060913086, -0.004257380962371826, -0.004091858863830566, -0.003926336765289307, -0.003760814666748047, -0.003595292568206787, -0.0034297704696655273, -0.0032642483711242676, -0.003098726272583008, -0.002933204174041748, -0.0027676820755004883, -0.0026021599769592285, -0.0024366378784179688, -0.002271115779876709, -0.0021055936813354492, -0.0019400715827941895, -0.0017745494842529297, -0.00160902738571167, -0.0014435052871704102, -0.0012779831886291504, -0.0011124610900878906, -0.0009469389915466309, -0.0007814168930053711, -0.0006158947944641113, -0.00045037269592285156, -0.0002848505973815918, -0.00011932849884033203, 4.6193599700927734e-05, 0.0002117156982421875, 0.00037723779678344727, 0.000542759895324707, 0.0007082819938659668, 0.0008738040924072266, 0.0010393261909484863, 0.001204848289489746, 0.0013703703880310059, 0.0015358924865722656, 0.0017014145851135254, 0.0018669366836547852, 0.002032458782196045, 0.0021979808807373047, 0.0023635029792785645, 0.0025290250778198242, 0.002694547176361084, 0.0028600692749023438, 0.0030255913734436035, 0.0031911134719848633, 0.003356635570526123, 0.003522157669067383, 0.0036876797676086426, 0.0038532018661499023, 0.004018723964691162, 0.004184246063232422, 0.004349768161773682, 0.004515290260314941, 0.004680812358856201, 0.004846334457397461, 0.005011856555938721, 0.0051773786544799805, 0.00534290075302124, 0.0055084228515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 9.0, 0.0, 11.0, 0.0, 0.0, 13.0, 0.0, 21.0, 0.0, 0.0, 36.0, 0.0, 66.0, 0.0, 0.0, 89.0, 0.0, 101.0, 0.0, 0.0, 124.0, 0.0, 123.0, 0.0, 118.0, 0.0, 0.0, 80.0, 0.0, 69.0, 0.0, 0.0, 55.0, 0.0, 40.0, 0.0, 0.0, 29.0, 0.0, 15.0, 0.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.102506399154663e-07, -7.860362529754639e-07, -7.618218660354614e-07, -7.37607479095459e-07, -7.133930921554565e-07, -6.891787052154541e-07, -6.649643182754517e-07, -6.407499313354492e-07, -6.165355443954468e-07, -5.923211574554443e-07, -5.681067705154419e-07, -5.438923835754395e-07, -5.19677996635437e-07, -4.954636096954346e-07, -4.7124922275543213e-07, -4.470348358154297e-07, -4.2282044887542725e-07, -3.986060619354248e-07, -3.7439167499542236e-07, -3.501772880554199e-07, -3.259629011154175e-07, -3.0174851417541504e-07, -2.775341272354126e-07, -2.5331974029541016e-07, -2.2910535335540771e-07, -2.0489096641540527e-07, -1.8067657947540283e-07, -1.564621925354004e-07, -1.3224780559539795e-07, -1.0803341865539551e-07, -8.381903171539307e-08, -5.960464477539063e-08, -3.5390257835388184e-08, -1.1175870895385742e-08, 1.30385160446167e-08, 3.725290298461914e-08, 6.146728992462158e-08, 8.568167686462402e-08, 1.0989606380462646e-07, 1.341104507446289e-07, 1.5832483768463135e-07, 1.825392246246338e-07, 2.0675361156463623e-07, 2.3096799850463867e-07, 2.551823854446411e-07, 2.7939677238464355e-07, 3.03611159324646e-07, 3.2782554626464844e-07, 3.520399332046509e-07, 3.762543201446533e-07, 4.0046870708465576e-07, 4.246830940246582e-07, 4.4889748096466064e-07, 4.731118679046631e-07, 4.973262548446655e-07, 5.21540641784668e-07, 5.457550287246704e-07, 5.699694156646729e-07, 5.941838026046753e-07, 6.183981895446777e-07, 6.426125764846802e-07, 6.668269634246826e-07, 6.910413503646851e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 8.0, 12.0, 19.0, 31.0, 36.0, 48.0, 59.0, 68.0, 97.0, 170.0, 235.0, 358.0, 468.0, 673.0, 1037.0, 1571.0, 2295.0, 3771.0, 6082.0, 11152.0, 20418.0, 42859.0, 109963.0, 487966.0, 225202.0, 67250.0, 29570.0, 15059.0, 8154.0, 4899.0, 3089.0, 1935.0, 1193.0, 867.0, 557.0, 417.0, 278.0, 170.0, 138.0, 108.0, 85.0, 52.0, 49.0, 28.0, 21.0, 11.0, 8.0, 8.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0027484893798828125, -0.002659142017364502, -0.0025697946548461914, -0.002480447292327881, -0.0023910999298095703, -0.0023017525672912598, -0.0022124052047729492, -0.0021230578422546387, -0.002033710479736328, -0.0019443631172180176, -0.001855015754699707, -0.0017656683921813965, -0.001676321029663086, -0.0015869736671447754, -0.0014976263046264648, -0.0014082789421081543, -0.0013189315795898438, -0.0012295842170715332, -0.0011402368545532227, -0.0010508894920349121, -0.0009615421295166016, -0.000872194766998291, -0.0007828474044799805, -0.0006935000419616699, -0.0006041526794433594, -0.0005148053169250488, -0.0004254579544067383, -0.00033611059188842773, -0.0002467632293701172, -0.00015741586685180664, -6.80685043334961e-05, 2.1278858184814453e-05, 0.000110626220703125, 0.00019997358322143555, 0.0002893209457397461, 0.00037866830825805664, 0.0004680156707763672, 0.0005573630332946777, 0.0006467103958129883, 0.0007360577583312988, 0.0008254051208496094, 0.0009147524833679199, 0.0010040998458862305, 0.001093447208404541, 0.0011827945709228516, 0.0012721419334411621, 0.0013614892959594727, 0.0014508366584777832, 0.0015401840209960938, 0.0016295313835144043, 0.0017188787460327148, 0.0018082261085510254, 0.001897573471069336, 0.0019869208335876465, 0.002076268196105957, 0.0021656155586242676, 0.002254962921142578, 0.0023443102836608887, 0.0024336576461791992, 0.0025230050086975098, 0.0026123523712158203, 0.002701699733734131, 0.0027910470962524414, 0.002880394458770752, 0.0029697418212890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 18.0, 11.0, 15.0, 31.0, 41.0, 69.0, 89.0, 206.0, 213.0, 98.0, 57.0, 32.0, 32.0, 19.0, 14.0, 17.0, 12.0, 5.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00079345703125, -0.0007605254650115967, -0.0007275938987731934, -0.00069466233253479, -0.0006617307662963867, -0.0006287992000579834, -0.0005958676338195801, -0.0005629360675811768, -0.0005300045013427734, -0.0004970729351043701, -0.0004641413688659668, -0.0004312098026275635, -0.00039827823638916016, -0.00036534667015075684, -0.0003324151039123535, -0.0002994835376739502, -0.0002665519714355469, -0.00023362040519714355, -0.00020068883895874023, -0.00016775727272033691, -0.0001348257064819336, -0.00010189414024353027, -6.896257400512695e-05, -3.603100776672363e-05, -3.0994415283203125e-06, 2.9832124710083008e-05, 6.276369094848633e-05, 9.569525718688965e-05, 0.00012862682342529297, 0.0001615583896636963, 0.0001944899559020996, 0.00022742152214050293, 0.00026035308837890625, 0.00029328465461730957, 0.0003262162208557129, 0.0003591477870941162, 0.00039207935333251953, 0.00042501091957092285, 0.00045794248580932617, 0.0004908740520477295, 0.0005238056182861328, 0.0005567371845245361, 0.0005896687507629395, 0.0006226003170013428, 0.0006555318832397461, 0.0006884634494781494, 0.0007213950157165527, 0.0007543265819549561, 0.0007872581481933594, 0.0008201897144317627, 0.000853121280670166, 0.0008860528469085693, 0.0009189844131469727, 0.000951915979385376, 0.0009848475456237793, 0.0010177791118621826, 0.001050710678100586, 0.0010836422443389893, 0.0011165738105773926, 0.001149505376815796, 0.0011824369430541992, 0.0012153685092926025, 0.0012483000755310059, 0.0012812316417694092, 0.0013141632080078125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 3.0, 9.0, 6.0, 14.0, 11.0, 18.0, 23.0, 35.0, 44.0, 53.0, 49.0, 69.0, 101.0, 100.0, 87.0, 69.0, 66.0, 34.0, 41.0, 37.0, 27.0, 21.0, 17.0, 13.0, 9.0, 13.0, 7.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06912243366241455, -0.06707853078842163, -0.06503462791442871, -0.06299072504043579, -0.06094681844115257, -0.058902911841869354, -0.056859008967876434, -0.054815106093883514, -0.052771203219890594, -0.050727300345897675, -0.048683393746614456, -0.046639490872621536, -0.044595587998628616, -0.0425516813993454, -0.04050777852535248, -0.03846387565135956, -0.03641996905207634, -0.03437606617808342, -0.0323321595788002, -0.03028825670480728, -0.02824435383081436, -0.026200449094176292, -0.024156544357538223, -0.022112641483545303, -0.020068736746907234, -0.018024832010269165, -0.015980929136276245, -0.013937024399638176, -0.011893120594322681, -0.009849216789007187, -0.007805312052369118, -0.005761408247053623, -0.00371750071644783, -0.001673596678301692, 0.0003703073598444462, 0.002414211630821228, 0.0044581154361367226, 0.006502019241452217, 0.008545923978090286, 0.01058982778340578, 0.012633731588721275, 0.01467763539403677, 0.016721539199352264, 0.018765443935990334, 0.020809348672628403, 0.022853251546621323, 0.024897156283259392, 0.02694106101989746, 0.02898496389389038, 0.03102886863052845, 0.03307277336716652, 0.03511667624115944, 0.03716057911515236, 0.03920448571443558, 0.0412483885884285, 0.04329229146242142, 0.04533619433641434, 0.04738009721040726, 0.049424003809690475, 0.051467906683683395, 0.053511809557676315, 0.055555716156959534, 0.057599619030952454, 0.059643521904945374, 0.06168742850422859]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 6.0, 10.0, 10.0, 10.0, 12.0, 18.0, 17.0, 17.0, 24.0, 30.0, 19.0, 33.0, 25.0, 27.0, 39.0, 35.0, 45.0, 45.0, 39.0, 36.0, 42.0, 43.0, 27.0, 27.0, 36.0, 30.0, 34.0, 41.0, 26.0, 26.0, 22.0, 20.0, 21.0, 16.0, 17.0, 10.0, 10.0, 9.0, 6.0, 4.0, 9.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.04234780743718147, -0.04108668118715286, -0.03982555866241455, -0.03856443613767624, -0.03730330988764763, -0.03604218363761902, -0.03478106111288071, -0.033519938588142395, -0.032258812338113785, -0.030997687950730324, -0.029736563563346863, -0.028475439175963402, -0.02721431478857994, -0.02595319040119648, -0.02469206601381302, -0.023430941626429558, -0.022169817239046097, -0.020908692851662636, -0.019647568464279175, -0.018386444076895714, -0.017125319689512253, -0.015864195302128792, -0.01460307091474533, -0.01334194652736187, -0.012080822139978409, -0.010819697752594948, -0.009558573365211487, -0.008297448977828026, -0.007036324590444565, -0.005775200203061104, -0.004514075815677643, -0.003252951428294182, -0.0019918233156204224, -0.0007306989282369614, 0.0005304254591464996, 0.0017915498465299606, 0.0030526742339134216, 0.004313798621296883, 0.005574923008680344, 0.006836047396063805, 0.008097171783447266, 0.009358296170830727, 0.010619420558214188, 0.011880544945597649, 0.01314166933298111, 0.01440279372036457, 0.01566391810774803, 0.016925042495131493, 0.018186166882514954, 0.019447291269898415, 0.020708415657281876, 0.021969540044665337, 0.023230664432048798, 0.02449178881943226, 0.02575291320681572, 0.02701403759419918, 0.02827516198158264, 0.029536286368966103, 0.030797410756349564, 0.032058537006378174, 0.033319659531116486, 0.0345807820558548, 0.03584190830588341, 0.03710303455591202, 0.03836415708065033]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 6.0, 13.0, 25.0, 32.0, 58.0, 72.0, 94.0, 128.0, 187.0, 290.0, 430.0, 583.0, 911.0, 1373.0, 2058.0, 3256.0, 4835.0, 7331.0, 11517.0, 17690.0, 27660.0, 44185.0, 74533.0, 133960.0, 251572.0, 199906.0, 103706.0, 59714.0, 36637.0, 23114.0, 14695.0, 9476.0, 6146.0, 4085.0, 2741.0, 1817.0, 1212.0, 767.0, 545.0, 337.0, 278.0, 160.0, 129.0, 84.0, 53.0, 38.0, 35.0, 27.0, 16.0, 10.0, 3.0, 6.0, 4.0, 4.0], "bins": [-0.08428955078125, -0.08186721801757812, -0.07944488525390625, -0.07702255249023438, -0.0746002197265625, -0.07217788696289062, -0.06975555419921875, -0.06733322143554688, -0.064910888671875, -0.062488555908203125, -0.06006622314453125, -0.057643890380859375, -0.0552215576171875, -0.052799224853515625, -0.05037689208984375, -0.047954559326171875, -0.0455322265625, -0.043109893798828125, -0.04068756103515625, -0.038265228271484375, -0.0358428955078125, -0.033420562744140625, -0.03099822998046875, -0.028575897216796875, -0.026153564453125, -0.023731231689453125, -0.02130889892578125, -0.018886566162109375, -0.0164642333984375, -0.014041900634765625, -0.01161956787109375, -0.009197235107421875, -0.00677490234375, -0.004352569580078125, -0.00193023681640625, 0.000492095947265625, 0.0029144287109375, 0.005336761474609375, 0.00775909423828125, 0.010181427001953125, 0.012603759765625, 0.015026092529296875, 0.01744842529296875, 0.019870758056640625, 0.0222930908203125, 0.024715423583984375, 0.02713775634765625, 0.029560089111328125, 0.031982421875, 0.034404754638671875, 0.03682708740234375, 0.039249420166015625, 0.0416717529296875, 0.044094085693359375, 0.04651641845703125, 0.048938751220703125, 0.051361083984375, 0.053783416748046875, 0.05620574951171875, 0.058628082275390625, 0.0610504150390625, 0.06347274780273438, 0.06589508056640625, 0.06831741333007812, 0.07073974609375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 4.0, 6.0, 8.0, 10.0, 11.0, 14.0, 13.0, 14.0, 17.0, 22.0, 24.0, 29.0, 23.0, 32.0, 34.0, 39.0, 37.0, 35.0, 48.0, 51.0, 40.0, 34.0, 39.0, 33.0, 43.0, 39.0, 28.0, 25.0, 38.0, 30.0, 30.0, 24.0, 22.0, 22.0, 17.0, 11.0, 12.0, 5.0, 11.0, 5.0, 1.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0413818359375, -0.040190696716308594, -0.03899955749511719, -0.03780841827392578, -0.036617279052734375, -0.03542613983154297, -0.03423500061035156, -0.033043861389160156, -0.03185272216796875, -0.030661582946777344, -0.029470443725585938, -0.02827930450439453, -0.027088165283203125, -0.02589702606201172, -0.024705886840820312, -0.023514747619628906, -0.0223236083984375, -0.021132469177246094, -0.019941329956054688, -0.01875019073486328, -0.017559051513671875, -0.01636791229248047, -0.015176773071289062, -0.013985633850097656, -0.01279449462890625, -0.011603355407714844, -0.010412216186523438, -0.009221076965332031, -0.008029937744140625, -0.006838798522949219, -0.0056476593017578125, -0.004456520080566406, -0.003265380859375, -0.0020742416381835938, -0.0008831024169921875, 0.00030803680419921875, 0.001499176025390625, 0.0026903152465820312, 0.0038814544677734375, 0.005072593688964844, 0.00626373291015625, 0.007454872131347656, 0.008646011352539062, 0.009837150573730469, 0.011028289794921875, 0.012219429016113281, 0.013410568237304688, 0.014601707458496094, 0.0157928466796875, 0.016983985900878906, 0.018175125122070312, 0.01936626434326172, 0.020557403564453125, 0.02174854278564453, 0.022939682006835938, 0.024130821228027344, 0.02532196044921875, 0.026513099670410156, 0.027704238891601562, 0.02889537811279297, 0.030086517333984375, 0.03127765655517578, 0.03246879577636719, 0.033659934997558594, 0.03485107421875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 8.0, 12.0, 12.0, 13.0, 22.0, 54.0, 81.0, 104.0, 150.0, 253.0, 382.0, 548.0, 887.0, 1452.0, 2239.0, 3650.0, 6035.0, 9754.0, 16465.0, 27523.0, 47273.0, 82255.0, 155281.0, 295455.0, 178344.0, 91314.0, 52107.0, 30541.0, 18090.0, 10761.0, 6571.0, 4002.0, 2538.0, 1571.0, 972.0, 642.0, 422.0, 265.0, 158.0, 109.0, 79.0, 61.0, 30.0, 22.0, 20.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0810546875, -0.07831573486328125, -0.0755767822265625, -0.07283782958984375, -0.070098876953125, -0.06735992431640625, -0.0646209716796875, -0.06188201904296875, -0.05914306640625, -0.05640411376953125, -0.0536651611328125, -0.05092620849609375, -0.048187255859375, -0.04544830322265625, -0.0427093505859375, -0.03997039794921875, -0.0372314453125, -0.03449249267578125, -0.0317535400390625, -0.02901458740234375, -0.026275634765625, -0.02353668212890625, -0.0207977294921875, -0.01805877685546875, -0.01531982421875, -0.01258087158203125, -0.0098419189453125, -0.00710296630859375, -0.004364013671875, -0.00162506103515625, 0.0011138916015625, 0.00385284423828125, 0.006591796875, 0.00933074951171875, 0.0120697021484375, 0.01480865478515625, 0.017547607421875, 0.02028656005859375, 0.0230255126953125, 0.02576446533203125, 0.02850341796875, 0.03124237060546875, 0.0339813232421875, 0.03672027587890625, 0.039459228515625, 0.04219818115234375, 0.0449371337890625, 0.04767608642578125, 0.0504150390625, 0.05315399169921875, 0.0558929443359375, 0.05863189697265625, 0.061370849609375, 0.06410980224609375, 0.0668487548828125, 0.06958770751953125, 0.07232666015625, 0.07506561279296875, 0.0778045654296875, 0.08054351806640625, 0.083282470703125, 0.08602142333984375, 0.0887603759765625, 0.09149932861328125, 0.09423828125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 10.0, 15.0, 12.0, 12.0, 21.0, 18.0, 16.0, 22.0, 33.0, 24.0, 27.0, 42.0, 40.0, 43.0, 44.0, 45.0, 34.0, 47.0, 47.0, 44.0, 44.0, 54.0, 32.0, 37.0, 34.0, 24.0, 26.0, 24.0, 26.0, 15.0, 18.0, 17.0, 9.0, 13.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0278167724609375, -0.026989459991455078, -0.026162147521972656, -0.025334835052490234, -0.024507522583007812, -0.02368021011352539, -0.02285289764404297, -0.022025585174560547, -0.021198272705078125, -0.020370960235595703, -0.01954364776611328, -0.01871633529663086, -0.017889022827148438, -0.017061710357666016, -0.016234397888183594, -0.015407085418701172, -0.01457977294921875, -0.013752460479736328, -0.012925148010253906, -0.012097835540771484, -0.011270523071289062, -0.01044321060180664, -0.009615898132324219, -0.008788585662841797, -0.007961273193359375, -0.007133960723876953, -0.006306648254394531, -0.005479335784912109, -0.0046520233154296875, -0.0038247108459472656, -0.0029973983764648438, -0.002170085906982422, -0.0013427734375, -0.0005154609680175781, 0.00031185150146484375, 0.0011391639709472656, 0.0019664764404296875, 0.0027937889099121094, 0.0036211013793945312, 0.004448413848876953, 0.005275726318359375, 0.006103038787841797, 0.006930351257324219, 0.007757663726806641, 0.008584976196289062, 0.009412288665771484, 0.010239601135253906, 0.011066913604736328, 0.01189422607421875, 0.012721538543701172, 0.013548851013183594, 0.014376163482666016, 0.015203475952148438, 0.01603078842163086, 0.01685810089111328, 0.017685413360595703, 0.018512725830078125, 0.019340038299560547, 0.02016735076904297, 0.02099466323852539, 0.021821975708007812, 0.022649288177490234, 0.023476600646972656, 0.024303913116455078, 0.0251312255859375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 7.0, 8.0, 12.0, 24.0, 29.0, 28.0, 48.0, 75.0, 118.0, 124.0, 212.0, 283.0, 341.0, 577.0, 734.0, 1089.0, 1665.0, 2566.0, 4101.0, 7161.0, 13119.0, 30088.0, 163636.0, 737302.0, 45473.0, 17052.0, 8559.0, 4899.0, 3130.0, 1903.0, 1213.0, 846.0, 626.0, 389.0, 285.0, 222.0, 156.0, 119.0, 82.0, 54.0, 52.0, 36.0, 28.0, 31.0, 11.0, 10.0, 4.0, 9.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.008928060531616211, -0.008632183074951172, -0.008336305618286133, -0.008040428161621094, -0.007744550704956055, -0.007448673248291016, -0.0071527957916259766, -0.0068569183349609375, -0.0065610408782958984, -0.006265163421630859, -0.00596928596496582, -0.005673408508300781, -0.005377531051635742, -0.005081653594970703, -0.004785776138305664, -0.004489898681640625, -0.004194021224975586, -0.003898143768310547, -0.003602266311645508, -0.0033063888549804688, -0.0030105113983154297, -0.0027146339416503906, -0.0024187564849853516, -0.0021228790283203125, -0.0018270015716552734, -0.0015311241149902344, -0.0012352466583251953, -0.0009393692016601562, -0.0006434917449951172, -0.0003476142883300781, -5.173683166503906e-05, 0.000244140625, 0.0005400180816650391, 0.0008358955383300781, 0.0011317729949951172, 0.0014276504516601562, 0.0017235279083251953, 0.0020194053649902344, 0.0023152828216552734, 0.0026111602783203125, 0.0029070377349853516, 0.0032029151916503906, 0.0034987926483154297, 0.0037946701049804688, 0.004090547561645508, 0.004386425018310547, 0.004682302474975586, 0.004978179931640625, 0.005274057388305664, 0.005569934844970703, 0.005865812301635742, 0.006161689758300781, 0.00645756721496582, 0.006753444671630859, 0.0070493221282958984, 0.0073451995849609375, 0.0076410770416259766, 0.007936954498291016, 0.008232831954956055, 0.008528709411621094, 0.008824586868286133, 0.009120464324951172, 0.009416341781616211, 0.00971221923828125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 0.0, 4.0, 0.0, 9.0, 0.0, 19.0, 0.0, 29.0, 0.0, 40.0, 0.0, 63.0, 0.0, 127.0, 0.0, 146.0, 0.0, 140.0, 0.0, 159.0, 0.0, 97.0, 0.0, 71.0, 0.0, 31.0, 0.0, 26.0, 0.0, 9.0, 0.0, 9.0, 0.0, 13.0, 0.0, 6.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07, 9.834766387939453e-07, 1.0132789611816406e-06, 1.043081283569336e-06, 1.0728836059570312e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 15.0, 13.0, 32.0, 29.0, 61.0, 76.0, 106.0, 138.0, 210.0, 254.0, 380.0, 528.0, 732.0, 1085.0, 1445.0, 2142.0, 3323.0, 5011.0, 8072.0, 14499.0, 35148.0, 449936.0, 451952.0, 34977.0, 14665.0, 8114.0, 5017.0, 3309.0, 2135.0, 1460.0, 1070.0, 763.0, 509.0, 395.0, 252.0, 200.0, 153.0, 88.0, 73.0, 63.0, 36.0, 20.0, 15.0, 14.0, 11.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00966644287109375, -0.00936436653137207, -0.00906229019165039, -0.008760213851928711, -0.008458137512207031, -0.008156061172485352, -0.007853984832763672, -0.007551908493041992, -0.0072498321533203125, -0.006947755813598633, -0.006645679473876953, -0.0063436031341552734, -0.006041526794433594, -0.005739450454711914, -0.005437374114990234, -0.005135297775268555, -0.004833221435546875, -0.004531145095825195, -0.004229068756103516, -0.003926992416381836, -0.0036249160766601562, -0.0033228397369384766, -0.003020763397216797, -0.002718687057495117, -0.0024166107177734375, -0.002114534378051758, -0.0018124580383300781, -0.0015103816986083984, -0.0012083053588867188, -0.0009062290191650391, -0.0006041526794433594, -0.0003020763397216797, 0.0, 0.0003020763397216797, 0.0006041526794433594, 0.0009062290191650391, 0.0012083053588867188, 0.0015103816986083984, 0.0018124580383300781, 0.002114534378051758, 0.0024166107177734375, 0.002718687057495117, 0.003020763397216797, 0.0033228397369384766, 0.0036249160766601562, 0.003926992416381836, 0.004229068756103516, 0.004531145095825195, 0.004833221435546875, 0.005135297775268555, 0.005437374114990234, 0.005739450454711914, 0.006041526794433594, 0.0063436031341552734, 0.006645679473876953, 0.006947755813598633, 0.0072498321533203125, 0.007551908493041992, 0.007853984832763672, 0.008156061172485352, 0.008458137512207031, 0.008760213851928711, 0.00906229019165039, 0.00936436653137207, 0.00966644287109375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 7.0, 4.0, 8.0, 16.0, 14.0, 28.0, 62.0, 97.0, 474.0, 102.0, 48.0, 33.0, 15.0, 11.0, 6.0, 8.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027713775634765625, -0.002683401107788086, -0.0025954246520996094, -0.002507448196411133, -0.0024194717407226562, -0.0023314952850341797, -0.002243518829345703, -0.0021555423736572266, -0.00206756591796875, -0.0019795894622802734, -0.0018916130065917969, -0.0018036365509033203, -0.0017156600952148438, -0.0016276836395263672, -0.0015397071838378906, -0.001451730728149414, -0.0013637542724609375, -0.001275777816772461, -0.0011878013610839844, -0.0010998249053955078, -0.0010118484497070312, -0.0009238719940185547, -0.0008358955383300781, -0.0007479190826416016, -0.000659942626953125, -0.0005719661712646484, -0.0004839897155761719, -0.0003960132598876953, -0.00030803680419921875, -0.0002200603485107422, -0.00013208389282226562, -4.410743713378906e-05, 4.38690185546875e-05, 0.00013184547424316406, 0.00021982192993164062, 0.0003077983856201172, 0.00039577484130859375, 0.0004837512969970703, 0.0005717277526855469, 0.0006597042083740234, 0.0007476806640625, 0.0008356571197509766, 0.0009236335754394531, 0.0010116100311279297, 0.0010995864868164062, 0.0011875629425048828, 0.0012755393981933594, 0.001363515853881836, 0.0014514923095703125, 0.001539468765258789, 0.0016274452209472656, 0.0017154216766357422, 0.0018033981323242188, 0.0018913745880126953, 0.001979351043701172, 0.0020673274993896484, 0.002155303955078125, 0.0022432804107666016, 0.002331256866455078, 0.0024192333221435547, 0.0025072097778320312, 0.002595186233520508, 0.0026831626892089844, 0.002771139144897461, 0.0028591156005859375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 6.0, 14.0, 17.0, 13.0, 29.0, 38.0, 45.0, 74.0, 90.0, 101.0, 114.0, 112.0, 89.0, 62.0, 40.0, 36.0, 23.0, 17.0, 17.0, 14.0, 15.0, 6.0, 2.0, 9.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08441954106092453, -0.08211138844490051, -0.07980324327945709, -0.07749509066343307, -0.07518693804740906, -0.07287878543138504, -0.07057063281536102, -0.0682624876499176, -0.06595433503389359, -0.06364618241786957, -0.06133803352713585, -0.05902988463640213, -0.05672173202037811, -0.054413579404354095, -0.05210543051362038, -0.04979728162288666, -0.04748912900686264, -0.04518097639083862, -0.042872827500104904, -0.040564678609371185, -0.03825652599334717, -0.03594837337732315, -0.03364022448658943, -0.03133207559585571, -0.029023922979831696, -0.026715772226452827, -0.02440762147307396, -0.02209947071969509, -0.019791319966316223, -0.017483169212937355, -0.015175018459558487, -0.012866867706179619, -0.01055871695280075, -0.008250566199421883, -0.0059424154460430145, -0.0036342646926641464, -0.0013261139392852783, 0.0009820368140935898, 0.003290187567472458, 0.005598338320851326, 0.007906489074230194, 0.010214639827609062, 0.01252279058098793, 0.014830941334366798, 0.017139092087745667, 0.019447242841124535, 0.021755393594503403, 0.02406354434788227, 0.02637169510126114, 0.028679845854640007, 0.030987996608018875, 0.033296145498752594, 0.03560429811477661, 0.03791245073080063, 0.04022059962153435, 0.042528748512268066, 0.044836901128292084, 0.0471450537443161, 0.04945320263504982, 0.05176135152578354, 0.054069504141807556, 0.056377656757831573, 0.05868580564856529, 0.06099395453929901, 0.06330210715532303]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 7.0, 7.0, 7.0, 5.0, 13.0, 20.0, 15.0, 19.0, 24.0, 20.0, 32.0, 38.0, 42.0, 24.0, 41.0, 53.0, 46.0, 38.0, 45.0, 42.0, 55.0, 33.0, 34.0, 38.0, 37.0, 44.0, 26.0, 29.0, 28.0, 25.0, 23.0, 20.0, 13.0, 14.0, 4.0, 15.0, 5.0, 4.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0460062138736248, -0.044649578630924225, -0.04329294338822365, -0.04193630814552307, -0.040579672902822495, -0.03922303766012192, -0.03786640241742134, -0.036509767174720764, -0.03515313193202019, -0.03379649668931961, -0.032439861446619034, -0.031083226203918457, -0.02972659096121788, -0.028369955718517303, -0.027013320475816727, -0.02565668523311615, -0.024300049990415573, -0.022943414747714996, -0.02158677950501442, -0.020230144262313843, -0.018873509019613266, -0.01751687377691269, -0.016160238534212112, -0.014803603291511536, -0.013446968048810959, -0.012090332806110382, -0.010733697563409805, -0.009377062320709229, -0.008020427078008652, -0.006663791835308075, -0.005307156592607498, -0.003950521349906921, -0.002593882381916046, -0.0012372471392154694, 0.00011938810348510742, 0.0014760233461856842, 0.002832658588886261, 0.004189293831586838, 0.0055459290742874146, 0.006902564316987991, 0.008259199559688568, 0.009615834802389145, 0.010972470045089722, 0.012329105287790298, 0.013685740530490875, 0.015042375773191452, 0.01639901101589203, 0.017755646258592606, 0.019112281501293182, 0.02046891674399376, 0.021825551986694336, 0.023182187229394913, 0.02453882247209549, 0.025895457714796066, 0.027252092957496643, 0.02860872820019722, 0.029965363442897797, 0.03132199868559837, 0.03267863392829895, 0.03403526917099953, 0.035391904413700104, 0.03674853965640068, 0.03810517489910126, 0.039461810141801834, 0.04081844538450241]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 8.0, 9.0, 15.0, 21.0, 26.0, 55.0, 73.0, 100.0, 155.0, 231.0, 350.0, 488.0, 707.0, 1047.0, 1450.0, 2263.0, 3515.0, 5258.0, 7965.0, 13325.0, 21306.0, 36005.0, 62648.0, 114406.0, 237376.0, 723014.0, 1822693.0, 663281.0, 225360.0, 107945.0, 57850.0, 32881.0, 19672.0, 12080.0, 7391.0, 4695.0, 3022.0, 1986.0, 1233.0, 815.0, 555.0, 351.0, 221.0, 142.0, 92.0, 60.0, 42.0, 30.0, 25.0, 16.0, 15.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.050140380859375, -0.048438072204589844, -0.04673576354980469, -0.04503345489501953, -0.043331146240234375, -0.04162883758544922, -0.03992652893066406, -0.038224220275878906, -0.03652191162109375, -0.034819602966308594, -0.03311729431152344, -0.03141498565673828, -0.029712677001953125, -0.02801036834716797, -0.026308059692382812, -0.024605751037597656, -0.0229034423828125, -0.021201133728027344, -0.019498825073242188, -0.01779651641845703, -0.016094207763671875, -0.014391899108886719, -0.012689590454101562, -0.010987281799316406, -0.00928497314453125, -0.007582664489746094, -0.0058803558349609375, -0.004178047180175781, -0.002475738525390625, -0.0007734298706054688, 0.0009288787841796875, 0.0026311874389648438, 0.00433349609375, 0.006035804748535156, 0.0077381134033203125, 0.009440422058105469, 0.011142730712890625, 0.012845039367675781, 0.014547348022460938, 0.016249656677246094, 0.01795196533203125, 0.019654273986816406, 0.021356582641601562, 0.02305889129638672, 0.024761199951171875, 0.02646350860595703, 0.028165817260742188, 0.029868125915527344, 0.0315704345703125, 0.033272743225097656, 0.03497505187988281, 0.03667736053466797, 0.038379669189453125, 0.04008197784423828, 0.04178428649902344, 0.043486595153808594, 0.04518890380859375, 0.046891212463378906, 0.04859352111816406, 0.05029582977294922, 0.051998138427734375, 0.05370044708251953, 0.05540275573730469, 0.057105064392089844, 0.058807373046875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 4.0, 10.0, 9.0, 14.0, 19.0, 21.0, 18.0, 26.0, 34.0, 24.0, 36.0, 41.0, 35.0, 40.0, 45.0, 48.0, 50.0, 40.0, 47.0, 40.0, 39.0, 43.0, 26.0, 48.0, 31.0, 31.0, 27.0, 22.0, 28.0, 14.0, 17.0, 16.0, 9.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0254364013671875, -0.024654388427734375, -0.02387237548828125, -0.023090362548828125, -0.022308349609375, -0.021526336669921875, -0.02074432373046875, -0.019962310791015625, -0.0191802978515625, -0.018398284912109375, -0.01761627197265625, -0.016834259033203125, -0.01605224609375, -0.015270233154296875, -0.01448822021484375, -0.013706207275390625, -0.0129241943359375, -0.012142181396484375, -0.01136016845703125, -0.010578155517578125, -0.009796142578125, -0.009014129638671875, -0.00823211669921875, -0.007450103759765625, -0.0066680908203125, -0.005886077880859375, -0.00510406494140625, -0.004322052001953125, -0.0035400390625, -0.002758026123046875, -0.00197601318359375, -0.001194000244140625, -0.0004119873046875, 0.000370025634765625, 0.00115203857421875, 0.001934051513671875, 0.002716064453125, 0.003498077392578125, 0.00428009033203125, 0.005062103271484375, 0.0058441162109375, 0.006626129150390625, 0.00740814208984375, 0.008190155029296875, 0.00897216796875, 0.009754180908203125, 0.01053619384765625, 0.011318206787109375, 0.0121002197265625, 0.012882232666015625, 0.01366424560546875, 0.014446258544921875, 0.015228271484375, 0.016010284423828125, 0.01679229736328125, 0.017574310302734375, 0.0183563232421875, 0.019138336181640625, 0.01992034912109375, 0.020702362060546875, 0.021484375, 0.022266387939453125, 0.02304840087890625, 0.023830413818359375, 0.0246124267578125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 11.0, 5.0, 14.0, 35.0, 50.0, 50.0, 104.0, 158.0, 232.0, 364.0, 538.0, 736.0, 1195.0, 1806.0, 2654.0, 4130.0, 6314.0, 10092.0, 15575.0, 24726.0, 40066.0, 65730.0, 111644.0, 197592.0, 379418.0, 854957.0, 1261745.0, 565241.0, 273845.0, 149807.0, 86607.0, 51897.0, 31615.0, 19693.0, 12619.0, 8086.0, 5243.0, 3466.0, 2188.0, 1465.0, 912.0, 599.0, 406.0, 241.0, 147.0, 95.0, 55.0, 47.0, 32.0, 24.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.035888671875, -0.03477621078491211, -0.03366374969482422, -0.03255128860473633, -0.03143882751464844, -0.030326366424560547, -0.029213905334472656, -0.028101444244384766, -0.026988983154296875, -0.025876522064208984, -0.024764060974121094, -0.023651599884033203, -0.022539138793945312, -0.021426677703857422, -0.02031421661376953, -0.01920175552368164, -0.01808929443359375, -0.01697683334350586, -0.01586437225341797, -0.014751911163330078, -0.013639450073242188, -0.012526988983154297, -0.011414527893066406, -0.010302066802978516, -0.009189605712890625, -0.008077144622802734, -0.006964683532714844, -0.005852222442626953, -0.0047397613525390625, -0.003627300262451172, -0.0025148391723632812, -0.0014023780822753906, -0.0002899169921875, 0.0008225440979003906, 0.0019350051879882812, 0.003047466278076172, 0.0041599273681640625, 0.005272388458251953, 0.006384849548339844, 0.007497310638427734, 0.008609771728515625, 0.009722232818603516, 0.010834693908691406, 0.011947154998779297, 0.013059616088867188, 0.014172077178955078, 0.015284538269042969, 0.01639699935913086, 0.01750946044921875, 0.01862192153930664, 0.01973438262939453, 0.020846843719482422, 0.021959304809570312, 0.023071765899658203, 0.024184226989746094, 0.025296688079833984, 0.026409149169921875, 0.027521610260009766, 0.028634071350097656, 0.029746532440185547, 0.030858993530273438, 0.03197145462036133, 0.03308391571044922, 0.03419637680053711, 0.035308837890625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 6.0, 17.0, 25.0, 13.0, 23.0, 42.0, 38.0, 48.0, 37.0, 65.0, 54.0, 84.0, 80.0, 102.0, 128.0, 144.0, 162.0, 168.0, 175.0, 240.0, 215.0, 227.0, 225.0, 190.0, 221.0, 182.0, 138.0, 144.0, 120.0, 101.0, 97.0, 82.0, 87.0, 65.0, 59.0, 42.0, 38.0, 31.0, 22.0, 25.0, 16.0, 16.0, 14.0, 13.0, 10.0, 2.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.01045989990234375, -0.010130047798156738, -0.009800195693969727, -0.009470343589782715, -0.009140491485595703, -0.008810639381408691, -0.00848078727722168, -0.008150935173034668, -0.007821083068847656, -0.0074912309646606445, -0.007161378860473633, -0.006831526756286621, -0.006501674652099609, -0.006171822547912598, -0.005841970443725586, -0.005512118339538574, -0.0051822662353515625, -0.004852414131164551, -0.004522562026977539, -0.004192709922790527, -0.0038628578186035156, -0.003533005714416504, -0.003203153610229492, -0.0028733015060424805, -0.0025434494018554688, -0.002213597297668457, -0.0018837451934814453, -0.0015538930892944336, -0.0012240409851074219, -0.0008941888809204102, -0.0005643367767333984, -0.00023448467254638672, 9.5367431640625e-05, 0.0004252195358276367, 0.0007550716400146484, 0.0010849237442016602, 0.0014147758483886719, 0.0017446279525756836, 0.0020744800567626953, 0.002404332160949707, 0.0027341842651367188, 0.0030640363693237305, 0.003393888473510742, 0.003723740577697754, 0.004053592681884766, 0.004383444786071777, 0.004713296890258789, 0.005043148994445801, 0.0053730010986328125, 0.005702853202819824, 0.006032705307006836, 0.006362557411193848, 0.006692409515380859, 0.007022261619567871, 0.007352113723754883, 0.0076819658279418945, 0.008011817932128906, 0.008341670036315918, 0.00867152214050293, 0.009001374244689941, 0.009331226348876953, 0.009661078453063965, 0.009990930557250977, 0.010320782661437988, 0.010650634765625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 10.0, 15.0, 18.0, 29.0, 37.0, 39.0, 47.0, 63.0, 87.0, 108.0, 87.0, 90.0, 81.0, 59.0, 50.0, 28.0, 22.0, 29.0, 18.0, 13.0, 18.0, 8.0, 9.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.053438857197761536, -0.05218092352151871, -0.05092299357056618, -0.04966505989432335, -0.04840712621808052, -0.04714919626712799, -0.04589126259088516, -0.044633328914642334, -0.043375395238399506, -0.04211746156215668, -0.04085953161120415, -0.03960159793496132, -0.03834366425871849, -0.03708573430776596, -0.03582780063152313, -0.034569866955280304, -0.033311937004327774, -0.032054003328084946, -0.030796071514487267, -0.029538139700889587, -0.02828020602464676, -0.02702227421104908, -0.0257643423974514, -0.024506408721208572, -0.023248476907610893, -0.021990545094013214, -0.020732611417770386, -0.019474679604172707, -0.018216747790575027, -0.0169588141143322, -0.01570088230073452, -0.014442949555814266, -0.013185016810894012, -0.011927084065973759, -0.010669151321053505, -0.009411219507455826, -0.008153286762535572, -0.006895354017615318, -0.005637421738356352, -0.004379489459097385, -0.0031215567141771317, -0.0018636242020875216, -0.0006056916899979115, 0.0006522408220916986, 0.0019101733341813087, 0.0031681060791015625, 0.004426038358360529, 0.005683970637619495, 0.006941903382539749, 0.008199836127460003, 0.009457768872380257, 0.010715700685977936, 0.01197363343089819, 0.013231566175818443, 0.014489497989416122, 0.01574743166565895, 0.01700536347925663, 0.01826329529285431, 0.019521228969097137, 0.020779160782694817, 0.022037092596292496, 0.023295026272535324, 0.024552958086133003, 0.025810889899730682, 0.02706882357597351]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 8.0, 9.0, 13.0, 11.0, 18.0, 24.0, 21.0, 21.0, 21.0, 22.0, 38.0, 29.0, 32.0, 45.0, 40.0, 41.0, 45.0, 38.0, 47.0, 42.0, 35.0, 47.0, 40.0, 39.0, 36.0, 38.0, 27.0, 32.0, 20.0, 12.0, 13.0, 13.0, 15.0, 15.0, 9.0, 8.0, 4.0, 3.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02443515881896019, -0.023621488362550735, -0.02280781976878643, -0.021994151175022125, -0.02118048071861267, -0.020366810262203217, -0.01955314166843891, -0.018739473074674606, -0.017925802618265152, -0.017112132161855698, -0.016298463568091393, -0.015484794043004513, -0.014671124517917633, -0.013857454992830753, -0.013043785467743874, -0.012230115942656994, -0.011416446417570114, -0.010602776892483234, -0.009789107367396355, -0.008975437842309475, -0.008161768317222595, -0.0073480987921357155, -0.006534429267048836, -0.005720759741961956, -0.004907090216875076, -0.0040934206917881966, -0.003279751166701317, -0.002466081641614437, -0.0016524121165275574, -0.0008387425914406776, -2.5073066353797913e-05, 0.0007885964587330818, 0.0016022678464651108, 0.0024159373715519905, 0.0032296068966388702, 0.00404327642172575, 0.00485694594681263, 0.005670615471899509, 0.006484284996986389, 0.007297954522073269, 0.008111624047160149, 0.008925293572247028, 0.009738963097333908, 0.010552632622420788, 0.011366302147507668, 0.012179971672594547, 0.012993641197681427, 0.013807310722768307, 0.014620980247855186, 0.015434649772942066, 0.016248319298028946, 0.0170619897544384, 0.017875658348202705, 0.01868932694196701, 0.019502997398376465, 0.02031666785478592, 0.021130336448550224, 0.02194400504231453, 0.022757675498723984, 0.023571345955133438, 0.024385014548897743, 0.02519868314266205, 0.026012353599071503, 0.026826024055480957, 0.027639692649245262]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 13.0, 19.0, 22.0, 22.0, 27.0, 55.0, 80.0, 119.0, 166.0, 229.0, 326.0, 450.0, 608.0, 941.0, 1388.0, 2154.0, 3282.0, 4977.0, 8060.0, 13142.0, 22953.0, 40815.0, 77964.0, 158705.0, 304206.0, 197050.0, 94782.0, 48354.0, 26608.0, 15323.0, 9104.0, 5615.0, 3621.0, 2364.0, 1592.0, 1043.0, 743.0, 512.0, 313.0, 220.0, 167.0, 117.0, 100.0, 58.0, 42.0, 36.0, 21.0, 12.0, 9.0, 10.0, 6.0, 2.0, 6.0, 1.0], "bins": [-0.0142669677734375, -0.01385509967803955, -0.013443231582641602, -0.013031363487243652, -0.012619495391845703, -0.012207627296447754, -0.011795759201049805, -0.011383891105651855, -0.010972023010253906, -0.010560154914855957, -0.010148286819458008, -0.009736418724060059, -0.00932455062866211, -0.00891268253326416, -0.008500814437866211, -0.008088946342468262, -0.0076770782470703125, -0.007265210151672363, -0.006853342056274414, -0.006441473960876465, -0.006029605865478516, -0.005617737770080566, -0.005205869674682617, -0.004794001579284668, -0.004382133483886719, -0.0039702653884887695, -0.0035583972930908203, -0.003146529197692871, -0.002734661102294922, -0.0023227930068969727, -0.0019109249114990234, -0.0014990568161010742, -0.001087188720703125, -0.0006753206253051758, -0.00026345252990722656, 0.00014841556549072266, 0.0005602836608886719, 0.0009721517562866211, 0.0013840198516845703, 0.0017958879470825195, 0.0022077560424804688, 0.002619624137878418, 0.003031492233276367, 0.0034433603286743164, 0.0038552284240722656, 0.004267096519470215, 0.004678964614868164, 0.005090832710266113, 0.0055027008056640625, 0.005914568901062012, 0.006326436996459961, 0.00673830509185791, 0.007150173187255859, 0.007562041282653809, 0.007973909378051758, 0.008385777473449707, 0.008797645568847656, 0.009209513664245605, 0.009621381759643555, 0.010033249855041504, 0.010445117950439453, 0.010856986045837402, 0.011268854141235352, 0.0116807222366333, 0.01209259033203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 10.0, 8.0, 16.0, 16.0, 12.0, 20.0, 17.0, 25.0, 33.0, 25.0, 25.0, 31.0, 40.0, 44.0, 40.0, 43.0, 44.0, 48.0, 43.0, 45.0, 44.0, 42.0, 43.0, 29.0, 34.0, 34.0, 26.0, 22.0, 24.0, 16.0, 6.0, 13.0, 17.0, 12.0, 7.0, 4.0, 3.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.026123046875, -0.025298118591308594, -0.024473190307617188, -0.02364826202392578, -0.022823333740234375, -0.02199840545654297, -0.021173477172851562, -0.020348548889160156, -0.01952362060546875, -0.018698692321777344, -0.017873764038085938, -0.01704883575439453, -0.016223907470703125, -0.015398979187011719, -0.014574050903320312, -0.013749122619628906, -0.0129241943359375, -0.012099266052246094, -0.011274337768554688, -0.010449409484863281, -0.009624481201171875, -0.008799552917480469, -0.007974624633789062, -0.007149696350097656, -0.00632476806640625, -0.005499839782714844, -0.0046749114990234375, -0.0038499832153320312, -0.003025054931640625, -0.0022001266479492188, -0.0013751983642578125, -0.0005502700805664062, 0.000274658203125, 0.0010995864868164062, 0.0019245147705078125, 0.0027494430541992188, 0.003574371337890625, 0.004399299621582031, 0.0052242279052734375, 0.006049156188964844, 0.00687408447265625, 0.007699012756347656, 0.008523941040039062, 0.009348869323730469, 0.010173797607421875, 0.010998725891113281, 0.011823654174804688, 0.012648582458496094, 0.0134735107421875, 0.014298439025878906, 0.015123367309570312, 0.01594829559326172, 0.016773223876953125, 0.01759815216064453, 0.018423080444335938, 0.019248008728027344, 0.02007293701171875, 0.020897865295410156, 0.021722793579101562, 0.02254772186279297, 0.023372650146484375, 0.02419757843017578, 0.025022506713867188, 0.025847434997558594, 0.02667236328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 3.0, 8.0, 13.0, 18.0, 22.0, 32.0, 46.0, 70.0, 110.0, 135.0, 205.0, 283.0, 503.0, 711.0, 1027.0, 1647.0, 2486.0, 3946.0, 6426.0, 11219.0, 22738.0, 59215.0, 225410.0, 520696.0, 115221.0, 37386.0, 16117.0, 8637.0, 4972.0, 3135.0, 1972.0, 1381.0, 878.0, 615.0, 414.0, 264.0, 183.0, 132.0, 98.0, 57.0, 38.0, 22.0, 16.0, 17.0, 12.0, 10.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0258636474609375, -0.025109052658081055, -0.02435445785522461, -0.023599863052368164, -0.02284526824951172, -0.022090673446655273, -0.021336078643798828, -0.020581483840942383, -0.019826889038085938, -0.019072294235229492, -0.018317699432373047, -0.0175631046295166, -0.016808509826660156, -0.01605391502380371, -0.015299320220947266, -0.01454472541809082, -0.013790130615234375, -0.01303553581237793, -0.012280941009521484, -0.011526346206665039, -0.010771751403808594, -0.010017156600952148, -0.009262561798095703, -0.008507966995239258, -0.0077533721923828125, -0.006998777389526367, -0.006244182586669922, -0.0054895877838134766, -0.004734992980957031, -0.003980398178100586, -0.0032258033752441406, -0.0024712085723876953, -0.00171661376953125, -0.0009620189666748047, -0.00020742416381835938, 0.0005471706390380859, 0.0013017654418945312, 0.0020563602447509766, 0.002810955047607422, 0.003565549850463867, 0.0043201446533203125, 0.005074739456176758, 0.005829334259033203, 0.0065839290618896484, 0.007338523864746094, 0.008093118667602539, 0.008847713470458984, 0.00960230827331543, 0.010356903076171875, 0.01111149787902832, 0.011866092681884766, 0.012620687484741211, 0.013375282287597656, 0.014129877090454102, 0.014884471893310547, 0.015639066696166992, 0.016393661499023438, 0.017148256301879883, 0.017902851104736328, 0.018657445907592773, 0.01941204071044922, 0.020166635513305664, 0.02092123031616211, 0.021675825119018555, 0.022430419921875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 7.0, 7.0, 10.0, 7.0, 11.0, 22.0, 21.0, 19.0, 24.0, 26.0, 30.0, 32.0, 39.0, 31.0, 43.0, 35.0, 33.0, 45.0, 42.0, 34.0, 41.0, 42.0, 46.0, 37.0, 41.0, 36.0, 33.0, 26.0, 31.0, 20.0, 22.0, 11.0, 19.0, 12.0, 18.0, 9.0, 11.0, 14.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0173492431640625, -0.01680731773376465, -0.016265392303466797, -0.015723466873168945, -0.015181541442871094, -0.014639616012573242, -0.01409769058227539, -0.013555765151977539, -0.013013839721679688, -0.012471914291381836, -0.011929988861083984, -0.011388063430786133, -0.010846138000488281, -0.01030421257019043, -0.009762287139892578, -0.009220361709594727, -0.008678436279296875, -0.008136510848999023, -0.007594585418701172, -0.00705265998840332, -0.006510734558105469, -0.005968809127807617, -0.005426883697509766, -0.004884958267211914, -0.0043430328369140625, -0.003801107406616211, -0.0032591819763183594, -0.002717256546020508, -0.0021753311157226562, -0.0016334056854248047, -0.0010914802551269531, -0.0005495548248291016, -7.62939453125e-06, 0.0005342960357666016, 0.0010762214660644531, 0.0016181468963623047, 0.0021600723266601562, 0.002701997756958008, 0.0032439231872558594, 0.003785848617553711, 0.0043277740478515625, 0.004869699478149414, 0.005411624908447266, 0.005953550338745117, 0.006495475769042969, 0.00703740119934082, 0.007579326629638672, 0.008121252059936523, 0.008663177490234375, 0.009205102920532227, 0.009747028350830078, 0.01028895378112793, 0.010830879211425781, 0.011372804641723633, 0.011914730072021484, 0.012456655502319336, 0.012998580932617188, 0.013540506362915039, 0.01408243179321289, 0.014624357223510742, 0.015166282653808594, 0.015708208084106445, 0.016250133514404297, 0.01679205894470215, 0.017333984375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 8.0, 8.0, 28.0, 24.0, 29.0, 40.0, 74.0, 79.0, 98.0, 141.0, 164.0, 223.0, 381.0, 441.0, 584.0, 942.0, 1299.0, 1936.0, 3059.0, 5213.0, 9610.0, 20625.0, 68923.0, 711271.0, 160944.0, 31659.0, 12783.0, 6437.0, 3733.0, 2308.0, 1548.0, 1080.0, 770.0, 531.0, 421.0, 324.0, 209.0, 144.0, 107.0, 90.0, 64.0, 50.0, 30.0, 34.0, 20.0, 12.0, 11.0, 11.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0021762847900390625, -0.0021076500415802, -0.002039015293121338, -0.0019703805446624756, -0.0019017457962036133, -0.001833111047744751, -0.0017644762992858887, -0.0016958415508270264, -0.001627206802368164, -0.0015585720539093018, -0.0014899373054504395, -0.0014213025569915771, -0.0013526678085327148, -0.0012840330600738525, -0.0012153983116149902, -0.001146763563156128, -0.0010781288146972656, -0.0010094940662384033, -0.000940859317779541, -0.0008722245693206787, -0.0008035898208618164, -0.0007349550724029541, -0.0006663203239440918, -0.0005976855754852295, -0.0005290508270263672, -0.0004604160785675049, -0.0003917813301086426, -0.0003231465816497803, -0.00025451183319091797, -0.00018587708473205566, -0.00011724233627319336, -4.8607587814331055e-05, 2.002716064453125e-05, 8.866190910339355e-05, 0.00015729665756225586, 0.00022593140602111816, 0.00029456615447998047, 0.0003632009029388428, 0.0004318356513977051, 0.0005004703998565674, 0.0005691051483154297, 0.000637739896774292, 0.0007063746452331543, 0.0007750093936920166, 0.0008436441421508789, 0.0009122788906097412, 0.0009809136390686035, 0.0010495483875274658, 0.0011181831359863281, 0.0011868178844451904, 0.0012554526329040527, 0.001324087381362915, 0.0013927221298217773, 0.0014613568782806396, 0.001529991626739502, 0.0015986263751983643, 0.0016672611236572266, 0.0017358958721160889, 0.0018045306205749512, 0.0018731653690338135, 0.0019418001174926758, 0.002010434865951538, 0.0020790696144104004, 0.0021477043628692627, 0.002216339111328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 0.0, 6.0, 0.0, 7.0, 11.0, 0.0, 17.0, 0.0, 25.0, 0.0, 26.0, 0.0, 29.0, 0.0, 48.0, 0.0, 65.0, 0.0, 83.0, 0.0, 112.0, 105.0, 0.0, 123.0, 0.0, 100.0, 0.0, 72.0, 0.0, 58.0, 0.0, 34.0, 0.0, 26.0, 0.0, 19.0, 10.0, 0.0, 10.0, 0.0, 5.0, 0.0, 7.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0728836059570312e-06, -1.041218638420105e-06, -1.0095536708831787e-06, -9.778887033462524e-07, -9.462237358093262e-07, -9.145587682723999e-07, -8.828938007354736e-07, -8.512288331985474e-07, -8.195638656616211e-07, -7.878988981246948e-07, -7.562339305877686e-07, -7.245689630508423e-07, -6.92903995513916e-07, -6.612390279769897e-07, -6.295740604400635e-07, -5.979090929031372e-07, -5.662441253662109e-07, -5.345791578292847e-07, -5.029141902923584e-07, -4.7124922275543213e-07, -4.3958425521850586e-07, -4.079192876815796e-07, -3.762543201446533e-07, -3.4458935260772705e-07, -3.129243850708008e-07, -2.812594175338745e-07, -2.4959444999694824e-07, -2.1792948246002197e-07, -1.862645149230957e-07, -1.5459954738616943e-07, -1.2293457984924316e-07, -9.12696123123169e-08, -5.960464477539063e-08, -2.7939677238464355e-08, 3.725290298461914e-09, 3.5390257835388184e-08, 6.705522537231445e-08, 9.872019290924072e-08, 1.30385160446167e-07, 1.6205012798309326e-07, 1.9371509552001953e-07, 2.253800630569458e-07, 2.5704503059387207e-07, 2.8870999813079834e-07, 3.203749656677246e-07, 3.520399332046509e-07, 3.8370490074157715e-07, 4.153698682785034e-07, 4.470348358154297e-07, 4.78699803352356e-07, 5.103647708892822e-07, 5.420297384262085e-07, 5.736947059631348e-07, 6.05359673500061e-07, 6.370246410369873e-07, 6.686896085739136e-07, 7.003545761108398e-07, 7.320195436477661e-07, 7.636845111846924e-07, 7.953494787216187e-07, 8.270144462585449e-07, 8.586794137954712e-07, 8.903443813323975e-07, 9.220093488693237e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 17.0, 22.0, 25.0, 27.0, 49.0, 80.0, 95.0, 143.0, 211.0, 253.0, 375.0, 538.0, 799.0, 1128.0, 1769.0, 2645.0, 4138.0, 6826.0, 11596.0, 21898.0, 50006.0, 166633.0, 564086.0, 125739.0, 42150.0, 19297.0, 10595.0, 6112.0, 3803.0, 2383.0, 1585.0, 1060.0, 744.0, 489.0, 363.0, 221.0, 172.0, 128.0, 108.0, 55.0, 53.0, 35.0, 27.0, 28.0, 8.0, 14.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002017974853515625, -0.0019516050815582275, -0.00188523530960083, -0.0018188655376434326, -0.0017524957656860352, -0.0016861259937286377, -0.0016197562217712402, -0.0015533864498138428, -0.0014870166778564453, -0.0014206469058990479, -0.0013542771339416504, -0.001287907361984253, -0.0012215375900268555, -0.001155167818069458, -0.0010887980461120605, -0.001022428274154663, -0.0009560585021972656, -0.0008896887302398682, -0.0008233189582824707, -0.0007569491863250732, -0.0006905794143676758, -0.0006242096424102783, -0.0005578398704528809, -0.0004914700984954834, -0.00042510032653808594, -0.0003587305545806885, -0.000292360782623291, -0.00022599101066589355, -0.0001596212387084961, -9.325146675109863e-05, -2.6881694793701172e-05, 3.948807716369629e-05, 0.00010585784912109375, 0.0001722276210784912, 0.00023859739303588867, 0.00030496716499328613, 0.0003713369369506836, 0.00043770670890808105, 0.0005040764808654785, 0.000570446252822876, 0.0006368160247802734, 0.0007031857967376709, 0.0007695555686950684, 0.0008359253406524658, 0.0009022951126098633, 0.0009686648845672607, 0.0010350346565246582, 0.0011014044284820557, 0.0011677742004394531, 0.0012341439723968506, 0.001300513744354248, 0.0013668835163116455, 0.001433253288269043, 0.0014996230602264404, 0.0015659928321838379, 0.0016323626041412354, 0.0016987323760986328, 0.0017651021480560303, 0.0018314719200134277, 0.0018978416919708252, 0.0019642114639282227, 0.00203058123588562, 0.0020969510078430176, 0.002163320779800415, 0.0022296905517578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 8.0, 7.0, 7.0, 4.0, 7.0, 5.0, 12.0, 12.0, 21.0, 30.0, 43.0, 39.0, 65.0, 122.0, 168.0, 139.0, 77.0, 51.0, 41.0, 26.0, 23.0, 18.0, 9.0, 13.0, 3.0, 9.0, 7.0, 7.0, 4.0, 9.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005931854248046875, -0.0005750581622123718, -0.0005569308996200562, -0.0005388036370277405, -0.0005206763744354248, -0.0005025491118431091, -0.00048442184925079346, -0.0004662945866584778, -0.0004481673240661621, -0.00043004006147384644, -0.00041191279888153076, -0.0003937855362892151, -0.0003756582736968994, -0.00035753101110458374, -0.00033940374851226807, -0.0003212764859199524, -0.0003031492233276367, -0.00028502196073532104, -0.00026689469814300537, -0.0002487674355506897, -0.00023064017295837402, -0.00021251291036605835, -0.00019438564777374268, -0.000176258385181427, -0.00015813112258911133, -0.00014000385999679565, -0.00012187659740447998, -0.0001037493348121643, -8.562207221984863e-05, -6.749480962753296e-05, -4.9367547035217285e-05, -3.124028444290161e-05, -1.3113021850585938e-05, 5.014240741729736e-06, 2.314150333404541e-05, 4.1268765926361084e-05, 5.939602851867676e-05, 7.752329111099243e-05, 9.56505537033081e-05, 0.00011377781629562378, 0.00013190507888793945, 0.00015003234148025513, 0.0001681596040725708, 0.00018628686666488647, 0.00020441412925720215, 0.00022254139184951782, 0.0002406686544418335, 0.00025879591703414917, 0.00027692317962646484, 0.0002950504422187805, 0.0003131777048110962, 0.00033130496740341187, 0.00034943222999572754, 0.0003675594925880432, 0.0003856867551803589, 0.00040381401777267456, 0.00042194128036499023, 0.0004400685429573059, 0.0004581958055496216, 0.00047632306814193726, 0.0004944503307342529, 0.0005125775933265686, 0.0005307048559188843, 0.0005488321185112, 0.0005669593811035156]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 10.0, 20.0, 24.0, 23.0, 34.0, 39.0, 50.0, 62.0, 89.0, 105.0, 103.0, 90.0, 70.0, 57.0, 53.0, 22.0, 33.0, 21.0, 20.0, 10.0, 16.0, 9.0, 7.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.05350768193602562, -0.052246592938899994, -0.05098550021648407, -0.049724411219358444, -0.04846332222223282, -0.047202229499816895, -0.04594114050269127, -0.04468005150556564, -0.04341895878314972, -0.042157869786024094, -0.04089677706360817, -0.039635688066482544, -0.03837459906935692, -0.037113506346940994, -0.03585241734981537, -0.034591324627399445, -0.03333023935556412, -0.03206915035843849, -0.030808059498667717, -0.029546968638896942, -0.028285877779126167, -0.027024786919355392, -0.025763697922229767, -0.024502607062458992, -0.023241516202688217, -0.021980425342917442, -0.020719336345791817, -0.019458245486021042, -0.018197154626250267, -0.016936063766479492, -0.015674974769353867, -0.014413883909583092, -0.013152791187167168, -0.011891701258718967, -0.010630610398948193, -0.009369520470499992, -0.008108429610729218, -0.006847339682281017, -0.005586249753832817, -0.004325158894062042, -0.003064068965613842, -0.0018029786879196763, -0.0005418884102255106, 0.0007192017510533333, 0.001980292145162821, 0.0032413825392723083, 0.004502472467720509, 0.005763563327491283, 0.007024653255939484, 0.008285743184387684, 0.009546834044158459, 0.010807923972606659, 0.012069014832377434, 0.013330104760825634, 0.014591194689273834, 0.01585228554904461, 0.017113376408815384, 0.01837446726858616, 0.019635556265711784, 0.02089664712548256, 0.022157737985253334, 0.02341882884502411, 0.024679917842149734, 0.02594100870192051, 0.027202097699046135]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 10.0, 13.0, 12.0, 17.0, 25.0, 22.0, 19.0, 23.0, 24.0, 37.0, 31.0, 34.0, 43.0, 42.0, 37.0, 44.0, 39.0, 49.0, 36.0, 42.0, 40.0, 42.0, 42.0, 38.0, 34.0, 30.0, 27.0, 21.0, 13.0, 15.0, 11.0, 14.0, 14.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024233534932136536, -0.02342360094189644, -0.02261366695165634, -0.021803731098771095, -0.020993797108530998, -0.0201838631182909, -0.019373927265405655, -0.018563993275165558, -0.01775405928492546, -0.016944125294685364, -0.016134191304445267, -0.01532425545156002, -0.014514321461319923, -0.013704387471079826, -0.012894452549517155, -0.012084517627954483, -0.011274583637714386, -0.010464649647474289, -0.009654714725911617, -0.008844779804348946, -0.008034845814108849, -0.007224911358207464, -0.00641497690230608, -0.0056050424464046955, -0.004795107990503311, -0.003985173534601927, -0.0031752390787005424, -0.002365304622799158, -0.0015553701668977737, -0.0007454357109963894, 6.449874490499496e-05, 0.0008744332008063793, 0.001684369519352913, 0.0024943039752542973, 0.0033042384311556816, 0.004114172887057066, 0.00492410734295845, 0.005734041798859835, 0.006543976254761219, 0.007353910710662603, 0.008163845166563988, 0.008973779156804085, 0.009783714078366756, 0.010593648999929428, 0.011403582990169525, 0.012213516980409622, 0.013023451901972294, 0.013833386823534966, 0.014643320813775063, 0.01545325480401516, 0.016263190656900406, 0.017073124647140503, 0.0178830586373806, 0.018692992627620697, 0.019502926617860794, 0.02031286247074604, 0.021122796460986137, 0.021932730451226234, 0.02274266630411148, 0.023552600294351578, 0.024362534284591675, 0.025172468274831772, 0.02598240226507187, 0.026792338117957115, 0.027602272108197212]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 15.0, 14.0, 15.0, 30.0, 43.0, 59.0, 79.0, 98.0, 147.0, 190.0, 305.0, 404.0, 576.0, 732.0, 1036.0, 1384.0, 1968.0, 2764.0, 3890.0, 5798.0, 8284.0, 11868.0, 17441.0, 26191.0, 40010.0, 62753.0, 100519.0, 166224.0, 216645.0, 136476.0, 83279.0, 52841.0, 34037.0, 22558.0, 15088.0, 10350.0, 7152.0, 4942.0, 3496.0, 2564.0, 1719.0, 1302.0, 917.0, 666.0, 484.0, 357.0, 237.0, 179.0, 153.0, 78.0, 69.0, 33.0, 42.0, 24.0, 24.0, 9.0, 0.0, 4.0, 4.0], "bins": [-0.04107666015625, -0.03984355926513672, -0.03861045837402344, -0.037377357482910156, -0.036144256591796875, -0.034911155700683594, -0.03367805480957031, -0.03244495391845703, -0.03121185302734375, -0.02997875213623047, -0.028745651245117188, -0.027512550354003906, -0.026279449462890625, -0.025046348571777344, -0.023813247680664062, -0.02258014678955078, -0.0213470458984375, -0.02011394500732422, -0.018880844116210938, -0.017647743225097656, -0.016414642333984375, -0.015181541442871094, -0.013948440551757812, -0.012715339660644531, -0.01148223876953125, -0.010249137878417969, -0.009016036987304688, -0.007782936096191406, -0.006549835205078125, -0.005316734313964844, -0.0040836334228515625, -0.0028505325317382812, -0.001617431640625, -0.00038433074951171875, 0.0008487701416015625, 0.0020818710327148438, 0.003314971923828125, 0.004548072814941406, 0.0057811737060546875, 0.007014274597167969, 0.00824737548828125, 0.009480476379394531, 0.010713577270507812, 0.011946678161621094, 0.013179779052734375, 0.014412879943847656, 0.015645980834960938, 0.01687908172607422, 0.0181121826171875, 0.01934528350830078, 0.020578384399414062, 0.021811485290527344, 0.023044586181640625, 0.024277687072753906, 0.025510787963867188, 0.02674388885498047, 0.02797698974609375, 0.02921009063720703, 0.030443191528320312, 0.031676292419433594, 0.032909393310546875, 0.034142494201660156, 0.03537559509277344, 0.03660869598388672, 0.037841796875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 2.0, 5.0, 5.0, 9.0, 11.0, 20.0, 23.0, 15.0, 24.0, 16.0, 19.0, 36.0, 29.0, 27.0, 40.0, 36.0, 40.0, 43.0, 45.0, 29.0, 44.0, 41.0, 37.0, 33.0, 49.0, 45.0, 30.0, 34.0, 39.0, 24.0, 23.0, 20.0, 13.0, 15.0, 9.0, 9.0, 8.0, 7.0, 11.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0214691162109375, -0.0207977294921875, -0.0201263427734375, -0.0194549560546875, -0.0187835693359375, -0.0181121826171875, -0.0174407958984375, -0.0167694091796875, -0.0160980224609375, -0.0154266357421875, -0.0147552490234375, -0.0140838623046875, -0.0134124755859375, -0.0127410888671875, -0.0120697021484375, -0.0113983154296875, -0.0107269287109375, -0.0100555419921875, -0.0093841552734375, -0.0087127685546875, -0.0080413818359375, -0.0073699951171875, -0.0066986083984375, -0.0060272216796875, -0.0053558349609375, -0.0046844482421875, -0.0040130615234375, -0.0033416748046875, -0.0026702880859375, -0.0019989013671875, -0.0013275146484375, -0.0006561279296875, 1.52587890625e-05, 0.0006866455078125, 0.0013580322265625, 0.0020294189453125, 0.0027008056640625, 0.0033721923828125, 0.0040435791015625, 0.0047149658203125, 0.0053863525390625, 0.0060577392578125, 0.0067291259765625, 0.0074005126953125, 0.0080718994140625, 0.0087432861328125, 0.0094146728515625, 0.0100860595703125, 0.0107574462890625, 0.0114288330078125, 0.0121002197265625, 0.0127716064453125, 0.0134429931640625, 0.0141143798828125, 0.0147857666015625, 0.0154571533203125, 0.0161285400390625, 0.0167999267578125, 0.0174713134765625, 0.0181427001953125, 0.0188140869140625, 0.0194854736328125, 0.0201568603515625, 0.0208282470703125, 0.0214996337890625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 11.0, 16.0, 28.0, 33.0, 61.0, 101.0, 169.0, 231.0, 401.0, 578.0, 955.0, 1403.0, 2282.0, 3499.0, 5769.0, 9069.0, 14667.0, 23917.0, 39810.0, 66915.0, 116245.0, 215178.0, 235549.0, 127569.0, 72728.0, 43214.0, 25764.0, 15968.0, 9598.0, 6210.0, 3811.0, 2529.0, 1555.0, 988.0, 617.0, 390.0, 239.0, 179.0, 106.0, 79.0, 41.0, 30.0, 13.0, 16.0, 8.0, 10.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048675537109375, -0.047204017639160156, -0.04573249816894531, -0.04426097869873047, -0.042789459228515625, -0.04131793975830078, -0.03984642028808594, -0.038374900817871094, -0.03690338134765625, -0.035431861877441406, -0.03396034240722656, -0.03248882293701172, -0.031017303466796875, -0.02954578399658203, -0.028074264526367188, -0.026602745056152344, -0.0251312255859375, -0.023659706115722656, -0.022188186645507812, -0.02071666717529297, -0.019245147705078125, -0.01777362823486328, -0.016302108764648438, -0.014830589294433594, -0.01335906982421875, -0.011887550354003906, -0.010416030883789062, -0.008944511413574219, -0.007472991943359375, -0.006001472473144531, -0.0045299530029296875, -0.0030584335327148438, -0.0015869140625, -0.00011539459228515625, 0.0013561248779296875, 0.0028276443481445312, 0.004299163818359375, 0.005770683288574219, 0.0072422027587890625, 0.008713722229003906, 0.01018524169921875, 0.011656761169433594, 0.013128280639648438, 0.014599800109863281, 0.016071319580078125, 0.01754283905029297, 0.019014358520507812, 0.020485877990722656, 0.0219573974609375, 0.023428916931152344, 0.024900436401367188, 0.02637195587158203, 0.027843475341796875, 0.02931499481201172, 0.030786514282226562, 0.032258033752441406, 0.03372955322265625, 0.035201072692871094, 0.03667259216308594, 0.03814411163330078, 0.039615631103515625, 0.04108715057373047, 0.04255867004394531, 0.044030189514160156, 0.045501708984375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 6.0, 10.0, 10.0, 9.0, 10.0, 15.0, 15.0, 17.0, 25.0, 25.0, 27.0, 32.0, 27.0, 41.0, 18.0, 34.0, 38.0, 36.0, 37.0, 34.0, 36.0, 46.0, 49.0, 26.0, 29.0, 29.0, 39.0, 32.0, 34.0, 33.0, 31.0, 21.0, 23.0, 24.0, 13.0, 15.0, 10.0, 9.0, 8.0, 6.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01239013671875, -0.011963844299316406, -0.011537551879882812, -0.011111259460449219, -0.010684967041015625, -0.010258674621582031, -0.009832382202148438, -0.009406089782714844, -0.00897979736328125, -0.008553504943847656, -0.008127212524414062, -0.007700920104980469, -0.007274627685546875, -0.006848335266113281, -0.0064220428466796875, -0.005995750427246094, -0.0055694580078125, -0.005143165588378906, -0.0047168731689453125, -0.004290580749511719, -0.003864288330078125, -0.0034379959106445312, -0.0030117034912109375, -0.0025854110717773438, -0.00215911865234375, -0.0017328262329101562, -0.0013065338134765625, -0.0008802413940429688, -0.000453948974609375, -2.765655517578125e-05, 0.0003986358642578125, 0.0008249282836914062, 0.001251220703125, 0.0016775131225585938, 0.0021038055419921875, 0.0025300979614257812, 0.002956390380859375, 0.0033826828002929688, 0.0038089752197265625, 0.004235267639160156, 0.00466156005859375, 0.005087852478027344, 0.0055141448974609375, 0.005940437316894531, 0.006366729736328125, 0.006793022155761719, 0.0072193145751953125, 0.007645606994628906, 0.0080718994140625, 0.008498191833496094, 0.008924484252929688, 0.009350776672363281, 0.009777069091796875, 0.010203361511230469, 0.010629653930664062, 0.011055946350097656, 0.01148223876953125, 0.011908531188964844, 0.012334823608398438, 0.012761116027832031, 0.013187408447265625, 0.013613700866699219, 0.014039993286132812, 0.014466285705566406, 0.014892578125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 12.0, 31.0, 37.0, 46.0, 67.0, 105.0, 162.0, 199.0, 313.0, 384.0, 518.0, 673.0, 936.0, 1235.0, 1694.0, 2282.0, 3341.0, 4786.0, 7278.0, 11736.0, 21319.0, 54116.0, 561180.0, 282025.0, 42303.0, 18851.0, 10681.0, 6521.0, 4315.0, 3123.0, 2219.0, 1623.0, 1227.0, 847.0, 633.0, 490.0, 308.0, 257.0, 214.0, 112.0, 94.0, 78.0, 53.0, 32.0, 37.0, 17.0, 8.0, 16.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.0030975341796875, -0.003006160259246826, -0.0029147863388061523, -0.0028234124183654785, -0.0027320384979248047, -0.002640664577484131, -0.002549290657043457, -0.002457916736602783, -0.0023665428161621094, -0.0022751688957214355, -0.0021837949752807617, -0.002092421054840088, -0.002001047134399414, -0.0019096732139587402, -0.0018182992935180664, -0.0017269253730773926, -0.0016355514526367188, -0.001544177532196045, -0.001452803611755371, -0.0013614296913146973, -0.0012700557708740234, -0.0011786818504333496, -0.0010873079299926758, -0.000995934009552002, -0.0009045600891113281, -0.0008131861686706543, -0.0007218122482299805, -0.0006304383277893066, -0.0005390644073486328, -0.000447690486907959, -0.00035631656646728516, -0.00026494264602661133, -0.0001735687255859375, -8.219480514526367e-05, 9.179115295410156e-06, 0.00010055303573608398, 0.0001919269561767578, 0.00028330087661743164, 0.00037467479705810547, 0.0004660487174987793, 0.0005574226379394531, 0.000648796558380127, 0.0007401704788208008, 0.0008315443992614746, 0.0009229183197021484, 0.0010142922401428223, 0.001105666160583496, 0.00119704008102417, 0.0012884140014648438, 0.0013797879219055176, 0.0014711618423461914, 0.0015625357627868652, 0.001653909683227539, 0.0017452836036682129, 0.0018366575241088867, 0.0019280314445495605, 0.0020194053649902344, 0.002110779285430908, 0.002202153205871582, 0.002293527126312256, 0.0023849010467529297, 0.0024762749671936035, 0.0025676488876342773, 0.002659022808074951, 0.002750396728515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 9.0, 0.0, 12.0, 0.0, 21.0, 0.0, 27.0, 0.0, 46.0, 0.0, 69.0, 0.0, 104.0, 0.0, 141.0, 0.0, 159.0, 0.0, 151.0, 0.0, 97.0, 0.0, 67.0, 0.0, 35.0, 0.0, 20.0, 0.0, 9.0, 0.0, 13.0, 0.0, 12.0, 0.0, 7.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.0132789611816406e-06, -9.834766387939453e-07, -9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 11.0, 12.0, 18.0, 20.0, 30.0, 34.0, 54.0, 93.0, 89.0, 137.0, 215.0, 290.0, 412.0, 584.0, 837.0, 1336.0, 1961.0, 3441.0, 5322.0, 9506.0, 17913.0, 48890.0, 665857.0, 221801.0, 34058.0, 14793.0, 7824.0, 4601.0, 2894.0, 1777.0, 1149.0, 782.0, 529.0, 391.0, 234.0, 191.0, 123.0, 83.0, 76.0, 53.0, 36.0, 27.0, 21.0, 11.0, 18.0, 2.0, 7.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.003711700439453125, -0.0035951733589172363, -0.0034786462783813477, -0.003362119197845459, -0.0032455921173095703, -0.0031290650367736816, -0.003012537956237793, -0.0028960108757019043, -0.0027794837951660156, -0.002662956714630127, -0.0025464296340942383, -0.0024299025535583496, -0.002313375473022461, -0.0021968483924865723, -0.0020803213119506836, -0.001963794231414795, -0.0018472671508789062, -0.0017307400703430176, -0.001614212989807129, -0.0014976859092712402, -0.0013811588287353516, -0.0012646317481994629, -0.0011481046676635742, -0.0010315775871276855, -0.0009150505065917969, -0.0007985234260559082, -0.0006819963455200195, -0.0005654692649841309, -0.0004489421844482422, -0.0003324151039123535, -0.00021588802337646484, -9.936094284057617e-05, 1.71661376953125e-05, 0.00013369321823120117, 0.00025022029876708984, 0.0003667473793029785, 0.0004832744598388672, 0.0005998015403747559, 0.0007163286209106445, 0.0008328557014465332, 0.0009493827819824219, 0.0010659098625183105, 0.0011824369430541992, 0.0012989640235900879, 0.0014154911041259766, 0.0015320181846618652, 0.001648545265197754, 0.0017650723457336426, 0.0018815994262695312, 0.00199812650680542, 0.0021146535873413086, 0.0022311806678771973, 0.002347707748413086, 0.0024642348289489746, 0.0025807619094848633, 0.002697288990020752, 0.0028138160705566406, 0.0029303431510925293, 0.003046870231628418, 0.0031633973121643066, 0.0032799243927001953, 0.003396451473236084, 0.0035129785537719727, 0.0036295056343078613, 0.00374603271484375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 12.0, 6.0, 5.0, 12.0, 9.0, 6.0, 16.0, 23.0, 34.0, 68.0, 188.0, 335.0, 142.0, 40.0, 28.0, 10.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011920928955078125, -0.0011552423238754272, -0.001118391752243042, -0.0010815411806106567, -0.0010446906089782715, -0.0010078400373458862, -0.000970989465713501, -0.0009341388940811157, -0.0008972883224487305, -0.0008604377508163452, -0.00082358717918396, -0.0007867366075515747, -0.0007498860359191895, -0.0007130354642868042, -0.0006761848926544189, -0.0006393343210220337, -0.0006024837493896484, -0.0005656331777572632, -0.0005287826061248779, -0.0004919320344924927, -0.0004550814628601074, -0.00041823089122772217, -0.0003813803195953369, -0.00034452974796295166, -0.0003076791763305664, -0.00027082860469818115, -0.0002339780330657959, -0.00019712746143341064, -0.0001602768898010254, -0.00012342631816864014, -8.657574653625488e-05, -4.972517490386963e-05, -1.2874603271484375e-05, 2.397596836090088e-05, 6.082653999328613e-05, 9.767711162567139e-05, 0.00013452768325805664, 0.0001713782548904419, 0.00020822882652282715, 0.0002450793981552124, 0.00028192996978759766, 0.0003187805414199829, 0.00035563111305236816, 0.0003924816846847534, 0.00042933225631713867, 0.0004661828279495239, 0.0005030333995819092, 0.0005398839712142944, 0.0005767345428466797, 0.0006135851144790649, 0.0006504356861114502, 0.0006872862577438354, 0.0007241368293762207, 0.000760987401008606, 0.0007978379726409912, 0.0008346885442733765, 0.0008715391159057617, 0.000908389687538147, 0.0009452402591705322, 0.0009820908308029175, 0.0010189414024353027, 0.001055791974067688, 0.0010926425457000732, 0.0011294931173324585, 0.0011663436889648438]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 3.0, 6.0, 10.0, 9.0, 16.0, 29.0, 18.0, 28.0, 46.0, 52.0, 68.0, 91.0, 92.0, 109.0, 93.0, 78.0, 46.0, 51.0, 38.0, 29.0, 16.0, 8.0, 16.0, 13.0, 10.0, 5.0, 6.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040862008929252625, -0.03973864018917084, -0.03861527144908905, -0.03749190643429756, -0.036368537694215775, -0.03524516895413399, -0.0341218002140522, -0.03299843147397041, -0.031875066459178925, -0.030751697719097137, -0.0296283308416605, -0.028504962101578712, -0.027381595224142075, -0.026258226484060287, -0.0251348577439785, -0.024011489003896713, -0.022888120263814926, -0.02176475152373314, -0.0206413846462965, -0.019518015906214714, -0.018394649028778076, -0.01727128028869629, -0.016147911548614502, -0.01502454373985529, -0.013901175931096077, -0.012777808122336864, -0.011654440313577652, -0.010531071573495865, -0.009407703764736652, -0.00828433595597744, -0.00716096768155694, -0.00603759940713644, -0.0049142297357320786, -0.0037908616941422224, -0.0026674936525523663, -0.0015441256109625101, -0.00042075756937265396, 0.0007026102393865585, 0.0018259785138070583, 0.002949346788227558, 0.004072714596986771, 0.005196082405745983, 0.006319450680166483, 0.007442818954586983, 0.008566186763346195, 0.009689554572105408, 0.010812923312187195, 0.011936291120946407, 0.01305965892970562, 0.014183026738464832, 0.015306394547224045, 0.016429763287305832, 0.01755313202738762, 0.018676498904824257, 0.019799867644906044, 0.020923234522342682, 0.02204660326242447, 0.023169972002506256, 0.024293338879942894, 0.02541670762002468, 0.02654007449746132, 0.027663443237543106, 0.028786811977624893, 0.02991018071770668, 0.031033547595143318]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 5.0, 6.0, 7.0, 4.0, 8.0, 15.0, 15.0, 14.0, 25.0, 23.0, 16.0, 25.0, 25.0, 22.0, 33.0, 34.0, 50.0, 32.0, 33.0, 34.0, 47.0, 41.0, 47.0, 35.0, 28.0, 40.0, 38.0, 36.0, 39.0, 19.0, 27.0, 22.0, 19.0, 16.0, 9.0, 16.0, 15.0, 13.0, 12.0, 10.0, 10.0, 6.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02046930231153965, -0.019792180508375168, -0.019115058705210686, -0.018437936902046204, -0.01776081509888172, -0.01708369329571724, -0.016406573355197906, -0.015729451552033424, -0.015052329748868942, -0.01437520794570446, -0.013698086142539978, -0.013020964339375496, -0.012343843467533588, -0.011666721664369106, -0.010989599861204624, -0.010312478989362717, -0.00963535625487566, -0.008958234451711178, -0.008281112648546696, -0.007603991311043501, -0.006926869973540306, -0.006249748170375824, -0.005572626367211342, -0.004895505029708147, -0.004218383226543665, -0.0035412616562098265, -0.002864140085875988, -0.002187018282711506, -0.0015098967123776674, -0.000832775142043829, -0.00015565333887934685, 0.000521467998623848, 0.00119858980178833, 0.0018757113721221685, 0.002552832942456007, 0.003229954745620489, 0.003907076083123684, 0.004584197886288166, 0.005261319689452648, 0.005938441026955843, 0.006615562830120325, 0.007292684633284807, 0.007969805970788002, 0.008646927773952484, 0.009324049577116966, 0.010001171380281448, 0.01067829318344593, 0.011355414055287838, 0.01203253585845232, 0.012709657661616802, 0.013386779464781284, 0.014063900336623192, 0.014741022139787674, 0.015418143942952156, 0.016095265746116638, 0.01677238754928112, 0.017449509352445602, 0.018126631155610085, 0.018803752958774567, 0.01948087476193905, 0.02015799656510353, 0.020835116505622864, 0.021512240171432495, 0.022189360111951828, 0.02286648191511631]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 8.0, 14.0, 17.0, 22.0, 45.0, 53.0, 90.0, 130.0, 191.0, 283.0, 409.0, 636.0, 828.0, 1286.0, 1742.0, 2542.0, 3612.0, 5379.0, 8243.0, 12419.0, 18710.0, 28691.0, 46415.0, 76400.0, 132425.0, 266232.0, 762407.0, 1595755.0, 670490.0, 244803.0, 124872.0, 71280.0, 42325.0, 26387.0, 16707.0, 10685.0, 6965.0, 4770.0, 3127.0, 2099.0, 1447.0, 987.0, 725.0, 424.0, 361.0, 253.0, 166.0, 124.0, 105.0, 54.0, 49.0, 37.0, 24.0, 14.0, 12.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.0254364013671875, -0.024600744247436523, -0.023765087127685547, -0.02292943000793457, -0.022093772888183594, -0.021258115768432617, -0.02042245864868164, -0.019586801528930664, -0.018751144409179688, -0.01791548728942871, -0.017079830169677734, -0.016244173049926758, -0.015408515930175781, -0.014572858810424805, -0.013737201690673828, -0.012901544570922852, -0.012065887451171875, -0.011230230331420898, -0.010394573211669922, -0.009558916091918945, -0.008723258972167969, -0.007887601852416992, -0.007051944732666016, -0.006216287612915039, -0.0053806304931640625, -0.004544973373413086, -0.0037093162536621094, -0.002873659133911133, -0.0020380020141601562, -0.0012023448944091797, -0.0003666877746582031, 0.00046896934509277344, 0.00130462646484375, 0.0021402835845947266, 0.002975940704345703, 0.0038115978240966797, 0.004647254943847656, 0.005482912063598633, 0.006318569183349609, 0.007154226303100586, 0.007989883422851562, 0.008825540542602539, 0.009661197662353516, 0.010496854782104492, 0.011332511901855469, 0.012168169021606445, 0.013003826141357422, 0.013839483261108398, 0.014675140380859375, 0.015510797500610352, 0.016346454620361328, 0.017182111740112305, 0.01801776885986328, 0.018853425979614258, 0.019689083099365234, 0.02052474021911621, 0.021360397338867188, 0.022196054458618164, 0.02303171157836914, 0.023867368698120117, 0.024703025817871094, 0.02553868293762207, 0.026374340057373047, 0.027209997177124023, 0.028045654296875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 4.0, 13.0, 7.0, 14.0, 12.0, 19.0, 20.0, 20.0, 20.0, 28.0, 17.0, 28.0, 32.0, 42.0, 45.0, 42.0, 32.0, 44.0, 41.0, 55.0, 48.0, 37.0, 52.0, 24.0, 31.0, 32.0, 32.0, 19.0, 28.0, 21.0, 18.0, 16.0, 16.0, 9.0, 16.0, 14.0, 3.0, 7.0, 10.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01277923583984375, -0.012364983558654785, -0.01195073127746582, -0.011536478996276855, -0.01112222671508789, -0.010707974433898926, -0.010293722152709961, -0.009879469871520996, -0.009465217590332031, -0.009050965309143066, -0.008636713027954102, -0.008222460746765137, -0.007808208465576172, -0.007393956184387207, -0.006979703903198242, -0.006565451622009277, -0.0061511993408203125, -0.005736947059631348, -0.005322694778442383, -0.004908442497253418, -0.004494190216064453, -0.004079937934875488, -0.0036656856536865234, -0.0032514333724975586, -0.0028371810913085938, -0.002422928810119629, -0.002008676528930664, -0.0015944242477416992, -0.0011801719665527344, -0.0007659196853637695, -0.0003516674041748047, 6.258487701416016e-05, 0.000476837158203125, 0.0008910894393920898, 0.0013053417205810547, 0.0017195940017700195, 0.0021338462829589844, 0.0025480985641479492, 0.002962350845336914, 0.003376603126525879, 0.0037908554077148438, 0.004205107688903809, 0.0046193599700927734, 0.005033612251281738, 0.005447864532470703, 0.005862116813659668, 0.006276369094848633, 0.006690621376037598, 0.0071048736572265625, 0.007519125938415527, 0.007933378219604492, 0.008347630500793457, 0.008761882781982422, 0.009176135063171387, 0.009590387344360352, 0.010004639625549316, 0.010418891906738281, 0.010833144187927246, 0.011247396469116211, 0.011661648750305176, 0.01207590103149414, 0.012490153312683105, 0.01290440559387207, 0.013318657875061035, 0.01373291015625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 20.0, 14.0, 50.0, 88.0, 145.0, 238.0, 400.0, 633.0, 1102.0, 1772.0, 3121.0, 5348.0, 9649.0, 17745.0, 32924.0, 64251.0, 129825.0, 286601.0, 738803.0, 1672647.0, 698304.0, 273195.0, 125329.0, 61494.0, 31632.0, 16872.0, 9504.0, 5336.0, 2924.0, 1714.0, 1019.0, 609.0, 373.0, 251.0, 126.0, 86.0, 44.0, 27.0, 17.0, 21.0, 10.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029571533203125, -0.028713703155517578, -0.027855873107910156, -0.026998043060302734, -0.026140213012695312, -0.02528238296508789, -0.02442455291748047, -0.023566722869873047, -0.022708892822265625, -0.021851062774658203, -0.02099323272705078, -0.02013540267944336, -0.019277572631835938, -0.018419742584228516, -0.017561912536621094, -0.016704082489013672, -0.01584625244140625, -0.014988422393798828, -0.014130592346191406, -0.013272762298583984, -0.012414932250976562, -0.01155710220336914, -0.010699272155761719, -0.009841442108154297, -0.008983612060546875, -0.008125782012939453, -0.007267951965332031, -0.006410121917724609, -0.0055522918701171875, -0.004694461822509766, -0.0038366317749023438, -0.002978801727294922, -0.0021209716796875, -0.0012631416320800781, -0.00040531158447265625, 0.0004525184631347656, 0.0013103485107421875, 0.0021681785583496094, 0.0030260086059570312, 0.003883838653564453, 0.004741668701171875, 0.005599498748779297, 0.006457328796386719, 0.007315158843994141, 0.008172988891601562, 0.009030818939208984, 0.009888648986816406, 0.010746479034423828, 0.01160430908203125, 0.012462139129638672, 0.013319969177246094, 0.014177799224853516, 0.015035629272460938, 0.01589345932006836, 0.01675128936767578, 0.017609119415283203, 0.018466949462890625, 0.019324779510498047, 0.02018260955810547, 0.02104043960571289, 0.021898269653320312, 0.022756099700927734, 0.023613929748535156, 0.024471759796142578, 0.02532958984375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 7.0, 7.0, 2.0, 8.0, 15.0, 15.0, 15.0, 24.0, 20.0, 38.0, 39.0, 49.0, 65.0, 72.0, 86.0, 86.0, 120.0, 128.0, 145.0, 169.0, 207.0, 239.0, 264.0, 282.0, 281.0, 242.0, 205.0, 168.0, 183.0, 162.0, 121.0, 117.0, 85.0, 78.0, 71.0, 72.0, 33.0, 32.0, 36.0, 18.0, 19.0, 9.0, 17.0, 6.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006679534912109375, -0.006461977958679199, -0.0062444210052490234, -0.006026864051818848, -0.005809307098388672, -0.005591750144958496, -0.00537419319152832, -0.0051566362380981445, -0.004939079284667969, -0.004721522331237793, -0.004503965377807617, -0.004286408424377441, -0.004068851470947266, -0.00385129451751709, -0.003633737564086914, -0.0034161806106567383, -0.0031986236572265625, -0.0029810667037963867, -0.002763509750366211, -0.002545952796936035, -0.0023283958435058594, -0.0021108388900756836, -0.0018932819366455078, -0.001675724983215332, -0.0014581680297851562, -0.0012406110763549805, -0.0010230541229248047, -0.0008054971694946289, -0.0005879402160644531, -0.00037038326263427734, -0.00015282630920410156, 6.473064422607422e-05, 0.00028228759765625, 0.0004998445510864258, 0.0007174015045166016, 0.0009349584579467773, 0.0011525154113769531, 0.001370072364807129, 0.0015876293182373047, 0.0018051862716674805, 0.0020227432250976562, 0.002240300178527832, 0.002457857131958008, 0.0026754140853881836, 0.0028929710388183594, 0.003110527992248535, 0.003328084945678711, 0.0035456418991088867, 0.0037631988525390625, 0.003980755805969238, 0.004198312759399414, 0.00441586971282959, 0.004633426666259766, 0.004850983619689941, 0.005068540573120117, 0.005286097526550293, 0.005503654479980469, 0.0057212114334106445, 0.00593876838684082, 0.006156325340270996, 0.006373882293701172, 0.006591439247131348, 0.0068089962005615234, 0.007026553153991699, 0.007244110107421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 3.0, 9.0, 22.0, 16.0, 23.0, 32.0, 44.0, 41.0, 57.0, 74.0, 93.0, 88.0, 76.0, 73.0, 60.0, 70.0, 40.0, 45.0, 22.0, 16.0, 20.0, 14.0, 9.0, 10.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.023661727085709572, -0.02301955223083496, -0.0223773792386055, -0.02173520438373089, -0.021093031391501427, -0.020450856536626816, -0.019808683544397354, -0.019166508689522743, -0.018524333834648132, -0.01788215897977352, -0.01723998598754406, -0.01659781113266945, -0.015955638140439987, -0.015313463285565376, -0.01467128936201334, -0.014029115438461304, -0.013386942446231842, -0.012744768522679806, -0.01210259459912777, -0.011460420675575733, -0.010818246752023697, -0.010176071897149086, -0.00953389797359705, -0.008891724050045013, -0.008249550126492977, -0.007607376202940941, -0.006965202279388905, -0.006323027890175581, -0.005680853966623545, -0.005038680043071508, -0.004396505653858185, -0.0037543317303061485, -0.003112155944108963, -0.0024699820205569267, -0.0018278078641742468, -0.0011856338242068887, -0.0005434597842395306, 9.871413931250572e-05, 0.0007408882956951857, 0.0013830624520778656, 0.002025236375629902, 0.002667410299181938, 0.003309584455564618, 0.003951758611947298, 0.004593932535499334, 0.005236106459051371, 0.005878280848264694, 0.0065204547718167305, 0.007162628695368767, 0.007804802618920803, 0.00844697654247284, 0.009089150466024876, 0.009731324389576912, 0.010373499244451523, 0.011015673168003559, 0.011657847091555595, 0.012300021015107632, 0.012942194938659668, 0.013584368862211704, 0.01422654278576374, 0.014868717640638351, 0.015510890632867813, 0.016153065487742424, 0.016795240342617035, 0.017437413334846497]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 7.0, 8.0, 10.0, 15.0, 14.0, 17.0, 22.0, 29.0, 14.0, 36.0, 36.0, 34.0, 37.0, 31.0, 43.0, 40.0, 46.0, 51.0, 57.0, 40.0, 57.0, 42.0, 40.0, 37.0, 37.0, 18.0, 24.0, 20.0, 18.0, 16.0, 10.0, 19.0, 14.0, 6.0, 7.0, 9.0, 8.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015637991949915886, -0.015152214094996452, -0.014666437171399593, -0.01418065931648016, -0.0136948823928833, -0.013209104537963867, -0.012723326683044434, -0.012237548828125, -0.011751771904528141, -0.011265994049608707, -0.010780217126011848, -0.010294439271092415, -0.009808661416172981, -0.009322884492576122, -0.008837106637656689, -0.00835132971405983, -0.007865551859140396, -0.00737977446988225, -0.0068939970806241035, -0.00640821922570467, -0.005922441836446524, -0.005436664447188377, -0.004950886592268944, -0.0044651092030107975, -0.003979331813752651, -0.003493554424494505, -0.003007776802405715, -0.002521999180316925, -0.0020362217910587788, -0.0015504444018006325, -0.0010646667797118425, -0.0005788891576230526, -9.311269968748093e-05, 0.0003926648059859872, 0.0008784423116594553, 0.0013642198173329234, 0.0018499973230063915, 0.002335774712264538, 0.0028215523343533278, 0.0033073299564421177, 0.003793107345700264, 0.00427888473495841, 0.0047646621242165565, 0.00525043997913599, 0.005736217368394136, 0.006221994757652283, 0.006707772612571716, 0.007193550001829863, 0.007679327391088009, 0.008165105246007442, 0.008650882169604301, 0.009136660024523735, 0.009622437879443169, 0.010108214803040028, 0.010593992657959461, 0.01107976958155632, 0.011565547436475754, 0.012051325291395187, 0.012537102214992046, 0.01302288006991148, 0.013508656993508339, 0.013994434848427773, 0.014480212703347206, 0.01496599055826664, 0.015451767481863499]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 18.0, 22.0, 29.0, 42.0, 77.0, 105.0, 127.0, 226.0, 309.0, 424.0, 693.0, 974.0, 1588.0, 2529.0, 4034.0, 6677.0, 11440.0, 20573.0, 37125.0, 71289.0, 150744.0, 327956.0, 209353.0, 93922.0, 47184.0, 25204.0, 14202.0, 8137.0, 4930.0, 3003.0, 1889.0, 1224.0, 833.0, 530.0, 352.0, 258.0, 155.0, 115.0, 72.0, 40.0, 40.0, 28.0, 20.0, 9.0, 10.0, 5.0, 8.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00893402099609375, -0.008642911911010742, -0.008351802825927734, -0.008060693740844727, -0.007769584655761719, -0.007478475570678711, -0.007187366485595703, -0.006896257400512695, -0.0066051483154296875, -0.00631403923034668, -0.006022930145263672, -0.005731821060180664, -0.005440711975097656, -0.0051496028900146484, -0.004858493804931641, -0.004567384719848633, -0.004276275634765625, -0.003985166549682617, -0.0036940574645996094, -0.0034029483795166016, -0.0031118392944335938, -0.002820730209350586, -0.002529621124267578, -0.0022385120391845703, -0.0019474029541015625, -0.0016562938690185547, -0.0013651847839355469, -0.001074075698852539, -0.0007829666137695312, -0.0004918575286865234, -0.00020074844360351562, 9.036064147949219e-05, 0.0003814697265625, 0.0006725788116455078, 0.0009636878967285156, 0.0012547969818115234, 0.0015459060668945312, 0.001837015151977539, 0.002128124237060547, 0.0024192333221435547, 0.0027103424072265625, 0.0030014514923095703, 0.003292560577392578, 0.003583669662475586, 0.0038747787475585938, 0.0041658878326416016, 0.004456996917724609, 0.004748106002807617, 0.005039215087890625, 0.005330324172973633, 0.005621433258056641, 0.0059125423431396484, 0.006203651428222656, 0.006494760513305664, 0.006785869598388672, 0.00707697868347168, 0.0073680877685546875, 0.007659196853637695, 0.007950305938720703, 0.008241415023803711, 0.008532524108886719, 0.008823633193969727, 0.009114742279052734, 0.009405851364135742, 0.00969696044921875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 5.0, 4.0, 10.0, 10.0, 7.0, 8.0, 16.0, 19.0, 25.0, 25.0, 18.0, 35.0, 25.0, 28.0, 40.0, 33.0, 52.0, 32.0, 46.0, 56.0, 46.0, 45.0, 49.0, 50.0, 47.0, 38.0, 35.0, 28.0, 21.0, 28.0, 14.0, 22.0, 19.0, 9.0, 10.0, 14.0, 4.0, 7.0, 8.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01540374755859375, -0.01490175724029541, -0.01439976692199707, -0.01389777660369873, -0.01339578628540039, -0.01289379596710205, -0.012391805648803711, -0.011889815330505371, -0.011387825012207031, -0.010885834693908691, -0.010383844375610352, -0.009881854057312012, -0.009379863739013672, -0.008877873420715332, -0.008375883102416992, -0.007873892784118652, -0.0073719024658203125, -0.006869912147521973, -0.006367921829223633, -0.005865931510925293, -0.005363941192626953, -0.004861950874328613, -0.0043599605560302734, -0.0038579702377319336, -0.0033559799194335938, -0.002853989601135254, -0.002351999282836914, -0.0018500089645385742, -0.0013480186462402344, -0.0008460283279418945, -0.0003440380096435547, 0.00015795230865478516, 0.000659942626953125, 0.0011619329452514648, 0.0016639232635498047, 0.0021659135818481445, 0.0026679039001464844, 0.0031698942184448242, 0.003671884536743164, 0.004173874855041504, 0.004675865173339844, 0.005177855491638184, 0.0056798458099365234, 0.006181836128234863, 0.006683826446533203, 0.007185816764831543, 0.007687807083129883, 0.008189797401428223, 0.008691787719726562, 0.009193778038024902, 0.009695768356323242, 0.010197758674621582, 0.010699748992919922, 0.011201739311218262, 0.011703729629516602, 0.012205719947814941, 0.012707710266113281, 0.013209700584411621, 0.013711690902709961, 0.0142136812210083, 0.01471567153930664, 0.01521766185760498, 0.01571965217590332, 0.01622164249420166, 0.0167236328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 8.0, 14.0, 18.0, 24.0, 48.0, 63.0, 104.0, 132.0, 195.0, 282.0, 371.0, 556.0, 713.0, 1023.0, 1461.0, 2005.0, 2997.0, 4605.0, 7154.0, 12628.0, 26092.0, 67423.0, 271556.0, 473980.0, 99418.0, 34335.0, 15883.0, 8733.0, 5445.0, 3529.0, 2356.0, 1561.0, 1124.0, 779.0, 583.0, 392.0, 273.0, 203.0, 130.0, 96.0, 69.0, 52.0, 41.0, 23.0, 25.0, 19.0, 8.0, 12.0, 7.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.014678955078125, -0.014249324798583984, -0.013819694519042969, -0.013390064239501953, -0.012960433959960938, -0.012530803680419922, -0.012101173400878906, -0.01167154312133789, -0.011241912841796875, -0.01081228256225586, -0.010382652282714844, -0.009953022003173828, -0.009523391723632812, -0.009093761444091797, -0.008664131164550781, -0.008234500885009766, -0.00780487060546875, -0.007375240325927734, -0.006945610046386719, -0.006515979766845703, -0.0060863494873046875, -0.005656719207763672, -0.005227088928222656, -0.004797458648681641, -0.004367828369140625, -0.003938198089599609, -0.0035085678100585938, -0.003078937530517578, -0.0026493072509765625, -0.002219676971435547, -0.0017900466918945312, -0.0013604164123535156, -0.0009307861328125, -0.0005011558532714844, -7.152557373046875e-05, 0.0003581047058105469, 0.0007877349853515625, 0.0012173652648925781, 0.0016469955444335938, 0.0020766258239746094, 0.002506256103515625, 0.0029358863830566406, 0.0033655166625976562, 0.003795146942138672, 0.0042247772216796875, 0.004654407501220703, 0.005084037780761719, 0.005513668060302734, 0.00594329833984375, 0.006372928619384766, 0.006802558898925781, 0.007232189178466797, 0.0076618194580078125, 0.008091449737548828, 0.008521080017089844, 0.00895071029663086, 0.009380340576171875, 0.00980997085571289, 0.010239601135253906, 0.010669231414794922, 0.011098861694335938, 0.011528491973876953, 0.011958122253417969, 0.012387752532958984, 0.0128173828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 2.0, 1.0, 7.0, 6.0, 10.0, 11.0, 8.0, 14.0, 19.0, 17.0, 27.0, 29.0, 26.0, 28.0, 30.0, 30.0, 37.0, 40.0, 39.0, 34.0, 39.0, 43.0, 37.0, 35.0, 43.0, 27.0, 54.0, 40.0, 34.0, 29.0, 42.0, 27.0, 19.0, 25.0, 21.0, 7.0, 12.0, 12.0, 8.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01012420654296875, -0.009817838668823242, -0.009511470794677734, -0.009205102920532227, -0.008898735046386719, -0.008592367172241211, -0.008285999298095703, -0.007979631423950195, -0.0076732635498046875, -0.00736689567565918, -0.007060527801513672, -0.006754159927368164, -0.006447792053222656, -0.0061414241790771484, -0.005835056304931641, -0.005528688430786133, -0.005222320556640625, -0.004915952682495117, -0.004609584808349609, -0.0043032169342041016, -0.003996849060058594, -0.003690481185913086, -0.003384113311767578, -0.0030777454376220703, -0.0027713775634765625, -0.0024650096893310547, -0.002158641815185547, -0.001852273941040039, -0.0015459060668945312, -0.0012395381927490234, -0.0009331703186035156, -0.0006268024444580078, -0.0003204345703125, -1.4066696166992188e-05, 0.0002923011779785156, 0.0005986690521240234, 0.0009050369262695312, 0.001211404800415039, 0.0015177726745605469, 0.0018241405487060547, 0.0021305084228515625, 0.0024368762969970703, 0.002743244171142578, 0.003049612045288086, 0.0033559799194335938, 0.0036623477935791016, 0.003968715667724609, 0.004275083541870117, 0.004581451416015625, 0.004887819290161133, 0.005194187164306641, 0.0055005550384521484, 0.005806922912597656, 0.006113290786743164, 0.006419658660888672, 0.00672602653503418, 0.0070323944091796875, 0.007338762283325195, 0.007645130157470703, 0.007951498031616211, 0.008257865905761719, 0.008564233779907227, 0.008870601654052734, 0.009176969528198242, 0.00948333740234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 0.0, 2.0, 4.0, 8.0, 7.0, 8.0, 10.0, 28.0, 17.0, 29.0, 44.0, 69.0, 67.0, 119.0, 146.0, 202.0, 279.0, 431.0, 555.0, 757.0, 1145.0, 1829.0, 2685.0, 4278.0, 7445.0, 14931.0, 37722.0, 193807.0, 663717.0, 69931.0, 22201.0, 10179.0, 5726.0, 3336.0, 2176.0, 1390.0, 929.0, 648.0, 451.0, 334.0, 232.0, 170.0, 132.0, 97.0, 79.0, 52.0, 46.0, 35.0, 22.0, 19.0, 6.0, 8.0, 4.0, 10.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010431557893753052, -0.0010086596012115479, -0.0009741634130477905, -0.0009396672248840332, -0.0009051710367202759, -0.0008706748485565186, -0.0008361786603927612, -0.0008016824722290039, -0.0007671862840652466, -0.0007326900959014893, -0.0006981939077377319, -0.0006636977195739746, -0.0006292015314102173, -0.00059470534324646, -0.0005602091550827026, -0.0005257129669189453, -0.000491216778755188, -0.00045672059059143066, -0.00042222440242767334, -0.000387728214263916, -0.0003532320261001587, -0.00031873583793640137, -0.00028423964977264404, -0.0002497434616088867, -0.0002152472734451294, -0.00018075108528137207, -0.00014625489711761475, -0.00011175870895385742, -7.72625207901001e-05, -4.2766332626342773e-05, -8.27014446258545e-06, 2.6226043701171875e-05, 6.07222318649292e-05, 9.521842002868652e-05, 0.00012971460819244385, 0.00016421079635620117, 0.0001987069845199585, 0.00023320317268371582, 0.00026769936084747314, 0.00030219554901123047, 0.0003366917371749878, 0.0003711879253387451, 0.00040568411350250244, 0.00044018030166625977, 0.0004746764898300171, 0.0005091726779937744, 0.0005436688661575317, 0.0005781650543212891, 0.0006126612424850464, 0.0006471574306488037, 0.000681653618812561, 0.0007161498069763184, 0.0007506459951400757, 0.000785142183303833, 0.0008196383714675903, 0.0008541345596313477, 0.000888630747795105, 0.0009231269359588623, 0.0009576231241226196, 0.000992119312286377, 0.0010266155004501343, 0.0010611116886138916, 0.001095607876777649, 0.0011301040649414062]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 21.0, 0.0, 19.0, 0.0, 0.0, 28.0, 0.0, 43.0, 0.0, 60.0, 0.0, 68.0, 0.0, 0.0, 86.0, 0.0, 108.0, 0.0, 115.0, 0.0, 0.0, 111.0, 0.0, 80.0, 0.0, 77.0, 0.0, 66.0, 0.0, 0.0, 50.0, 0.0, 28.0, 0.0, 19.0, 0.0, 0.0, 11.0, 0.0, 8.0, 0.0, 7.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.487833499908447e-07, -7.227063179016113e-07, -6.966292858123779e-07, -6.705522537231445e-07, -6.444752216339111e-07, -6.183981895446777e-07, -5.923211574554443e-07, -5.662441253662109e-07, -5.401670932769775e-07, -5.140900611877441e-07, -4.880130290985107e-07, -4.6193599700927734e-07, -4.3585896492004395e-07, -4.0978193283081055e-07, -3.8370490074157715e-07, -3.5762786865234375e-07, -3.3155083656311035e-07, -3.0547380447387695e-07, -2.7939677238464355e-07, -2.5331974029541016e-07, -2.2724270820617676e-07, -2.0116567611694336e-07, -1.7508864402770996e-07, -1.4901161193847656e-07, -1.2293457984924316e-07, -9.685754776000977e-08, -7.078051567077637e-08, -4.470348358154297e-08, -1.862645149230957e-08, 7.450580596923828e-09, 3.3527612686157227e-08, 5.960464477539063e-08, 8.568167686462402e-08, 1.1175870895385742e-07, 1.3783574104309082e-07, 1.6391277313232422e-07, 1.8998980522155762e-07, 2.1606683731079102e-07, 2.421438694000244e-07, 2.682209014892578e-07, 2.942979335784912e-07, 3.203749656677246e-07, 3.46451997756958e-07, 3.725290298461914e-07, 3.986060619354248e-07, 4.246830940246582e-07, 4.507601261138916e-07, 4.76837158203125e-07, 5.029141902923584e-07, 5.289912223815918e-07, 5.550682544708252e-07, 5.811452865600586e-07, 6.07222318649292e-07, 6.332993507385254e-07, 6.593763828277588e-07, 6.854534149169922e-07, 7.115304470062256e-07, 7.37607479095459e-07, 7.636845111846924e-07, 7.897615432739258e-07, 8.158385753631592e-07, 8.419156074523926e-07, 8.67992639541626e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 14.0, 15.0, 32.0, 42.0, 60.0, 91.0, 153.0, 193.0, 257.0, 403.0, 565.0, 836.0, 1218.0, 1833.0, 2491.0, 3901.0, 5678.0, 8738.0, 13669.0, 21353.0, 35306.0, 63579.0, 145886.0, 406407.0, 164931.0, 68608.0, 37588.0, 22606.0, 14266.0, 9194.0, 6109.0, 3942.0, 2656.0, 1843.0, 1279.0, 885.0, 623.0, 388.0, 288.0, 187.0, 141.0, 95.0, 49.0, 44.0, 29.0, 21.0, 15.0, 12.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.0007677078247070312, -0.0007441267371177673, -0.0007205456495285034, -0.0006969645619392395, -0.0006733834743499756, -0.0006498023867607117, -0.0006262212991714478, -0.0006026402115821838, -0.0005790591239929199, -0.000555478036403656, -0.0005318969488143921, -0.0005083158612251282, -0.00048473477363586426, -0.00046115368604660034, -0.0004375725984573364, -0.0004139915108680725, -0.0003904104232788086, -0.0003668293356895447, -0.00034324824810028076, -0.00031966716051101685, -0.00029608607292175293, -0.000272504985332489, -0.0002489238977432251, -0.00022534281015396118, -0.00020176172256469727, -0.00017818063497543335, -0.00015459954738616943, -0.00013101845979690552, -0.0001074373722076416, -8.385628461837769e-05, -6.027519702911377e-05, -3.6694109439849854e-05, -1.3113021850585938e-05, 1.0468065738677979e-05, 3.4049153327941895e-05, 5.763024091720581e-05, 8.121132850646973e-05, 0.00010479241609573364, 0.00012837350368499756, 0.00015195459127426147, 0.0001755356788635254, 0.0001991167664527893, 0.00022269785404205322, 0.00024627894163131714, 0.00026986002922058105, 0.00029344111680984497, 0.0003170222043991089, 0.0003406032919883728, 0.0003641843795776367, 0.00038776546716690063, 0.00041134655475616455, 0.00043492764234542847, 0.0004585087299346924, 0.0004820898175239563, 0.0005056709051132202, 0.0005292519927024841, 0.000552833080291748, 0.000576414167881012, 0.0005999952554702759, 0.0006235763430595398, 0.0006471574306488037, 0.0006707385182380676, 0.0006943196058273315, 0.0007179006934165955, 0.0007414817810058594]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 7.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 17.0, 14.0, 16.0, 30.0, 41.0, 37.0, 69.0, 84.0, 137.0, 157.0, 106.0, 55.0, 59.0, 45.0, 24.0, 18.0, 17.0, 17.0, 8.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00036716461181640625, -0.00035753101110458374, -0.00034789741039276123, -0.0003382638096809387, -0.0003286302089691162, -0.0003189966082572937, -0.0003093630075454712, -0.0002997294068336487, -0.00029009580612182617, -0.00028046220541000366, -0.00027082860469818115, -0.00026119500398635864, -0.00025156140327453613, -0.00024192780256271362, -0.0002322942018508911, -0.0002226606011390686, -0.0002130270004272461, -0.00020339339971542358, -0.00019375979900360107, -0.00018412619829177856, -0.00017449259757995605, -0.00016485899686813354, -0.00015522539615631104, -0.00014559179544448853, -0.00013595819473266602, -0.0001263245940208435, -0.000116690993309021, -0.00010705739259719849, -9.742379188537598e-05, -8.779019117355347e-05, -7.815659046173096e-05, -6.852298974990845e-05, -5.888938903808594e-05, -4.925578832626343e-05, -3.962218761444092e-05, -2.9988586902618408e-05, -2.03549861907959e-05, -1.0721385478973389e-05, -1.087784767150879e-06, 8.545815944671631e-06, 1.817941665649414e-05, 2.781301736831665e-05, 3.744661808013916e-05, 4.708021879196167e-05, 5.671381950378418e-05, 6.634742021560669e-05, 7.59810209274292e-05, 8.561462163925171e-05, 9.524822235107422e-05, 0.00010488182306289673, 0.00011451542377471924, 0.00012414902448654175, 0.00013378262519836426, 0.00014341622591018677, 0.00015304982662200928, 0.0001626834273338318, 0.0001723170280456543, 0.0001819506287574768, 0.00019158422946929932, 0.00020121783018112183, 0.00021085143089294434, 0.00022048503160476685, 0.00023011863231658936, 0.00023975223302841187, 0.0002493858337402344]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 4.0, 7.0, 14.0, 27.0, 13.0, 29.0, 33.0, 52.0, 40.0, 82.0, 90.0, 83.0, 83.0, 83.0, 61.0, 66.0, 44.0, 42.0, 33.0, 16.0, 16.0, 17.0, 12.0, 9.0, 11.0, 5.0, 1.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.024028152227401733, -0.023382341489195824, -0.022736530750989914, -0.022090718150138855, -0.021444907411932945, -0.020799096673727036, -0.020153285935521126, -0.019507475197315216, -0.018861662596464157, -0.018215851858258247, -0.017570041120052338, -0.01692422851920128, -0.01627841778099537, -0.01563260704278946, -0.01498679630458355, -0.01434098556637764, -0.01369517482817173, -0.01304936408996582, -0.012403552420437336, -0.011757741682231426, -0.011111930012702942, -0.010466119274497032, -0.009820308536291122, -0.009174497798085213, -0.008528686128556728, -0.007882875390350819, -0.007237063720822334, -0.0065912529826164246, -0.0059454417787492275, -0.0052996305748820305, -0.004653819836676121, -0.004008008632808924, -0.0033621974289417267, -0.0027163862250745296, -0.0020705752540379763, -0.001424764166586101, -0.0007789530791342258, -0.0001331418752670288, 0.0005126690957695246, 0.001158480066806078, 0.001804291270673275, 0.002450102474540472, 0.0030959134455770254, 0.003741724416613579, 0.004387535620480776, 0.005033346824347973, 0.005679157562553883, 0.00632496876642108, 0.006970779970288277, 0.007616591174155474, 0.00826240237802267, 0.00890821311622858, 0.009554024785757065, 0.010199835523962975, 0.010845646262168884, 0.011491457000374794, 0.012137268669903278, 0.012783079408109188, 0.013428891077637672, 0.014074701815843582, 0.014720512554049492, 0.015366324223577976, 0.01601213589310646, 0.01665794663131237, 0.01730375736951828]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 8.0, 10.0, 9.0, 11.0, 16.0, 16.0, 29.0, 20.0, 25.0, 34.0, 33.0, 32.0, 35.0, 40.0, 39.0, 45.0, 41.0, 49.0, 57.0, 49.0, 47.0, 43.0, 43.0, 36.0, 33.0, 22.0, 22.0, 20.0, 17.0, 17.0, 8.0, 19.0, 14.0, 6.0, 8.0, 10.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015455709770321846, -0.014975931495428085, -0.014496153220534325, -0.014016374945640564, -0.013536596670746803, -0.013056818395853043, -0.012577040120959282, -0.012097261846065521, -0.01161748357117176, -0.011137705296278, -0.01065792702138424, -0.010178148746490479, -0.009698370471596718, -0.009218592196702957, -0.008738813921809196, -0.008259035646915436, -0.00777925830334425, -0.007299480028450489, -0.006819701753556728, -0.006339923478662968, -0.005860145203769207, -0.005380366928875446, -0.004900589119642973, -0.004420810844749212, -0.003941032569855452, -0.003461254294961691, -0.0029814760200679302, -0.002501697978004813, -0.0020219197031110525, -0.0015421414282172918, -0.0010623633861541748, -0.0005825851112604141, -0.00010280683636665344, 0.0003769713803194463, 0.0008567495970055461, 0.001336527755483985, 0.0018163060303777456, 0.0022960843052715063, 0.0027758623473346233, 0.003255640622228384, 0.0037354188971221447, 0.004215197172015905, 0.004694975446909666, 0.0051747532561421394, 0.0056545315310359, 0.006134309805929661, 0.0066140880808234215, 0.007093866355717182, 0.007573644630610943, 0.008053422905504704, 0.008533201180398464, 0.009012979455292225, 0.009492757730185986, 0.009972536005079746, 0.010452313348650932, 0.010932091623544693, 0.011411869898438454, 0.011891648173332214, 0.012371426448225975, 0.012851204723119736, 0.013330982998013496, 0.013810761272907257, 0.014290539547801018, 0.014770317822694778, 0.015250096097588539]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 7.0, 7.0, 12.0, 23.0, 34.0, 45.0, 64.0, 103.0, 136.0, 223.0, 374.0, 514.0, 767.0, 1219.0, 1783.0, 2820.0, 4362.0, 6645.0, 10504.0, 16472.0, 27149.0, 45531.0, 80728.0, 160233.0, 297655.0, 177441.0, 86907.0, 48746.0, 28811.0, 17849.0, 11047.0, 7048.0, 4554.0, 2961.0, 1988.0, 1300.0, 881.0, 565.0, 375.0, 232.0, 146.0, 102.0, 69.0, 38.0, 39.0, 23.0, 10.0, 6.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0271453857421875, -0.02625727653503418, -0.02536916732788086, -0.02448105812072754, -0.02359294891357422, -0.0227048397064209, -0.021816730499267578, -0.020928621292114258, -0.020040512084960938, -0.019152402877807617, -0.018264293670654297, -0.017376184463500977, -0.016488075256347656, -0.015599966049194336, -0.014711856842041016, -0.013823747634887695, -0.012935638427734375, -0.012047529220581055, -0.011159420013427734, -0.010271310806274414, -0.009383201599121094, -0.008495092391967773, -0.007606983184814453, -0.006718873977661133, -0.0058307647705078125, -0.004942655563354492, -0.004054546356201172, -0.0031664371490478516, -0.0022783279418945312, -0.001390218734741211, -0.0005021095275878906, 0.0003859996795654297, 0.00127410888671875, 0.0021622180938720703, 0.0030503273010253906, 0.003938436508178711, 0.004826545715332031, 0.0057146549224853516, 0.006602764129638672, 0.007490873336791992, 0.008378982543945312, 0.009267091751098633, 0.010155200958251953, 0.011043310165405273, 0.011931419372558594, 0.012819528579711914, 0.013707637786865234, 0.014595746994018555, 0.015483856201171875, 0.016371965408325195, 0.017260074615478516, 0.018148183822631836, 0.019036293029785156, 0.019924402236938477, 0.020812511444091797, 0.021700620651245117, 0.022588729858398438, 0.023476839065551758, 0.024364948272705078, 0.0252530574798584, 0.02614116668701172, 0.02702927589416504, 0.02791738510131836, 0.02880549430847168, 0.029693603515625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 8.0, 5.0, 7.0, 5.0, 6.0, 15.0, 12.0, 14.0, 15.0, 23.0, 26.0, 28.0, 32.0, 30.0, 28.0, 31.0, 41.0, 38.0, 45.0, 49.0, 49.0, 52.0, 57.0, 41.0, 45.0, 44.0, 26.0, 41.0, 35.0, 27.0, 18.0, 15.0, 17.0, 12.0, 12.0, 18.0, 8.0, 12.0, 5.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0123748779296875, -0.011954307556152344, -0.011533737182617188, -0.011113166809082031, -0.010692596435546875, -0.010272026062011719, -0.009851455688476562, -0.009430885314941406, -0.00901031494140625, -0.008589744567871094, -0.008169174194335938, -0.007748603820800781, -0.007328033447265625, -0.006907463073730469, -0.0064868927001953125, -0.006066322326660156, -0.005645751953125, -0.005225181579589844, -0.0048046112060546875, -0.004384040832519531, -0.003963470458984375, -0.0035429000854492188, -0.0031223297119140625, -0.0027017593383789062, -0.00228118896484375, -0.0018606185913085938, -0.0014400482177734375, -0.0010194778442382812, -0.000598907470703125, -0.00017833709716796875, 0.0002422332763671875, 0.0006628036499023438, 0.0010833740234375, 0.0015039443969726562, 0.0019245147705078125, 0.0023450851440429688, 0.002765655517578125, 0.0031862258911132812, 0.0036067962646484375, 0.004027366638183594, 0.00444793701171875, 0.004868507385253906, 0.0052890777587890625, 0.005709648132324219, 0.006130218505859375, 0.006550788879394531, 0.0069713592529296875, 0.007391929626464844, 0.0078125, 0.008233070373535156, 0.008653640747070312, 0.009074211120605469, 0.009494781494140625, 0.009915351867675781, 0.010335922241210938, 0.010756492614746094, 0.01117706298828125, 0.011597633361816406, 0.012018203735351562, 0.012438774108886719, 0.012859344482421875, 0.013279914855957031, 0.013700485229492188, 0.014121055603027344, 0.0145416259765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 1.0, 6.0, 13.0, 22.0, 15.0, 41.0, 52.0, 70.0, 92.0, 148.0, 203.0, 332.0, 460.0, 722.0, 1065.0, 1574.0, 2197.0, 3375.0, 5242.0, 7933.0, 12618.0, 19441.0, 31504.0, 52790.0, 92689.0, 179467.0, 270942.0, 155927.0, 82878.0, 47490.0, 28375.0, 17702.0, 11472.0, 7301.0, 4804.0, 3124.0, 2091.0, 1436.0, 880.0, 609.0, 454.0, 297.0, 245.0, 152.0, 116.0, 67.0, 48.0, 33.0, 17.0, 9.0, 9.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0247955322265625, -0.023979902267456055, -0.02316427230834961, -0.022348642349243164, -0.02153301239013672, -0.020717382431030273, -0.019901752471923828, -0.019086122512817383, -0.018270492553710938, -0.017454862594604492, -0.016639232635498047, -0.0158236026763916, -0.015007972717285156, -0.014192342758178711, -0.013376712799072266, -0.01256108283996582, -0.011745452880859375, -0.01092982292175293, -0.010114192962646484, -0.009298563003540039, -0.008482933044433594, -0.0076673030853271484, -0.006851673126220703, -0.006036043167114258, -0.0052204132080078125, -0.004404783248901367, -0.003589153289794922, -0.0027735233306884766, -0.0019578933715820312, -0.001142263412475586, -0.0003266334533691406, 0.0004889965057373047, 0.00130462646484375, 0.0021202564239501953, 0.0029358863830566406, 0.003751516342163086, 0.004567146301269531, 0.0053827762603759766, 0.006198406219482422, 0.007014036178588867, 0.007829666137695312, 0.008645296096801758, 0.009460926055908203, 0.010276556015014648, 0.011092185974121094, 0.011907815933227539, 0.012723445892333984, 0.01353907585144043, 0.014354705810546875, 0.01517033576965332, 0.015985965728759766, 0.01680159568786621, 0.017617225646972656, 0.0184328556060791, 0.019248485565185547, 0.020064115524291992, 0.020879745483398438, 0.021695375442504883, 0.022511005401611328, 0.023326635360717773, 0.02414226531982422, 0.024957895278930664, 0.02577352523803711, 0.026589155197143555, 0.02740478515625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 12.0, 7.0, 15.0, 19.0, 14.0, 26.0, 18.0, 20.0, 23.0, 26.0, 24.0, 27.0, 32.0, 40.0, 39.0, 37.0, 48.0, 42.0, 29.0, 41.0, 36.0, 38.0, 41.0, 40.0, 33.0, 45.0, 18.0, 24.0, 20.0, 21.0, 21.0, 15.0, 20.0, 18.0, 13.0, 6.0, 10.0, 7.0, 4.0, 2.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00785064697265625, -0.007609844207763672, -0.007369041442871094, -0.007128238677978516, -0.0068874359130859375, -0.006646633148193359, -0.006405830383300781, -0.006165027618408203, -0.005924224853515625, -0.005683422088623047, -0.005442619323730469, -0.005201816558837891, -0.0049610137939453125, -0.004720211029052734, -0.004479408264160156, -0.004238605499267578, -0.003997802734375, -0.003756999969482422, -0.0035161972045898438, -0.0032753944396972656, -0.0030345916748046875, -0.0027937889099121094, -0.0025529861450195312, -0.002312183380126953, -0.002071380615234375, -0.0018305778503417969, -0.0015897750854492188, -0.0013489723205566406, -0.0011081695556640625, -0.0008673667907714844, -0.0006265640258789062, -0.0003857612609863281, -0.00014495849609375, 9.584426879882812e-05, 0.00033664703369140625, 0.0005774497985839844, 0.0008182525634765625, 0.0010590553283691406, 0.0012998580932617188, 0.0015406608581542969, 0.001781463623046875, 0.002022266387939453, 0.0022630691528320312, 0.0025038719177246094, 0.0027446746826171875, 0.0029854774475097656, 0.0032262802124023438, 0.003467082977294922, 0.0037078857421875, 0.003948688507080078, 0.004189491271972656, 0.004430294036865234, 0.0046710968017578125, 0.004911899566650391, 0.005152702331542969, 0.005393505096435547, 0.005634307861328125, 0.005875110626220703, 0.006115913391113281, 0.006356716156005859, 0.0065975189208984375, 0.006838321685791016, 0.007079124450683594, 0.007319927215576172, 0.00756072998046875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 8.0, 8.0, 15.0, 7.0, 20.0, 19.0, 27.0, 54.0, 72.0, 105.0, 138.0, 181.0, 252.0, 379.0, 512.0, 678.0, 972.0, 1438.0, 2384.0, 3976.0, 7441.0, 22781.0, 899779.0, 80099.0, 12595.0, 5513.0, 3028.0, 1849.0, 1250.0, 844.0, 608.0, 438.0, 322.0, 208.0, 142.0, 118.0, 82.0, 58.0, 44.0, 35.0, 16.0, 16.0, 15.0, 6.0, 8.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0038089752197265625, -0.003685206174850464, -0.0035614371299743652, -0.0034376680850982666, -0.003313899040222168, -0.0031901299953460693, -0.0030663609504699707, -0.002942591905593872, -0.0028188228607177734, -0.002695053815841675, -0.002571284770965576, -0.0024475157260894775, -0.002323746681213379, -0.0021999776363372803, -0.0020762085914611816, -0.001952439546585083, -0.0018286705017089844, -0.0017049014568328857, -0.0015811324119567871, -0.0014573633670806885, -0.0013335943222045898, -0.0012098252773284912, -0.0010860562324523926, -0.0009622871875762939, -0.0008385181427001953, -0.0007147490978240967, -0.000590980052947998, -0.0004672110080718994, -0.0003434419631958008, -0.00021967291831970215, -9.590387344360352e-05, 2.7865171432495117e-05, 0.00015163421630859375, 0.0002754032611846924, 0.000399172306060791, 0.0005229413509368896, 0.0006467103958129883, 0.0007704794406890869, 0.0008942484855651855, 0.0010180175304412842, 0.0011417865753173828, 0.0012655556201934814, 0.00138932466506958, 0.0015130937099456787, 0.0016368627548217773, 0.001760631799697876, 0.0018844008445739746, 0.0020081698894500732, 0.002131938934326172, 0.0022557079792022705, 0.002379477024078369, 0.0025032460689544678, 0.0026270151138305664, 0.002750784158706665, 0.0028745532035827637, 0.0029983222484588623, 0.003122091293334961, 0.0032458603382110596, 0.003369629383087158, 0.003493398427963257, 0.0036171674728393555, 0.003740936517715454, 0.0038647055625915527, 0.003988474607467651, 0.00411224365234375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 0.0, 0.0, 16.0, 0.0, 20.0, 0.0, 39.0, 0.0, 48.0, 0.0, 77.0, 0.0, 0.0, 99.0, 0.0, 378.0, 0.0, 116.0, 0.0, 72.0, 0.0, 49.0, 0.0, 0.0, 41.0, 0.0, 16.0, 0.0, 10.0, 0.0, 7.0, 0.0, 4.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.266659617424011e-07, -8.996576070785522e-07, -8.726492524147034e-07, -8.456408977508545e-07, -8.186325430870056e-07, -7.916241884231567e-07, -7.646158337593079e-07, -7.37607479095459e-07, -7.105991244316101e-07, -6.835907697677612e-07, -6.565824151039124e-07, -6.295740604400635e-07, -6.025657057762146e-07, -5.755573511123657e-07, -5.485489964485168e-07, -5.21540641784668e-07, -4.945322871208191e-07, -4.675239324569702e-07, -4.4051557779312134e-07, -4.1350722312927246e-07, -3.864988684654236e-07, -3.594905138015747e-07, -3.3248215913772583e-07, -3.0547380447387695e-07, -2.784654498100281e-07, -2.514570951461792e-07, -2.2444874048233032e-07, -1.9744038581848145e-07, -1.7043203115463257e-07, -1.434236764907837e-07, -1.1641532182693481e-07, -8.940696716308594e-08, -6.239861249923706e-08, -3.5390257835388184e-08, -8.381903171539307e-09, 1.862645149230957e-08, 4.563480615615845e-08, 7.264316082000732e-08, 9.96515154838562e-08, 1.2665987014770508e-07, 1.5366822481155396e-07, 1.8067657947540283e-07, 2.076849341392517e-07, 2.3469328880310059e-07, 2.6170164346694946e-07, 2.8870999813079834e-07, 3.157183527946472e-07, 3.427267074584961e-07, 3.6973506212234497e-07, 3.9674341678619385e-07, 4.237517714500427e-07, 4.507601261138916e-07, 4.777684807777405e-07, 5.047768354415894e-07, 5.317851901054382e-07, 5.587935447692871e-07, 5.85801899433136e-07, 6.128102540969849e-07, 6.398186087608337e-07, 6.668269634246826e-07, 6.938353180885315e-07, 7.208436727523804e-07, 7.478520274162292e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 5.0, 14.0, 23.0, 21.0, 32.0, 40.0, 56.0, 75.0, 99.0, 126.0, 174.0, 237.0, 305.0, 414.0, 607.0, 725.0, 984.0, 1388.0, 1981.0, 3093.0, 6400.0, 17337.0, 182179.0, 794260.0, 20084.0, 6880.0, 3327.0, 2108.0, 1466.0, 1005.0, 844.0, 554.0, 449.0, 316.0, 247.0, 175.0, 138.0, 99.0, 74.0, 63.0, 41.0, 26.0, 17.0, 20.0, 15.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00383758544921875, -0.003717869520187378, -0.003598153591156006, -0.003478437662124634, -0.0033587217330932617, -0.0032390058040618896, -0.0031192898750305176, -0.0029995739459991455, -0.0028798580169677734, -0.0027601420879364014, -0.0026404261589050293, -0.0025207102298736572, -0.002400994300842285, -0.002281278371810913, -0.002161562442779541, -0.002041846513748169, -0.0019221305847167969, -0.0018024146556854248, -0.0016826987266540527, -0.0015629827976226807, -0.0014432668685913086, -0.0013235509395599365, -0.0012038350105285645, -0.0010841190814971924, -0.0009644031524658203, -0.0008446872234344482, -0.0007249712944030762, -0.0006052553653717041, -0.00048553943634033203, -0.00036582350730895996, -0.0002461075782775879, -0.00012639164924621582, -6.67572021484375e-06, 0.00011304020881652832, 0.0002327561378479004, 0.00035247206687927246, 0.00047218799591064453, 0.0005919039249420166, 0.0007116198539733887, 0.0008313357830047607, 0.0009510517120361328, 0.0010707676410675049, 0.001190483570098877, 0.001310199499130249, 0.001429915428161621, 0.0015496313571929932, 0.0016693472862243652, 0.0017890632152557373, 0.0019087791442871094, 0.0020284950733184814, 0.0021482110023498535, 0.0022679269313812256, 0.0023876428604125977, 0.0025073587894439697, 0.002627074718475342, 0.002746790647506714, 0.002866506576538086, 0.002986222505569458, 0.00310593843460083, 0.003225654363632202, 0.0033453702926635742, 0.0034650862216949463, 0.0035848021507263184, 0.0037045180797576904, 0.0038242340087890625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 6.0, 16.0, 21.0, 63.0, 644.0, 143.0, 46.0, 18.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012121200561523438, -0.0011740624904632568, -0.00113600492477417, -0.001097947359085083, -0.001059889793395996, -0.0010218322277069092, -0.0009837746620178223, -0.0009457170963287354, -0.0009076595306396484, -0.0008696019649505615, -0.0008315443992614746, -0.0007934868335723877, -0.0007554292678833008, -0.0007173717021942139, -0.000679314136505127, -0.00064125657081604, -0.0006031990051269531, -0.0005651414394378662, -0.0005270838737487793, -0.0004890263080596924, -0.00045096874237060547, -0.00041291117668151855, -0.00037485361099243164, -0.0003367960453033447, -0.0002987384796142578, -0.0002606809139251709, -0.00022262334823608398, -0.00018456578254699707, -0.00014650821685791016, -0.00010845065116882324, -7.039308547973633e-05, -3.2335519790649414e-05, 5.7220458984375e-06, 4.3779611587524414e-05, 8.183717727661133e-05, 0.00011989474296569824, 0.00015795230865478516, 0.00019600987434387207, 0.00023406744003295898, 0.0002721250057220459, 0.0003101825714111328, 0.0003482401371002197, 0.00038629770278930664, 0.00042435526847839355, 0.00046241283416748047, 0.0005004703998565674, 0.0005385279655456543, 0.0005765855312347412, 0.0006146430969238281, 0.000652700662612915, 0.000690758228302002, 0.0007288157939910889, 0.0007668733596801758, 0.0008049309253692627, 0.0008429884910583496, 0.0008810460567474365, 0.0009191036224365234, 0.0009571611881256104, 0.0009952187538146973, 0.0010332763195037842, 0.001071333885192871, 0.001109391450881958, 0.001147449016571045, 0.0011855065822601318, 0.0012235641479492188]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 5.0, 10.0, 4.0, 10.0, 10.0, 11.0, 20.0, 37.0, 32.0, 38.0, 56.0, 65.0, 70.0, 109.0, 70.0, 87.0, 86.0, 52.0, 50.0, 31.0, 32.0, 29.0, 11.0, 19.0, 9.0, 5.0, 6.0, 4.0, 10.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01886601746082306, -0.01830318383872509, -0.01774035207927227, -0.0171775184571743, -0.01661468669772148, -0.016051853075623512, -0.015489019453525543, -0.014926186762750149, -0.014363354071974754, -0.01380052138119936, -0.013237688690423965, -0.012674855068325996, -0.012112022377550602, -0.011549189686775208, -0.010986356064677238, -0.010423523373901844, -0.00986069068312645, -0.009297857992351055, -0.00873502530157566, -0.008172191679477692, -0.007609358988702297, -0.007046526297926903, -0.006483693141490221, -0.005920859985053539, -0.005358027294278145, -0.00479519460350275, -0.004232361447066069, -0.0036695285234600306, -0.0031066955998539925, -0.0025438626762479544, -0.0019810297526419163, -0.0014181965962052345, -0.0008553657680749893, -0.0002925328444689512, 0.00027030007913708687, 0.000833133002743125, 0.001395965926349163, 0.001958798849955201, 0.0025216317735612392, 0.003084464929997921, 0.0036472976207733154, 0.00421013031154871, 0.004772963467985392, 0.005335796624422073, 0.005898629315197468, 0.006461462005972862, 0.007024295162409544, 0.007587128318846226, 0.00814996100962162, 0.008712793700397015, 0.009275626391172409, 0.009838460013270378, 0.010401292704045773, 0.010964125394821167, 0.011526959016919136, 0.01208979170769453, 0.012652624398469925, 0.01321545708924532, 0.013778289780020714, 0.014341123402118683, 0.014903956092894077, 0.015466788783669472, 0.01602962240576744, 0.01659245416522026, 0.01715528778731823]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 5.0, 7.0, 8.0, 12.0, 15.0, 12.0, 24.0, 18.0, 16.0, 23.0, 19.0, 18.0, 23.0, 29.0, 29.0, 35.0, 31.0, 29.0, 49.0, 48.0, 31.0, 44.0, 38.0, 51.0, 36.0, 38.0, 22.0, 23.0, 32.0, 24.0, 34.0, 26.0, 20.0, 20.0, 12.0, 13.0, 12.0, 8.0, 5.0, 10.0, 8.0, 9.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.012421466410160065, -0.012032251805067062, -0.01164303719997406, -0.011253821663558483, -0.01086460705846548, -0.010475392453372478, -0.010086176916956902, -0.0096969623118639, -0.009307747706770897, -0.008918533101677895, -0.008529318496584892, -0.008140102960169315, -0.007750888355076313, -0.007361673749983311, -0.006972458679229021, -0.0065832436084747314, -0.006194029003381729, -0.005804814398288727, -0.005415599327534437, -0.0050263842567801476, -0.004637169651687145, -0.004247955046594143, -0.0038587399758398533, -0.0034695251379162073, -0.0030803102999925613, -0.0026910954620689154, -0.0023018806241452694, -0.0019126657862216234, -0.0015234509482979774, -0.0011342361103743315, -0.0007450212724506855, -0.00035580643452703953, 3.340747207403183e-05, 0.0004226223099976778, 0.0008118371479213238, 0.0012010519858449697, 0.0015902668237686157, 0.0019794816616922617, 0.0023686964996159077, 0.0027579113375395536, 0.0031471261754631996, 0.0035363410133868456, 0.0039255558513104916, 0.004314770922064781, 0.0047039855271577835, 0.005093200132250786, 0.0054824152030050755, 0.005871630273759365, 0.006260844878852367, 0.00665005948394537, 0.007039274554699659, 0.007428489625453949, 0.007817704230546951, 0.008206918835639954, 0.008596133440732956, 0.008985348977148533, 0.009374563582241535, 0.009763778187334538, 0.010152993723750114, 0.010542208328843117, 0.010931422933936119, 0.011320637539029121, 0.011709852144122124, 0.0120990676805377, 0.012488282285630703]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 9.0, 22.0, 31.0, 39.0, 66.0, 87.0, 143.0, 210.0, 298.0, 472.0, 626.0, 921.0, 1406.0, 2008.0, 2895.0, 4447.0, 6360.0, 9440.0, 14512.0, 22907.0, 36032.0, 60067.0, 102221.0, 189718.0, 443961.0, 1340623.0, 1157652.0, 381563.0, 169815.0, 94096.0, 55330.0, 33679.0, 21193.0, 13389.0, 8968.0, 5876.0, 4096.0, 2722.0, 1917.0, 1349.0, 937.0, 639.0, 472.0, 328.0, 224.0, 159.0, 115.0, 74.0, 64.0, 38.0, 20.0, 21.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-0.01514434814453125, -0.01466989517211914, -0.014195442199707031, -0.013720989227294922, -0.013246536254882812, -0.012772083282470703, -0.012297630310058594, -0.011823177337646484, -0.011348724365234375, -0.010874271392822266, -0.010399818420410156, -0.009925365447998047, -0.009450912475585938, -0.008976459503173828, -0.008502006530761719, -0.00802755355834961, -0.0075531005859375, -0.007078647613525391, -0.006604194641113281, -0.006129741668701172, -0.0056552886962890625, -0.005180835723876953, -0.004706382751464844, -0.004231929779052734, -0.003757476806640625, -0.0032830238342285156, -0.0028085708618164062, -0.002334117889404297, -0.0018596649169921875, -0.0013852119445800781, -0.0009107589721679688, -0.0004363059997558594, 3.814697265625e-05, 0.0005125999450683594, 0.0009870529174804688, 0.0014615058898925781, 0.0019359588623046875, 0.002410411834716797, 0.0028848648071289062, 0.0033593177795410156, 0.003833770751953125, 0.004308223724365234, 0.004782676696777344, 0.005257129669189453, 0.0057315826416015625, 0.006206035614013672, 0.006680488586425781, 0.007154941558837891, 0.00762939453125, 0.00810384750366211, 0.008578300476074219, 0.009052753448486328, 0.009527206420898438, 0.010001659393310547, 0.010476112365722656, 0.010950565338134766, 0.011425018310546875, 0.011899471282958984, 0.012373924255371094, 0.012848377227783203, 0.013322830200195312, 0.013797283172607422, 0.014271736145019531, 0.01474618911743164, 0.01522064208984375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 7.0, 7.0, 7.0, 8.0, 14.0, 13.0, 17.0, 12.0, 18.0, 22.0, 24.0, 20.0, 35.0, 24.0, 36.0, 37.0, 37.0, 31.0, 45.0, 37.0, 45.0, 47.0, 52.0, 39.0, 44.0, 31.0, 33.0, 41.0, 29.0, 28.0, 19.0, 21.0, 18.0, 11.0, 17.0, 11.0, 16.0, 7.0, 8.0, 2.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.007320404052734375, -0.007088005542755127, -0.006855607032775879, -0.006623208522796631, -0.006390810012817383, -0.006158411502838135, -0.005926012992858887, -0.005693614482879639, -0.005461215972900391, -0.005228817462921143, -0.0049964189529418945, -0.0047640204429626465, -0.0045316219329833984, -0.00429922342300415, -0.004066824913024902, -0.0038344264030456543, -0.0036020278930664062, -0.003369629383087158, -0.00313723087310791, -0.002904832363128662, -0.002672433853149414, -0.002440035343170166, -0.002207636833190918, -0.00197523832321167, -0.0017428398132324219, -0.0015104413032531738, -0.0012780427932739258, -0.0010456442832946777, -0.0008132457733154297, -0.0005808472633361816, -0.0003484487533569336, -0.00011605024337768555, 0.0001163482666015625, 0.00034874677658081055, 0.0005811452865600586, 0.0008135437965393066, 0.0010459423065185547, 0.0012783408164978027, 0.0015107393264770508, 0.0017431378364562988, 0.001975536346435547, 0.002207934856414795, 0.002440333366394043, 0.002672731876373291, 0.002905130386352539, 0.003137528896331787, 0.003369927406311035, 0.003602325916290283, 0.0038347244262695312, 0.004067122936248779, 0.004299521446228027, 0.004531919956207275, 0.0047643184661865234, 0.0049967169761657715, 0.0052291154861450195, 0.005461513996124268, 0.005693912506103516, 0.005926311016082764, 0.006158709526062012, 0.00639110803604126, 0.006623506546020508, 0.006855905055999756, 0.007088303565979004, 0.007320702075958252, 0.0075531005859375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 8.0, 23.0, 23.0, 17.0, 34.0, 70.0, 86.0, 124.0, 189.0, 251.0, 363.0, 591.0, 861.0, 1338.0, 2203.0, 3379.0, 5453.0, 8719.0, 14308.0, 23958.0, 40423.0, 69338.0, 125885.0, 241447.0, 529696.0, 1275344.0, 994767.0, 409756.0, 196040.0, 103738.0, 58304.0, 34323.0, 20504.0, 12126.0, 7528.0, 4623.0, 2977.0, 1872.0, 1249.0, 774.0, 523.0, 337.0, 229.0, 163.0, 103.0, 82.0, 42.0, 26.0, 22.0, 15.0, 9.0, 6.0, 6.0, 3.0, 6.0, 3.0], "bins": [-0.01322174072265625, -0.01283109188079834, -0.01244044303894043, -0.01204979419708252, -0.01165914535522461, -0.0112684965133667, -0.010877847671508789, -0.010487198829650879, -0.010096549987792969, -0.009705901145935059, -0.009315252304077148, -0.008924603462219238, -0.008533954620361328, -0.008143305778503418, -0.007752656936645508, -0.007362008094787598, -0.0069713592529296875, -0.006580710411071777, -0.006190061569213867, -0.005799412727355957, -0.005408763885498047, -0.005018115043640137, -0.0046274662017822266, -0.004236817359924316, -0.0038461685180664062, -0.003455519676208496, -0.003064870834350586, -0.0026742219924926758, -0.0022835731506347656, -0.0018929243087768555, -0.0015022754669189453, -0.0011116266250610352, -0.000720977783203125, -0.00033032894134521484, 6.031990051269531e-05, 0.00045096874237060547, 0.0008416175842285156, 0.0012322664260864258, 0.001622915267944336, 0.002013564109802246, 0.0024042129516601562, 0.0027948617935180664, 0.0031855106353759766, 0.0035761594772338867, 0.003966808319091797, 0.004357457160949707, 0.004748106002807617, 0.005138754844665527, 0.0055294036865234375, 0.005920052528381348, 0.006310701370239258, 0.006701350212097168, 0.007091999053955078, 0.007482647895812988, 0.007873296737670898, 0.008263945579528809, 0.008654594421386719, 0.009045243263244629, 0.009435892105102539, 0.00982654094696045, 0.01021718978881836, 0.01060783863067627, 0.01099848747253418, 0.01138913631439209, 0.01177978515625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 9.0, 14.0, 17.0, 18.0, 24.0, 49.0, 47.0, 66.0, 68.0, 96.0, 99.0, 117.0, 139.0, 157.0, 181.0, 238.0, 240.0, 271.0, 315.0, 296.0, 281.0, 208.0, 210.0, 166.0, 126.0, 132.0, 90.0, 87.0, 62.0, 49.0, 50.0, 36.0, 24.0, 17.0, 20.0, 11.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004108428955078125, -0.003973603248596191, -0.003838777542114258, -0.0037039518356323242, -0.0035691261291503906, -0.003434300422668457, -0.0032994747161865234, -0.00316464900970459, -0.0030298233032226562, -0.0028949975967407227, -0.002760171890258789, -0.0026253461837768555, -0.002490520477294922, -0.0023556947708129883, -0.0022208690643310547, -0.002086043357849121, -0.0019512176513671875, -0.001816391944885254, -0.0016815662384033203, -0.0015467405319213867, -0.0014119148254394531, -0.0012770891189575195, -0.001142263412475586, -0.0010074377059936523, -0.0008726119995117188, -0.0007377862930297852, -0.0006029605865478516, -0.00046813488006591797, -0.0003333091735839844, -0.00019848346710205078, -6.365776062011719e-05, 7.11679458618164e-05, 0.00020599365234375, 0.0003408193588256836, 0.0004756450653076172, 0.0006104707717895508, 0.0007452964782714844, 0.000880122184753418, 0.0010149478912353516, 0.0011497735977172852, 0.0012845993041992188, 0.0014194250106811523, 0.001554250717163086, 0.0016890764236450195, 0.0018239021301269531, 0.0019587278366088867, 0.0020935535430908203, 0.002228379249572754, 0.0023632049560546875, 0.002498030662536621, 0.0026328563690185547, 0.0027676820755004883, 0.002902507781982422, 0.0030373334884643555, 0.003172159194946289, 0.0033069849014282227, 0.0034418106079101562, 0.00357663631439209, 0.0037114620208740234, 0.003846287727355957, 0.003981113433837891, 0.004115939140319824, 0.004250764846801758, 0.004385590553283691, 0.004520416259765625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 4.0, 0.0, 6.0, 4.0, 11.0, 9.0, 17.0, 20.0, 16.0, 31.0, 35.0, 40.0, 54.0, 69.0, 62.0, 62.0, 78.0, 71.0, 77.0, 66.0, 53.0, 38.0, 19.0, 24.0, 17.0, 19.0, 9.0, 21.0, 9.0, 16.0, 7.0, 5.0, 3.0, 5.0, 9.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00880158506333828, -0.00848508533090353, -0.00816858559846878, -0.007852085866034031, -0.007535586133599281, -0.007219086401164532, -0.006902586668729782, -0.0065860869362950325, -0.006269587203860283, -0.005953087471425533, -0.005636587738990784, -0.005320088006556034, -0.0050035882741212845, -0.004687088541686535, -0.004370588809251785, -0.004054089076817036, -0.0037375888787209988, -0.003421089146286249, -0.0031045894138514996, -0.00278808968141675, -0.0024715899489820004, -0.0021550902165472507, -0.0018385902512818575, -0.0015220905188471079, -0.0012055907864123583, -0.0008890910539776087, -0.0005725912633351982, -0.00025609147269278765, 6.0408259741961956e-05, 0.00037690799217671156, 0.000693407841026783, 0.0010099075734615326, 0.0013264073058962822, 0.0016429070383310318, 0.0019594067707657814, 0.002275906503200531, 0.0025924062356352806, 0.00290890596807003, 0.0032254059333354235, 0.003541905665770173, 0.0038584053982049227, 0.004174905363470316, 0.0044914050959050655, 0.004807904828339815, 0.005124404560774565, 0.005440904293209314, 0.005757404025644064, 0.0060739037580788136, 0.006390403490513563, 0.006706903222948313, 0.007023402955383062, 0.007339902687817812, 0.007656402420252562, 0.007972902618348598, 0.008289402350783348, 0.008605902083218098, 0.008922401815652847, 0.009238901548087597, 0.009555401280522346, 0.009871901012957096, 0.010188400745391846, 0.010504900477826595, 0.010821400210261345, 0.011137899942696095, 0.011454399675130844]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 2.0, 7.0, 9.0, 14.0, 14.0, 11.0, 14.0, 23.0, 28.0, 12.0, 19.0, 28.0, 26.0, 15.0, 36.0, 37.0, 39.0, 33.0, 38.0, 31.0, 36.0, 39.0, 36.0, 43.0, 41.0, 43.0, 31.0, 24.0, 21.0, 35.0, 26.0, 27.0, 25.0, 22.0, 12.0, 12.0, 6.0, 11.0, 6.0, 11.0, 11.0, 4.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0074461097829043865, -0.007212478201836348, -0.006978847086429596, -0.006745215505361557, -0.006511583924293518, -0.006277952343225479, -0.0060443212278187275, -0.0058106896467506886, -0.005577058531343937, -0.005343426950275898, -0.005109795834869146, -0.004876164253801107, -0.0046425326727330685, -0.004408901557326317, -0.004175269976258278, -0.003941638395190239, -0.0037080068141222, -0.0034743754658848047, -0.003240743884816766, -0.0030071125365793705, -0.0027734809555113316, -0.0025398496072739363, -0.002306218259036541, -0.002072586677968502, -0.0018389553297311068, -0.0016053238650783896, -0.0013716924004256725, -0.0011380610521882772, -0.0009044295875355601, -0.000670798122882843, -0.00043716677464544773, -0.00020353530999273062, 3.0096154659986496e-05, 0.00026372759020887315, 0.0004973590257577598, 0.000730990432202816, 0.0009646218968555331, 0.0011982533615082502, 0.0014318847097456455, 0.0016655161743983626, 0.0018991476390510798, 0.002132778987288475, 0.002366410568356514, 0.0026000419165939093, 0.0028336732648313046, 0.0030673048458993435, 0.0033009361941367388, 0.003534567542374134, 0.003768199123442173, 0.004001830704510212, 0.004235461819916964, 0.0044690934009850025, 0.0047027249820530415, 0.004936356097459793, 0.005169987678527832, 0.005403619259595871, 0.00563725084066391, 0.005870882421731949, 0.0061045135371387005, 0.006338145118206739, 0.006571776699274778, 0.00680540781468153, 0.007039039395749569, 0.007272670976817608, 0.0075063020922243595]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 12.0, 11.0, 17.0, 25.0, 43.0, 49.0, 66.0, 118.0, 196.0, 225.0, 372.0, 567.0, 773.0, 1252.0, 1965.0, 3006.0, 4753.0, 7897.0, 13192.0, 22750.0, 41929.0, 80141.0, 166587.0, 312671.0, 190548.0, 90015.0, 46565.0, 25115.0, 14374.0, 8571.0, 5286.0, 3292.0, 2085.0, 1350.0, 855.0, 615.0, 393.0, 269.0, 213.0, 116.0, 67.0, 61.0, 52.0, 26.0, 11.0, 13.0, 9.0, 11.0, 6.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.00479888916015625, -0.004646956920623779, -0.004495024681091309, -0.004343092441558838, -0.004191160202026367, -0.0040392279624938965, -0.0038872957229614258, -0.003735363483428955, -0.0035834312438964844, -0.0034314990043640137, -0.003279566764831543, -0.0031276345252990723, -0.0029757022857666016, -0.002823770046234131, -0.00267183780670166, -0.0025199055671691895, -0.0023679733276367188, -0.002216041088104248, -0.0020641088485717773, -0.0019121766090393066, -0.001760244369506836, -0.0016083121299743652, -0.0014563798904418945, -0.0013044476509094238, -0.0011525154113769531, -0.0010005831718444824, -0.0008486509323120117, -0.000696718692779541, -0.0005447864532470703, -0.0003928542137145996, -0.0002409219741821289, -8.89897346496582e-05, 6.29425048828125e-05, 0.0002148747444152832, 0.0003668069839477539, 0.0005187392234802246, 0.0006706714630126953, 0.000822603702545166, 0.0009745359420776367, 0.0011264681816101074, 0.0012784004211425781, 0.0014303326606750488, 0.0015822649002075195, 0.0017341971397399902, 0.001886129379272461, 0.0020380616188049316, 0.0021899938583374023, 0.002341926097869873, 0.0024938583374023438, 0.0026457905769348145, 0.002797722816467285, 0.002949655055999756, 0.0031015872955322266, 0.0032535195350646973, 0.003405451774597168, 0.0035573840141296387, 0.0037093162536621094, 0.00386124849319458, 0.004013180732727051, 0.0041651129722595215, 0.004317045211791992, 0.004468977451324463, 0.004620909690856934, 0.004772841930389404, 0.004924774169921875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 8.0, 12.0, 5.0, 17.0, 13.0, 17.0, 13.0, 19.0, 24.0, 23.0, 23.0, 28.0, 32.0, 31.0, 31.0, 43.0, 39.0, 36.0, 33.0, 47.0, 47.0, 35.0, 41.0, 35.0, 31.0, 35.0, 33.0, 20.0, 31.0, 26.0, 17.0, 15.0, 27.0, 14.0, 12.0, 13.0, 9.0, 11.0, 4.0, 13.0, 10.0, 1.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007488250732421875, -0.007242739200592041, -0.006997227668762207, -0.006751716136932373, -0.006506204605102539, -0.006260693073272705, -0.006015181541442871, -0.005769670009613037, -0.005524158477783203, -0.005278646945953369, -0.005033135414123535, -0.004787623882293701, -0.004542112350463867, -0.004296600818634033, -0.004051089286804199, -0.0038055777549743652, -0.0035600662231445312, -0.0033145546913146973, -0.0030690431594848633, -0.0028235316276550293, -0.0025780200958251953, -0.0023325085639953613, -0.0020869970321655273, -0.0018414855003356934, -0.0015959739685058594, -0.0013504624366760254, -0.0011049509048461914, -0.0008594393730163574, -0.0006139278411865234, -0.00036841630935668945, -0.00012290477752685547, 0.00012260675430297852, 0.0003681182861328125, 0.0006136298179626465, 0.0008591413497924805, 0.0011046528816223145, 0.0013501644134521484, 0.0015956759452819824, 0.0018411874771118164, 0.0020866990089416504, 0.0023322105407714844, 0.0025777220726013184, 0.0028232336044311523, 0.0030687451362609863, 0.0033142566680908203, 0.0035597681999206543, 0.0038052797317504883, 0.004050791263580322, 0.004296302795410156, 0.00454181432723999, 0.004787325859069824, 0.005032837390899658, 0.005278348922729492, 0.005523860454559326, 0.00576937198638916, 0.006014883518218994, 0.006260395050048828, 0.006505906581878662, 0.006751418113708496, 0.00699692964553833, 0.007242441177368164, 0.007487952709197998, 0.007733464241027832, 0.007978975772857666, 0.0082244873046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 21.0, 22.0, 27.0, 47.0, 59.0, 72.0, 119.0, 161.0, 236.0, 300.0, 422.0, 672.0, 999.0, 1459.0, 2085.0, 3084.0, 4674.0, 7423.0, 13562.0, 27014.0, 68912.0, 266026.0, 468394.0, 103339.0, 36695.0, 16880.0, 9339.0, 5381.0, 3496.0, 2365.0, 1641.0, 1102.0, 748.0, 534.0, 358.0, 252.0, 190.0, 126.0, 95.0, 64.0, 41.0, 30.0, 17.0, 21.0, 9.0, 7.0, 7.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.007358551025390625, -0.007122516632080078, -0.006886482238769531, -0.006650447845458984, -0.0064144134521484375, -0.006178379058837891, -0.005942344665527344, -0.005706310272216797, -0.00547027587890625, -0.005234241485595703, -0.004998207092285156, -0.004762172698974609, -0.0045261383056640625, -0.004290103912353516, -0.004054069519042969, -0.003818035125732422, -0.003582000732421875, -0.003345966339111328, -0.0031099319458007812, -0.0028738975524902344, -0.0026378631591796875, -0.0024018287658691406, -0.0021657943725585938, -0.0019297599792480469, -0.0016937255859375, -0.0014576911926269531, -0.0012216567993164062, -0.0009856224060058594, -0.0007495880126953125, -0.0005135536193847656, -0.00027751922607421875, -4.1484832763671875e-05, 0.000194549560546875, 0.0004305839538574219, 0.0006666183471679688, 0.0009026527404785156, 0.0011386871337890625, 0.0013747215270996094, 0.0016107559204101562, 0.0018467903137207031, 0.00208282470703125, 0.002318859100341797, 0.0025548934936523438, 0.0027909278869628906, 0.0030269622802734375, 0.0032629966735839844, 0.0034990310668945312, 0.003735065460205078, 0.003971099853515625, 0.004207134246826172, 0.004443168640136719, 0.004679203033447266, 0.0049152374267578125, 0.005151271820068359, 0.005387306213378906, 0.005623340606689453, 0.005859375, 0.006095409393310547, 0.006331443786621094, 0.006567478179931641, 0.0068035125732421875, 0.007039546966552734, 0.007275581359863281, 0.007511615753173828, 0.007747650146484375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 4.0, 2.0, 7.0, 5.0, 9.0, 18.0, 10.0, 10.0, 14.0, 12.0, 18.0, 17.0, 31.0, 39.0, 32.0, 31.0, 33.0, 29.0, 36.0, 49.0, 33.0, 38.0, 36.0, 35.0, 40.0, 39.0, 33.0, 24.0, 36.0, 35.0, 32.0, 29.0, 27.0, 21.0, 19.0, 11.0, 18.0, 18.0, 10.0, 7.0, 7.0, 8.0, 8.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005153656005859375, -0.004993140697479248, -0.004832625389099121, -0.004672110080718994, -0.004511594772338867, -0.00435107946395874, -0.004190564155578613, -0.004030048847198486, -0.0038695335388183594, -0.0037090182304382324, -0.0035485029220581055, -0.0033879876136779785, -0.0032274723052978516, -0.0030669569969177246, -0.0029064416885375977, -0.0027459263801574707, -0.0025854110717773438, -0.002424895763397217, -0.00226438045501709, -0.002103865146636963, -0.001943349838256836, -0.001782834529876709, -0.001622319221496582, -0.001461803913116455, -0.0013012886047363281, -0.0011407732963562012, -0.0009802579879760742, -0.0008197426795959473, -0.0006592273712158203, -0.0004987120628356934, -0.0003381967544555664, -0.00017768144607543945, -1.71661376953125e-05, 0.00014334917068481445, 0.0003038644790649414, 0.00046437978744506836, 0.0006248950958251953, 0.0007854104042053223, 0.0009459257125854492, 0.0011064410209655762, 0.0012669563293457031, 0.00142747163772583, 0.001587986946105957, 0.001748502254486084, 0.001909017562866211, 0.002069532871246338, 0.002230048179626465, 0.002390563488006592, 0.0025510787963867188, 0.0027115941047668457, 0.0028721094131469727, 0.0030326247215270996, 0.0031931400299072266, 0.0033536553382873535, 0.0035141706466674805, 0.0036746859550476074, 0.0038352012634277344, 0.003995716571807861, 0.004156231880187988, 0.004316747188568115, 0.004477262496948242, 0.004637777805328369, 0.004798293113708496, 0.004958808422088623, 0.00511932373046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 9.0, 20.0, 15.0, 28.0, 29.0, 65.0, 61.0, 75.0, 142.0, 159.0, 229.0, 330.0, 467.0, 650.0, 910.0, 1218.0, 1809.0, 2904.0, 4413.0, 7527.0, 14038.0, 31647.0, 109659.0, 656451.0, 140889.0, 36359.0, 15776.0, 8397.0, 4806.0, 2997.0, 1988.0, 1246.0, 860.0, 703.0, 449.0, 333.0, 244.0, 176.0, 133.0, 99.0, 64.0, 53.0, 45.0, 19.0, 18.0, 10.0, 9.0, 12.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0006017684936523438, -0.000582084059715271, -0.0005623996257781982, -0.0005427151918411255, -0.0005230307579040527, -0.00050334632396698, -0.0004836618900299072, -0.00046397745609283447, -0.0004442930221557617, -0.00042460858821868896, -0.0004049241542816162, -0.00038523972034454346, -0.0003655552864074707, -0.00034587085247039795, -0.0003261864185333252, -0.00030650198459625244, -0.0002868175506591797, -0.00026713311672210693, -0.0002474486827850342, -0.00022776424884796143, -0.00020807981491088867, -0.00018839538097381592, -0.00016871094703674316, -0.0001490265130996704, -0.00012934207916259766, -0.0001096576452255249, -8.997321128845215e-05, -7.02887773513794e-05, -5.060434341430664e-05, -3.091990947723389e-05, -1.1235475540161133e-05, 8.448958396911621e-06, 2.8133392333984375e-05, 4.781782627105713e-05, 6.750226020812988e-05, 8.718669414520264e-05, 0.00010687112808227539, 0.00012655556201934814, 0.0001462399959564209, 0.00016592442989349365, 0.0001856088638305664, 0.00020529329776763916, 0.00022497773170471191, 0.00024466216564178467, 0.0002643465995788574, 0.0002840310335159302, 0.00030371546745300293, 0.0003233999013900757, 0.00034308433532714844, 0.0003627687692642212, 0.00038245320320129395, 0.0004021376371383667, 0.00042182207107543945, 0.0004415065050125122, 0.00046119093894958496, 0.0004808753728866577, 0.0005005598068237305, 0.0005202442407608032, 0.000539928674697876, 0.0005596131086349487, 0.0005792975425720215, 0.0005989819765090942, 0.000618666410446167, 0.0006383508443832397, 0.0006580352783203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 6.0, 0.0, 19.0, 0.0, 16.0, 0.0, 25.0, 0.0, 56.0, 0.0, 70.0, 0.0, 81.0, 0.0, 84.0, 0.0, 99.0, 0.0, 78.0, 0.0, 102.0, 0.0, 90.0, 0.0, 78.0, 0.0, 62.0, 0.0, 47.0, 0.0, 33.0, 0.0, 22.0, 0.0, 16.0, 0.0, 8.0, 0.0, 8.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07, 9.834766387939453e-07, 1.0132789611816406e-06, 1.043081283569336e-06, 1.0728836059570312e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 14.0, 16.0, 21.0, 57.0, 68.0, 76.0, 119.0, 183.0, 265.0, 408.0, 549.0, 838.0, 1161.0, 1748.0, 2511.0, 3922.0, 6293.0, 10183.0, 16976.0, 29442.0, 56033.0, 118856.0, 353093.0, 243483.0, 92260.0, 45587.0, 24949.0, 14695.0, 8694.0, 5400.0, 3440.0, 2340.0, 1558.0, 1004.0, 699.0, 527.0, 356.0, 199.0, 171.0, 116.0, 76.0, 43.0, 33.0, 30.0, 16.0, 6.0, 6.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.0006504058837890625, -0.0006299838423728943, -0.0006095618009567261, -0.0005891397595405579, -0.0005687177181243896, -0.0005482956767082214, -0.0005278736352920532, -0.000507451593875885, -0.0004870295524597168, -0.0004666075110435486, -0.00044618546962738037, -0.00042576342821121216, -0.00040534138679504395, -0.00038491934537887573, -0.0003644973039627075, -0.0003440752625465393, -0.0003236532211303711, -0.0003032311797142029, -0.00028280913829803467, -0.00026238709688186646, -0.00024196505546569824, -0.00022154301404953003, -0.00020112097263336182, -0.0001806989312171936, -0.0001602768898010254, -0.00013985484838485718, -0.00011943280696868896, -9.901076555252075e-05, -7.858872413635254e-05, -5.8166682720184326e-05, -3.774464130401611e-05, -1.73225998878479e-05, 3.0994415283203125e-06, 2.3521482944488525e-05, 4.394352436065674e-05, 6.436556577682495e-05, 8.478760719299316e-05, 0.00010520964860916138, 0.0001256316900253296, 0.0001460537314414978, 0.00016647577285766602, 0.00018689781427383423, 0.00020731985569000244, 0.00022774189710617065, 0.00024816393852233887, 0.0002685859799385071, 0.0002890080213546753, 0.0003094300627708435, 0.0003298521041870117, 0.00035027414560317993, 0.00037069618701934814, 0.00039111822843551636, 0.00041154026985168457, 0.0004319623112678528, 0.000452384352684021, 0.0004728063941001892, 0.0004932284355163574, 0.0005136504769325256, 0.0005340725183486938, 0.0005544945597648621, 0.0005749166011810303, 0.0005953386425971985, 0.0006157606840133667, 0.0006361827254295349, 0.0006566047668457031]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 6.0, 11.0, 15.0, 14.0, 12.0, 18.0, 20.0, 28.0, 42.0, 34.0, 42.0, 55.0, 61.0, 64.0, 79.0, 60.0, 60.0, 49.0, 47.0, 33.0, 27.0, 34.0, 30.0, 14.0, 18.0, 21.0, 17.0, 13.0, 7.0, 7.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00019788742065429688, -0.00019161775708198547, -0.00018534809350967407, -0.00017907842993736267, -0.00017280876636505127, -0.00016653910279273987, -0.00016026943922042847, -0.00015399977564811707, -0.00014773011207580566, -0.00014146044850349426, -0.00013519078493118286, -0.00012892112135887146, -0.00012265145778656006, -0.00011638179421424866, -0.00011011213064193726, -0.00010384246706962585, -9.757280349731445e-05, -9.130313992500305e-05, -8.503347635269165e-05, -7.876381278038025e-05, -7.249414920806885e-05, -6.622448563575745e-05, -5.9954822063446045e-05, -5.3685158491134644e-05, -4.741549491882324e-05, -4.114583134651184e-05, -3.487616777420044e-05, -2.8606504201889038e-05, -2.2336840629577637e-05, -1.6067177057266235e-05, -9.797513484954834e-06, -3.5278499126434326e-06, 2.7418136596679688e-06, 9.01147723197937e-06, 1.528114080429077e-05, 2.1550804376602173e-05, 2.7820467948913574e-05, 3.4090131521224976e-05, 4.035979509353638e-05, 4.662945866584778e-05, 5.289912223815918e-05, 5.916878581047058e-05, 6.543844938278198e-05, 7.170811295509338e-05, 7.797777652740479e-05, 8.424744009971619e-05, 9.051710367202759e-05, 9.678676724433899e-05, 0.00010305643081665039, 0.00010932609438896179, 0.0001155957579612732, 0.0001218654215335846, 0.000128135085105896, 0.0001344047486782074, 0.0001406744122505188, 0.0001469440758228302, 0.0001532137393951416, 0.000159483402967453, 0.0001657530665397644, 0.0001720227301120758, 0.0001782923936843872, 0.0001845620572566986, 0.00019083172082901, 0.0001971013844013214, 0.0002033710479736328]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 3.0, 1.0, 2.0, 5.0, 14.0, 8.0, 11.0, 25.0, 15.0, 35.0, 39.0, 45.0, 53.0, 68.0, 70.0, 63.0, 69.0, 80.0, 73.0, 51.0, 48.0, 42.0, 20.0, 21.0, 21.0, 18.0, 20.0, 12.0, 10.0, 13.0, 5.0, 5.0, 4.0, 6.0, 7.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.008999732322990894, -0.008686278015375137, -0.008372822776436806, -0.008059367537498474, -0.007745913229882717, -0.007432458456605673, -0.0071190036833286285, -0.006805548910051584, -0.00649209413677454, -0.006178639363497496, -0.005865184590220451, -0.005551729816943407, -0.005238275043666363, -0.0049248202703893185, -0.004611365497112274, -0.00429791072383523, -0.003984455950558186, -0.0036710011772811413, -0.003357546404004097, -0.0030440916307270527, -0.0027306368574500084, -0.002417182084172964, -0.00210372731089592, -0.0017902725376188755, -0.0014768177643418312, -0.001163362991064787, -0.0008499082177877426, -0.0005364534445106983, -0.00022299867123365402, 9.045610204339027e-05, 0.00040391087532043457, 0.0007173656485974789, 0.0010308194905519485, 0.0013442742638289928, 0.0016577290371060371, 0.0019711838103830814, 0.0022846385836601257, 0.00259809335693717, 0.0029115481302142143, 0.0032250029034912586, 0.003538457676768303, 0.003851912450045347, 0.0041653672233223915, 0.004478821996599436, 0.00479227676987648, 0.005105731543153524, 0.005419186316430569, 0.005732641089707613, 0.006046095862984657, 0.006359550636261702, 0.006673005409538746, 0.00698646018281579, 0.0072999149560928345, 0.007613369729369879, 0.007926824502646923, 0.00824027881026268, 0.008553734049201012, 0.008867189288139343, 0.0091806435957551, 0.009494097903370857, 0.009807553142309189, 0.01012100838124752, 0.010434462688863277, 0.010747916996479034, 0.011061372235417366]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 6.0, 4.0, 9.0, 14.0, 13.0, 11.0, 11.0, 23.0, 23.0, 20.0, 17.0, 30.0, 26.0, 18.0, 22.0, 42.0, 39.0, 28.0, 42.0, 35.0, 32.0, 43.0, 32.0, 36.0, 46.0, 47.0, 37.0, 24.0, 22.0, 34.0, 21.0, 31.0, 21.0, 25.0, 16.0, 12.0, 8.0, 8.0, 7.0, 9.0, 8.0, 10.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.007468620780855417, -0.007236379664391279, -0.0070041390135884285, -0.0067718978971242905, -0.00653965724632144, -0.006307416129857302, -0.006075175479054451, -0.005842934362590313, -0.005610693711787462, -0.005378452595323324, -0.0051462119445204735, -0.0049139708280563354, -0.004681730177253485, -0.004449489060789347, -0.004217248409986496, -0.003985007293522358, -0.0037527664098888636, -0.003520525526255369, -0.003288284642621875, -0.0030560437589883804, -0.002823802875354886, -0.0025915619917213917, -0.0023593208752572536, -0.002127080224454403, -0.0018948392244055867, -0.0016625983407720923, -0.001430357457138598, -0.0011981164570897818, -0.0009658756316639483, -0.000733634689822793, -0.0005013938061892986, -0.00026915292255580425, -3.6912038922309875e-05, 0.00019532885926309973, 0.00042756975744850934, 0.0006598106701858342, 0.0008920515538193285, 0.0011242924956604838, 0.0013565333792939782, 0.0015887742629274726, 0.001821015146560967, 0.002053256146609783, 0.0022854970302432775, 0.002517737913876772, 0.0027499787975102663, 0.0029822196811437607, 0.003214460564777255, 0.0034467014484107494, 0.003678942332044244, 0.003911183215677738, 0.004143424332141876, 0.004375664982944727, 0.004607906099408865, 0.004840146750211716, 0.005072387866675854, 0.0053046285174787045, 0.0055368696339428425, 0.0057691107504069805, 0.006001351401209831, 0.006233592517673969, 0.00646583316847682, 0.006698074284940958, 0.006930314935743809, 0.007162556052207947, 0.0073947967030107975]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 9.0, 19.0, 25.0, 33.0, 52.0, 61.0, 88.0, 122.0, 188.0, 263.0, 358.0, 511.0, 693.0, 1085.0, 1499.0, 2104.0, 3051.0, 4474.0, 6203.0, 9134.0, 13395.0, 19410.0, 29503.0, 44773.0, 70896.0, 120526.0, 207023.0, 198604.0, 114798.0, 67825.0, 43124.0, 28004.0, 18885.0, 12841.0, 8896.0, 6021.0, 4234.0, 2854.0, 2063.0, 1463.0, 1039.0, 720.0, 516.0, 365.0, 253.0, 180.0, 134.0, 75.0, 59.0, 38.0, 20.0, 28.0, 15.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.01229095458984375, -0.011893868446350098, -0.011496782302856445, -0.011099696159362793, -0.01070261001586914, -0.010305523872375488, -0.009908437728881836, -0.009511351585388184, -0.009114265441894531, -0.008717179298400879, -0.008320093154907227, -0.007923007011413574, -0.007525920867919922, -0.0071288347244262695, -0.006731748580932617, -0.006334662437438965, -0.0059375762939453125, -0.00554049015045166, -0.005143404006958008, -0.0047463178634643555, -0.004349231719970703, -0.003952145576477051, -0.0035550594329833984, -0.003157973289489746, -0.0027608871459960938, -0.0023638010025024414, -0.001966714859008789, -0.0015696287155151367, -0.0011725425720214844, -0.000775456428527832, -0.0003783702850341797, 1.8715858459472656e-05, 0.000415802001953125, 0.0008128881454467773, 0.0012099742889404297, 0.001607060432434082, 0.0020041465759277344, 0.0024012327194213867, 0.002798318862915039, 0.0031954050064086914, 0.0035924911499023438, 0.003989577293395996, 0.0043866634368896484, 0.004783749580383301, 0.005180835723876953, 0.0055779218673706055, 0.005975008010864258, 0.00637209415435791, 0.0067691802978515625, 0.007166266441345215, 0.007563352584838867, 0.00796043872833252, 0.008357524871826172, 0.008754611015319824, 0.009151697158813477, 0.009548783302307129, 0.009945869445800781, 0.010342955589294434, 0.010740041732788086, 0.011137127876281738, 0.01153421401977539, 0.011931300163269043, 0.012328386306762695, 0.012725472450256348, 0.01312255859375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 10.0, 9.0, 9.0, 16.0, 14.0, 22.0, 20.0, 25.0, 32.0, 20.0, 29.0, 26.0, 26.0, 36.0, 39.0, 41.0, 42.0, 41.0, 34.0, 40.0, 40.0, 36.0, 49.0, 40.0, 34.0, 30.0, 23.0, 27.0, 21.0, 20.0, 26.0, 16.0, 8.0, 10.0, 10.0, 11.0, 5.0, 8.0, 8.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00664520263671875, -0.0064389705657958984, -0.006232738494873047, -0.006026506423950195, -0.005820274353027344, -0.005614042282104492, -0.005407810211181641, -0.005201578140258789, -0.0049953460693359375, -0.004789113998413086, -0.004582881927490234, -0.004376649856567383, -0.004170417785644531, -0.00396418571472168, -0.003757953643798828, -0.0035517215728759766, -0.003345489501953125, -0.0031392574310302734, -0.002933025360107422, -0.0027267932891845703, -0.0025205612182617188, -0.002314329147338867, -0.0021080970764160156, -0.001901865005493164, -0.0016956329345703125, -0.001489400863647461, -0.0012831687927246094, -0.0010769367218017578, -0.0008707046508789062, -0.0006644725799560547, -0.0004582405090332031, -0.00025200843811035156, -4.57763671875e-05, 0.00016045570373535156, 0.0003666877746582031, 0.0005729198455810547, 0.0007791519165039062, 0.0009853839874267578, 0.0011916160583496094, 0.001397848129272461, 0.0016040802001953125, 0.001810312271118164, 0.0020165443420410156, 0.002222776412963867, 0.0024290084838867188, 0.0026352405548095703, 0.002841472625732422, 0.0030477046966552734, 0.003253936767578125, 0.0034601688385009766, 0.003666400909423828, 0.0038726329803466797, 0.004078865051269531, 0.004285097122192383, 0.004491329193115234, 0.004697561264038086, 0.0049037933349609375, 0.005110025405883789, 0.005316257476806641, 0.005522489547729492, 0.005728721618652344, 0.005934953689575195, 0.006141185760498047, 0.0063474178314208984, 0.00655364990234375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 7.0, 13.0, 23.0, 32.0, 41.0, 58.0, 99.0, 138.0, 204.0, 302.0, 485.0, 663.0, 1020.0, 1521.0, 2272.0, 3361.0, 5184.0, 7765.0, 12096.0, 19083.0, 30809.0, 50327.0, 84113.0, 148556.0, 235997.0, 180581.0, 103163.0, 60356.0, 36706.0, 22372.0, 14297.0, 9163.0, 5860.0, 3937.0, 2680.0, 1752.0, 1117.0, 790.0, 534.0, 357.0, 241.0, 162.0, 101.0, 68.0, 50.0, 30.0, 31.0, 10.0, 13.0, 7.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0], "bins": [-0.0143280029296875, -0.013889551162719727, -0.013451099395751953, -0.01301264762878418, -0.012574195861816406, -0.012135744094848633, -0.01169729232788086, -0.011258840560913086, -0.010820388793945312, -0.010381937026977539, -0.009943485260009766, -0.009505033493041992, -0.009066581726074219, -0.008628129959106445, -0.008189678192138672, -0.0077512264251708984, -0.007312774658203125, -0.0068743228912353516, -0.006435871124267578, -0.005997419357299805, -0.005558967590332031, -0.005120515823364258, -0.004682064056396484, -0.004243612289428711, -0.0038051605224609375, -0.003366708755493164, -0.0029282569885253906, -0.002489805221557617, -0.0020513534545898438, -0.0016129016876220703, -0.0011744499206542969, -0.0007359981536865234, -0.00029754638671875, 0.00014090538024902344, 0.0005793571472167969, 0.0010178089141845703, 0.0014562606811523438, 0.0018947124481201172, 0.0023331642150878906, 0.002771615982055664, 0.0032100677490234375, 0.003648519515991211, 0.004086971282958984, 0.004525423049926758, 0.004963874816894531, 0.005402326583862305, 0.005840778350830078, 0.0062792301177978516, 0.006717681884765625, 0.0071561336517333984, 0.007594585418701172, 0.008033037185668945, 0.008471488952636719, 0.008909940719604492, 0.009348392486572266, 0.009786844253540039, 0.010225296020507812, 0.010663747787475586, 0.01110219955444336, 0.011540651321411133, 0.011979103088378906, 0.01241755485534668, 0.012856006622314453, 0.013294458389282227, 0.01373291015625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 13.0, 10.0, 4.0, 14.0, 13.0, 18.0, 25.0, 19.0, 34.0, 27.0, 28.0, 44.0, 26.0, 42.0, 36.0, 43.0, 48.0, 43.0, 36.0, 34.0, 46.0, 38.0, 27.0, 43.0, 38.0, 25.0, 40.0, 28.0, 26.0, 19.0, 20.0, 15.0, 19.0, 13.0, 9.0, 6.0, 7.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00437164306640625, -0.004222750663757324, -0.0040738582611083984, -0.003924965858459473, -0.003776073455810547, -0.003627181053161621, -0.0034782886505126953, -0.0033293962478637695, -0.0031805038452148438, -0.003031611442565918, -0.002882719039916992, -0.0027338266372680664, -0.0025849342346191406, -0.002436041831970215, -0.002287149429321289, -0.0021382570266723633, -0.0019893646240234375, -0.0018404722213745117, -0.001691579818725586, -0.0015426874160766602, -0.0013937950134277344, -0.0012449026107788086, -0.0010960102081298828, -0.000947117805480957, -0.0007982254028320312, -0.0006493330001831055, -0.0005004405975341797, -0.0003515481948852539, -0.00020265579223632812, -5.3763389587402344e-05, 9.512901306152344e-05, 0.00024402141571044922, 0.000392913818359375, 0.0005418062210083008, 0.0006906986236572266, 0.0008395910263061523, 0.0009884834289550781, 0.001137375831604004, 0.0012862682342529297, 0.0014351606369018555, 0.0015840530395507812, 0.001732945442199707, 0.0018818378448486328, 0.0020307302474975586, 0.0021796226501464844, 0.00232851505279541, 0.002477407455444336, 0.0026262998580932617, 0.0027751922607421875, 0.0029240846633911133, 0.003072977066040039, 0.003221869468688965, 0.0033707618713378906, 0.0035196542739868164, 0.003668546676635742, 0.003817439079284668, 0.003966331481933594, 0.0041152238845825195, 0.004264116287231445, 0.004413008689880371, 0.004561901092529297, 0.004710793495178223, 0.0048596858978271484, 0.005008578300476074, 0.005157470703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 13.0, 17.0, 25.0, 35.0, 33.0, 38.0, 64.0, 82.0, 103.0, 116.0, 161.0, 234.0, 313.0, 478.0, 755.0, 1194.0, 2115.0, 3695.0, 7223.0, 17853.0, 154577.0, 815050.0, 24722.0, 8759.0, 4371.0, 2362.0, 1418.0, 850.0, 521.0, 363.0, 240.0, 177.0, 140.0, 107.0, 70.0, 65.0, 55.0, 38.0, 31.0, 20.0, 13.0, 11.0, 8.0, 15.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0020847320556640625, -0.002021804451942444, -0.001958876848220825, -0.0018959492444992065, -0.0018330216407775879, -0.0017700940370559692, -0.0017071664333343506, -0.001644238829612732, -0.0015813112258911133, -0.0015183836221694946, -0.001455456018447876, -0.0013925284147262573, -0.0013296008110046387, -0.00126667320728302, -0.0012037456035614014, -0.0011408179998397827, -0.001077890396118164, -0.0010149627923965454, -0.0009520351886749268, -0.0008891075849533081, -0.0008261799812316895, -0.0007632523775100708, -0.0007003247737884521, -0.0006373971700668335, -0.0005744695663452148, -0.0005115419626235962, -0.00044861435890197754, -0.0003856867551803589, -0.00032275915145874023, -0.0002598315477371216, -0.00019690394401550293, -0.00013397634029388428, -7.104873657226562e-05, -8.121132850646973e-06, 5.480647087097168e-05, 0.00011773407459259033, 0.00018066167831420898, 0.00024358928203582764, 0.0003065168857574463, 0.00036944448947906494, 0.0004323720932006836, 0.0004952996969223022, 0.0005582273006439209, 0.0006211549043655396, 0.0006840825080871582, 0.0007470101118087769, 0.0008099377155303955, 0.0008728653192520142, 0.0009357929229736328, 0.0009987205266952515, 0.0010616481304168701, 0.0011245757341384888, 0.0011875033378601074, 0.001250430941581726, 0.0013133585453033447, 0.0013762861490249634, 0.001439213752746582, 0.0015021413564682007, 0.0015650689601898193, 0.001627996563911438, 0.0016909241676330566, 0.0017538517713546753, 0.001816779375076294, 0.0018797069787979126, 0.0019426345825195312]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 6.0, 6.0, 0.0, 12.0, 22.0, 0.0, 28.0, 39.0, 0.0, 68.0, 87.0, 0.0, 133.0, 0.0, 198.0, 121.0, 0.0, 105.0, 64.0, 0.0, 39.0, 26.0, 0.0, 19.0, 12.0, 0.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.212581992149353e-06, -1.173466444015503e-06, -1.1343508958816528e-06, -1.0952353477478027e-06, -1.0561197996139526e-06, -1.0170042514801025e-06, -9.778887033462524e-07, -9.387731552124023e-07, -8.996576070785522e-07, -8.605420589447021e-07, -8.21426510810852e-07, -7.82310962677002e-07, -7.431954145431519e-07, -7.040798664093018e-07, -6.649643182754517e-07, -6.258487701416016e-07, -5.867332220077515e-07, -5.476176738739014e-07, -5.085021257400513e-07, -4.6938657760620117e-07, -4.302710294723511e-07, -3.91155481338501e-07, -3.520399332046509e-07, -3.129243850708008e-07, -2.738088369369507e-07, -2.3469328880310059e-07, -1.955777406692505e-07, -1.564621925354004e-07, -1.1734664440155029e-07, -7.82310962677002e-08, -3.91155481338501e-08, 0.0, 3.91155481338501e-08, 7.82310962677002e-08, 1.1734664440155029e-07, 1.564621925354004e-07, 1.955777406692505e-07, 2.3469328880310059e-07, 2.738088369369507e-07, 3.129243850708008e-07, 3.520399332046509e-07, 3.91155481338501e-07, 4.302710294723511e-07, 4.6938657760620117e-07, 5.085021257400513e-07, 5.476176738739014e-07, 5.867332220077515e-07, 6.258487701416016e-07, 6.649643182754517e-07, 7.040798664093018e-07, 7.431954145431519e-07, 7.82310962677002e-07, 8.21426510810852e-07, 8.605420589447021e-07, 8.996576070785522e-07, 9.387731552124023e-07, 9.778887033462524e-07, 1.0170042514801025e-06, 1.0561197996139526e-06, 1.0952353477478027e-06, 1.1343508958816528e-06, 1.173466444015503e-06, 1.212581992149353e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 12.0, 14.0, 18.0, 30.0, 34.0, 47.0, 77.0, 85.0, 142.0, 161.0, 218.0, 312.0, 452.0, 604.0, 780.0, 1133.0, 1639.0, 2402.0, 3837.0, 6562.0, 11985.0, 27678.0, 830481.0, 116550.0, 18384.0, 9196.0, 5359.0, 3165.0, 2135.0, 1375.0, 1060.0, 679.0, 523.0, 387.0, 268.0, 198.0, 142.0, 105.0, 97.0, 64.0, 38.0, 34.0, 26.0, 13.0, 10.0, 9.0, 7.0, 3.0, 7.0, 2.0, 1.0, 3.0], "bins": [-0.0018892288208007812, -0.0018349438905715942, -0.0017806589603424072, -0.0017263740301132202, -0.0016720890998840332, -0.0016178041696548462, -0.0015635192394256592, -0.0015092343091964722, -0.0014549493789672852, -0.0014006644487380981, -0.0013463795185089111, -0.0012920945882797241, -0.0012378096580505371, -0.00118352472782135, -0.001129239797592163, -0.001074954867362976, -0.001020669937133789, -0.000966385006904602, -0.000912100076675415, -0.000857815146446228, -0.000803530216217041, -0.000749245285987854, -0.000694960355758667, -0.00064067542552948, -0.000586390495300293, -0.000532105565071106, -0.00047782063484191895, -0.00042353570461273193, -0.0003692507743835449, -0.0003149658441543579, -0.0002606809139251709, -0.0002063959836959839, -0.00015211105346679688, -9.782612323760986e-05, -4.354119300842285e-05, 1.074373722076416e-05, 6.502866744995117e-05, 0.00011931359767913818, 0.0001735985279083252, 0.0002278834581375122, 0.0002821683883666992, 0.00033645331859588623, 0.00039073824882507324, 0.00044502317905426025, 0.0004993081092834473, 0.0005535930395126343, 0.0006078779697418213, 0.0006621628999710083, 0.0007164478302001953, 0.0007707327604293823, 0.0008250176906585693, 0.0008793026208877563, 0.0009335875511169434, 0.0009878724813461304, 0.0010421574115753174, 0.0010964423418045044, 0.0011507272720336914, 0.0012050122022628784, 0.0012592971324920654, 0.0013135820627212524, 0.0013678669929504395, 0.0014221519231796265, 0.0014764368534088135, 0.0015307217836380005, 0.0015850067138671875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 0.0, 1.0, 5.0, 2.0, 10.0, 8.0, 9.0, 8.0, 10.0, 27.0, 153.0, 574.0, 95.0, 29.0, 8.0, 13.0, 5.0, 6.0, 9.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005717277526855469, -0.000554598867893219, -0.0005374699831008911, -0.0005203410983085632, -0.0005032122135162354, -0.00048608332872390747, -0.0004689544439315796, -0.0004518255591392517, -0.00043469667434692383, -0.00041756778955459595, -0.00040043890476226807, -0.0003833100199699402, -0.0003661811351776123, -0.0003490522503852844, -0.00033192336559295654, -0.00031479448080062866, -0.0002976655960083008, -0.0002805367112159729, -0.000263407826423645, -0.00024627894163131714, -0.00022915005683898926, -0.00021202117204666138, -0.0001948922872543335, -0.00017776340246200562, -0.00016063451766967773, -0.00014350563287734985, -0.00012637674808502197, -0.00010924786329269409, -9.211897850036621e-05, -7.499009370803833e-05, -5.786120891571045e-05, -4.073232412338257e-05, -2.3603439331054688e-05, -6.474554538726807e-06, 1.0654330253601074e-05, 2.7783215045928955e-05, 4.4912099838256836e-05, 6.204098463058472e-05, 7.91698694229126e-05, 9.629875421524048e-05, 0.00011342763900756836, 0.00013055652379989624, 0.00014768540859222412, 0.000164814293384552, 0.00018194317817687988, 0.00019907206296920776, 0.00021620094776153564, 0.00023332983255386353, 0.0002504587173461914, 0.0002675876021385193, 0.00028471648693084717, 0.00030184537172317505, 0.00031897425651550293, 0.0003361031413078308, 0.0003532320261001587, 0.00037036091089248657, 0.00038748979568481445, 0.00040461868047714233, 0.0004217475652694702, 0.0004388764500617981, 0.000456005334854126, 0.00047313421964645386, 0.0004902631044387817, 0.0005073919892311096, 0.0005245208740234375]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0, 5.0, 11.0, 10.0, 13.0, 23.0, 29.0, 40.0, 48.0, 59.0, 95.0, 96.0, 108.0, 90.0, 85.0, 68.0, 55.0, 41.0, 25.0, 23.0, 16.0, 10.0, 7.0, 13.0, 7.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014963689260184765, -0.014568050391972065, -0.01417241245508194, -0.01377677358686924, -0.01338113471865654, -0.012985496781766415, -0.012589857913553715, -0.01219421997666359, -0.01179858110845089, -0.01140294224023819, -0.011007304303348064, -0.010611665435135365, -0.010216026566922665, -0.00982038863003254, -0.00942474976181984, -0.00902911089360714, -0.00863347202539444, -0.00823783315718174, -0.007842195220291615, -0.007446556352078915, -0.007050917949527502, -0.0066552795469760895, -0.00625964067876339, -0.005864002276211977, -0.005468363873660564, -0.005072725471109152, -0.004677086602896452, -0.004281448200345039, -0.003885809797793627, -0.0034901711624115705, -0.0030945325270295143, -0.0026988941244781017, -0.002303255721926689, -0.0019076172029599547, -0.0015119786839932203, -0.001116340048611164, -0.0007207015296444297, -0.0003250630106776953, 7.057562470436096e-05, 0.00046621402725577354, 0.0008618526626378298, 0.0012574911816045642, 0.0016531297005712986, 0.002048768335953355, 0.002444406971335411, 0.0028400453738868237, 0.00323568400926888, 0.0036313224118202925, 0.004026961047202349, 0.004422599449753761, 0.004818238317966461, 0.005213876720517874, 0.005609515123069286, 0.006005153991281986, 0.006400792393833399, 0.006796430796384811, 0.007192069664597511, 0.007587708067148924, 0.007983346469700336, 0.008378985337913036, 0.008774624206125736, 0.009170262143015862, 0.009565901011228561, 0.009961539879441261, 0.010357177816331387]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 3.0, 3.0, 7.0, 9.0, 12.0, 19.0, 14.0, 15.0, 17.0, 16.0, 31.0, 32.0, 20.0, 29.0, 40.0, 34.0, 33.0, 36.0, 41.0, 39.0, 41.0, 49.0, 47.0, 41.0, 33.0, 42.0, 33.0, 32.0, 32.0, 27.0, 21.0, 26.0, 20.0, 19.0, 16.0, 10.0, 5.0, 5.0, 11.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007256050128489733, -0.007025315426290035, -0.006794581189751625, -0.006563846487551928, -0.00633311178535223, -0.00610237754881382, -0.005871642846614122, -0.005640908144414425, -0.005410173442214727, -0.00517943874001503, -0.00494870450347662, -0.004717969801276922, -0.004487235099077225, -0.0042565008625388145, -0.004025766160339117, -0.0037950314581394196, -0.0035642969887703657, -0.003333562519401312, -0.0031028278172016144, -0.0028720933478325605, -0.002641358645632863, -0.002410624176263809, -0.0021798894740641117, -0.0019491550046950579, -0.0017184204189106822, -0.0014876858331263065, -0.0012569512473419309, -0.0010262166615575552, -0.0007954821339808404, -0.0005647476064041257, -0.00033401302061975, -0.00010327843483537436, 0.0001274561509490013, 0.000358190736733377, 0.0005889253225177526, 0.0008196598500944674, 0.001050394494086504, 0.0012811289634555578, 0.0015118635492399335, 0.0017425981350243092, 0.0019733328372240067, 0.0022040673065930605, 0.002434802008792758, 0.002665536478161812, 0.0028962711803615093, 0.003127005649730563, 0.003357740119099617, 0.0035884748212993145, 0.0038192092906683683, 0.004049943760037422, 0.00428067846223712, 0.004511413164436817, 0.004742147400975227, 0.004972882103174925, 0.005203616805374622, 0.0054343510419130325, 0.00566508574411273, 0.0058958204463124275, 0.006126554682850838, 0.006357289385050535, 0.006588024087250233, 0.006818758323788643, 0.00704949302598834, 0.007280227728188038, 0.007510962430387735]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 11.0, 13.0, 16.0, 14.0, 35.0, 53.0, 68.0, 132.0, 200.0, 300.0, 455.0, 686.0, 1138.0, 1712.0, 2742.0, 4348.0, 7254.0, 12688.0, 22054.0, 41295.0, 80776.0, 170517.0, 463031.0, 1636357.0, 1153666.0, 318497.0, 131924.0, 65074.0, 34010.0, 18556.0, 10750.0, 6112.0, 3786.0, 2292.0, 1419.0, 846.0, 523.0, 314.0, 218.0, 135.0, 91.0, 58.0, 31.0, 24.0, 14.0, 12.0, 11.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.01100921630859375, -0.010663390159606934, -0.010317564010620117, -0.0099717378616333, -0.009625911712646484, -0.009280085563659668, -0.008934259414672852, -0.008588433265686035, -0.008242607116699219, -0.007896780967712402, -0.007550954818725586, -0.0072051286697387695, -0.006859302520751953, -0.006513476371765137, -0.00616765022277832, -0.005821824073791504, -0.0054759979248046875, -0.005130171775817871, -0.004784345626831055, -0.004438519477844238, -0.004092693328857422, -0.0037468671798706055, -0.003401041030883789, -0.0030552148818969727, -0.0027093887329101562, -0.00236356258392334, -0.0020177364349365234, -0.001671910285949707, -0.0013260841369628906, -0.0009802579879760742, -0.0006344318389892578, -0.0002886056900024414, 5.7220458984375e-05, 0.0004030466079711914, 0.0007488727569580078, 0.0010946989059448242, 0.0014405250549316406, 0.001786351203918457, 0.0021321773529052734, 0.00247800350189209, 0.0028238296508789062, 0.0031696557998657227, 0.003515481948852539, 0.0038613080978393555, 0.004207134246826172, 0.004552960395812988, 0.004898786544799805, 0.005244612693786621, 0.0055904388427734375, 0.005936264991760254, 0.00628209114074707, 0.006627917289733887, 0.006973743438720703, 0.0073195695877075195, 0.007665395736694336, 0.008011221885681152, 0.008357048034667969, 0.008702874183654785, 0.009048700332641602, 0.009394526481628418, 0.009740352630615234, 0.01008617877960205, 0.010432004928588867, 0.010777831077575684, 0.0111236572265625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 10.0, 6.0, 8.0, 11.0, 15.0, 18.0, 10.0, 22.0, 27.0, 28.0, 35.0, 24.0, 26.0, 27.0, 40.0, 40.0, 29.0, 42.0, 55.0, 41.0, 42.0, 40.0, 44.0, 45.0, 39.0, 36.0, 39.0, 25.0, 24.0, 27.0, 27.0, 10.0, 17.0, 10.0, 17.0, 7.0, 8.0, 5.0, 11.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.005092620849609375, -0.004947483539581299, -0.004802346229553223, -0.0046572089195251465, -0.00451207160949707, -0.004366934299468994, -0.004221796989440918, -0.004076659679412842, -0.003931522369384766, -0.0037863850593566895, -0.0036412477493286133, -0.003496110439300537, -0.003350973129272461, -0.0032058358192443848, -0.0030606985092163086, -0.0029155611991882324, -0.0027704238891601562, -0.00262528657913208, -0.002480149269104004, -0.0023350119590759277, -0.0021898746490478516, -0.0020447373390197754, -0.0018996000289916992, -0.001754462718963623, -0.0016093254089355469, -0.0014641880989074707, -0.0013190507888793945, -0.0011739134788513184, -0.0010287761688232422, -0.000883638858795166, -0.0007385015487670898, -0.0005933642387390137, -0.0004482269287109375, -0.00030308961868286133, -0.00015795230865478516, -1.2814998626708984e-05, 0.0001323223114013672, 0.00027745962142944336, 0.00042259693145751953, 0.0005677342414855957, 0.0007128715515136719, 0.000858008861541748, 0.0010031461715698242, 0.0011482834815979004, 0.0012934207916259766, 0.0014385581016540527, 0.001583695411682129, 0.001728832721710205, 0.0018739700317382812, 0.0020191073417663574, 0.0021642446517944336, 0.0023093819618225098, 0.002454519271850586, 0.002599656581878662, 0.0027447938919067383, 0.0028899312019348145, 0.0030350685119628906, 0.003180205821990967, 0.003325343132019043, 0.003470480442047119, 0.0036156177520751953, 0.0037607550621032715, 0.0039058923721313477, 0.004051029682159424, 0.0041961669921875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 17.0, 21.0, 31.0, 28.0, 83.0, 114.0, 141.0, 245.0, 431.0, 593.0, 925.0, 1489.0, 2281.0, 3754.0, 6083.0, 10097.0, 17865.0, 33255.0, 65827.0, 143627.0, 348488.0, 967402.0, 1574675.0, 586044.0, 226213.0, 98054.0, 47458.0, 24468.0, 13646.0, 7851.0, 4873.0, 2943.0, 1923.0, 1179.0, 706.0, 525.0, 356.0, 192.0, 127.0, 82.0, 55.0, 35.0, 27.0, 17.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0089111328125, -0.008626103401184082, -0.008341073989868164, -0.008056044578552246, -0.007771015167236328, -0.00748598575592041, -0.007200956344604492, -0.006915926933288574, -0.006630897521972656, -0.006345868110656738, -0.00606083869934082, -0.005775809288024902, -0.005490779876708984, -0.005205750465393066, -0.0049207210540771484, -0.0046356916427612305, -0.0043506622314453125, -0.0040656328201293945, -0.0037806034088134766, -0.0034955739974975586, -0.0032105445861816406, -0.0029255151748657227, -0.0026404857635498047, -0.0023554563522338867, -0.0020704269409179688, -0.0017853975296020508, -0.0015003681182861328, -0.0012153387069702148, -0.0009303092956542969, -0.0006452798843383789, -0.00036025047302246094, -7.522106170654297e-05, 0.000209808349609375, 0.000494837760925293, 0.0007798671722412109, 0.001064896583557129, 0.0013499259948730469, 0.0016349554061889648, 0.0019199848175048828, 0.0022050142288208008, 0.0024900436401367188, 0.0027750730514526367, 0.0030601024627685547, 0.0033451318740844727, 0.0036301612854003906, 0.003915190696716309, 0.0042002201080322266, 0.0044852495193481445, 0.0047702789306640625, 0.0050553083419799805, 0.0053403377532958984, 0.005625367164611816, 0.005910396575927734, 0.006195425987243652, 0.00648045539855957, 0.006765484809875488, 0.007050514221191406, 0.007335543632507324, 0.007620573043823242, 0.00790560245513916, 0.008190631866455078, 0.008475661277770996, 0.008760690689086914, 0.009045720100402832, 0.00933074951171875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 6.0, 10.0, 11.0, 18.0, 16.0, 23.0, 28.0, 30.0, 35.0, 45.0, 65.0, 73.0, 101.0, 107.0, 113.0, 175.0, 194.0, 230.0, 261.0, 300.0, 324.0, 314.0, 264.0, 211.0, 191.0, 141.0, 155.0, 118.0, 94.0, 78.0, 55.0, 44.0, 54.0, 32.0, 26.0, 25.0, 21.0, 15.0, 15.0, 11.0, 9.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0026454925537109375, -0.0025686025619506836, -0.0024917125701904297, -0.0024148225784301758, -0.002337932586669922, -0.002261042594909668, -0.002184152603149414, -0.00210726261138916, -0.0020303726196289062, -0.0019534826278686523, -0.0018765926361083984, -0.0017997026443481445, -0.0017228126525878906, -0.0016459226608276367, -0.0015690326690673828, -0.001492142677307129, -0.001415252685546875, -0.001338362693786621, -0.0012614727020263672, -0.0011845827102661133, -0.0011076927185058594, -0.0010308027267456055, -0.0009539127349853516, -0.0008770227432250977, -0.0008001327514648438, -0.0007232427597045898, -0.0006463527679443359, -0.000569462776184082, -0.0004925727844238281, -0.0004156827926635742, -0.0003387928009033203, -0.0002619028091430664, -0.0001850128173828125, -0.0001081228256225586, -3.123283386230469e-05, 4.565715789794922e-05, 0.00012254714965820312, 0.00019943714141845703, 0.00027632713317871094, 0.00035321712493896484, 0.00043010711669921875, 0.0005069971084594727, 0.0005838871002197266, 0.0006607770919799805, 0.0007376670837402344, 0.0008145570755004883, 0.0008914470672607422, 0.0009683370590209961, 0.00104522705078125, 0.001122117042541504, 0.0011990070343017578, 0.0012758970260620117, 0.0013527870178222656, 0.0014296770095825195, 0.0015065670013427734, 0.0015834569931030273, 0.0016603469848632812, 0.0017372369766235352, 0.001814126968383789, 0.001891016960144043, 0.001967906951904297, 0.0020447969436645508, 0.0021216869354248047, 0.0021985769271850586, 0.0022754669189453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 16.0, 17.0, 33.0, 72.0, 96.0, 130.0, 122.0, 152.0, 95.0, 77.0, 54.0, 33.0, 22.0, 10.0, 14.0, 14.0, 8.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.015667475759983063, -0.015302004292607307, -0.014936532825231552, -0.014571061357855797, -0.014205589890480042, -0.013840118423104286, -0.013474646955728531, -0.013109175488352776, -0.01274370402097702, -0.012378232553601265, -0.01201276108622551, -0.011647289618849754, -0.011281818151473999, -0.010916346684098244, -0.010550875216722488, -0.010185403749346733, -0.009819931350648403, -0.009454459883272648, -0.009088988415896893, -0.008723516948521137, -0.008358045481145382, -0.007992574013769627, -0.007627102080732584, -0.007261630613356829, -0.006896159145981073, -0.006530687678605318, -0.006165216211229563, -0.00579974427819252, -0.005434272810816765, -0.0050688013434410095, -0.004703329876065254, -0.004337858408689499, -0.003972386475652456, -0.003606915008276701, -0.0032414435409009457, -0.0028759718406945467, -0.0025105003733187914, -0.002145028905943036, -0.0017795572057366371, -0.0014140857383608818, -0.0010486142709851265, -0.0006831427454017103, -0.00031767121981829405, 4.780036397278309e-05, 0.0004132718313485384, 0.0007787432987242937, 0.0011442149989306927, 0.001509686466306448, 0.0018751579336822033, 0.0022406294010579586, 0.002606100868433714, 0.002971572568640113, 0.003337044036015868, 0.0037025155033916235, 0.0040679872035980225, 0.004433458670973778, 0.004798930138349533, 0.005164401605725288, 0.005529873073101044, 0.005895344540476799, 0.006260816007852554, 0.00662628747522831, 0.006991759408265352, 0.0073572308756411076, 0.007722702343016863]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 5.0, 14.0, 14.0, 10.0, 17.0, 13.0, 15.0, 22.0, 24.0, 30.0, 22.0, 30.0, 36.0, 43.0, 32.0, 30.0, 41.0, 49.0, 55.0, 40.0, 35.0, 36.0, 37.0, 34.0, 40.0, 23.0, 17.0, 44.0, 29.0, 23.0, 17.0, 16.0, 19.0, 11.0, 17.0, 14.0, 8.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.005259410012513399, -0.005107425153255463, -0.004955440293997526, -0.00480345543473959, -0.004651470575481653, -0.004499485716223717, -0.00434750085696578, -0.004195515997707844, -0.004043531138449907, -0.003891546279191971, -0.0037395614199340343, -0.003587576560676098, -0.0034355917014181614, -0.003283606842160225, -0.0031316219829022884, -0.002979637123644352, -0.0028276522643864155, -0.002675667405128479, -0.0025236825458705425, -0.002371697686612606, -0.0022197128273546696, -0.002067727968096733, -0.0019157431088387966, -0.0017637582495808601, -0.0016117733903229237, -0.0014597885310649872, -0.0013078036718070507, -0.0011558188125491142, -0.0010038339532911777, -0.0008518490940332413, -0.0006998642347753048, -0.0005478793755173683, -0.00039589498192071915, -0.00024391012266278267, -9.192526340484619e-05, 6.0059595853090286e-05, 0.00021204445511102676, 0.00036402931436896324, 0.0005160141736268997, 0.0006679990328848362, 0.0008199838921427727, 0.0009719687514007092, 0.0011239536106586456, 0.001275938469916582, 0.0014279233291745186, 0.001579908188432455, 0.0017318930476903915, 0.001883877906948328, 0.0020358627662062645, 0.002187847625464201, 0.0023398324847221375, 0.002491817343980074, 0.0026438022032380104, 0.002795787062495947, 0.0029477719217538834, 0.00309975678101182, 0.0032517416402697563, 0.003403726499527693, 0.0035557113587856293, 0.0037076962180435658, 0.0038596810773015022, 0.004011665936559439, 0.004163650795817375, 0.004315635655075312, 0.004467620514333248]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 10.0, 4.0, 10.0, 11.0, 8.0, 19.0, 39.0, 56.0, 68.0, 126.0, 175.0, 276.0, 410.0, 700.0, 1270.0, 2177.0, 4437.0, 8898.0, 19654.0, 45805.0, 115626.0, 331072.0, 322722.0, 112304.0, 44799.0, 19237.0, 8913.0, 4388.0, 2189.0, 1249.0, 668.0, 445.0, 264.0, 156.0, 113.0, 82.0, 58.0, 37.0, 22.0, 20.0, 12.0, 13.0, 8.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031566619873046875, -0.003047764301300049, -0.00293886661529541, -0.0028299689292907715, -0.002721071243286133, -0.002612173557281494, -0.0025032758712768555, -0.002394378185272217, -0.002285480499267578, -0.0021765828132629395, -0.0020676851272583008, -0.001958787441253662, -0.0018498897552490234, -0.0017409920692443848, -0.001632094383239746, -0.0015231966972351074, -0.0014142990112304688, -0.00130540132522583, -0.0011965036392211914, -0.0010876059532165527, -0.000978708267211914, -0.0008698105812072754, -0.0007609128952026367, -0.000652015209197998, -0.0005431175231933594, -0.0004342198371887207, -0.00032532215118408203, -0.00021642446517944336, -0.00010752677917480469, 1.3709068298339844e-06, 0.00011026859283447266, 0.00021916627883911133, 0.00032806396484375, 0.00043696165084838867, 0.0005458593368530273, 0.000654757022857666, 0.0007636547088623047, 0.0008725523948669434, 0.000981450080871582, 0.0010903477668762207, 0.0011992454528808594, 0.001308143138885498, 0.0014170408248901367, 0.0015259385108947754, 0.001634836196899414, 0.0017437338829040527, 0.0018526315689086914, 0.00196152925491333, 0.0020704269409179688, 0.0021793246269226074, 0.002288222312927246, 0.0023971199989318848, 0.0025060176849365234, 0.002614915370941162, 0.0027238130569458008, 0.0028327107429504395, 0.002941608428955078, 0.003050506114959717, 0.0031594038009643555, 0.003268301486968994, 0.003377199172973633, 0.0034860968589782715, 0.00359499454498291, 0.003703892230987549, 0.0038127899169921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 5.0, 12.0, 8.0, 14.0, 12.0, 14.0, 17.0, 16.0, 16.0, 19.0, 29.0, 22.0, 31.0, 34.0, 47.0, 32.0, 37.0, 46.0, 54.0, 47.0, 42.0, 43.0, 33.0, 41.0, 51.0, 25.0, 22.0, 23.0, 26.0, 23.0, 30.0, 24.0, 22.0, 15.0, 15.0, 7.0, 13.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.005859375, -0.005698859691619873, -0.005538344383239746, -0.005377829074859619, -0.005217313766479492, -0.005056798458099365, -0.004896283149719238, -0.004735767841339111, -0.004575252532958984, -0.004414737224578857, -0.0042542219161987305, -0.0040937066078186035, -0.0039331912994384766, -0.0037726759910583496, -0.0036121606826782227, -0.0034516453742980957, -0.0032911300659179688, -0.003130614757537842, -0.002970099449157715, -0.002809584140777588, -0.002649068832397461, -0.002488553524017334, -0.002328038215637207, -0.00216752290725708, -0.002007007598876953, -0.0018464922904968262, -0.0016859769821166992, -0.0015254616737365723, -0.0013649463653564453, -0.0012044310569763184, -0.0010439157485961914, -0.0008834004402160645, -0.0007228851318359375, -0.0005623698234558105, -0.0004018545150756836, -0.00024133920669555664, -8.082389831542969e-05, 7.969141006469727e-05, 0.00024020671844482422, 0.00040072202682495117, 0.0005612373352050781, 0.0007217526435852051, 0.000882267951965332, 0.001042783260345459, 0.001203298568725586, 0.0013638138771057129, 0.0015243291854858398, 0.0016848444938659668, 0.0018453598022460938, 0.0020058751106262207, 0.0021663904190063477, 0.0023269057273864746, 0.0024874210357666016, 0.0026479363441467285, 0.0028084516525268555, 0.0029689669609069824, 0.0031294822692871094, 0.0032899975776672363, 0.0034505128860473633, 0.0036110281944274902, 0.003771543502807617, 0.003932058811187744, 0.004092574119567871, 0.004253089427947998, 0.004413604736328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 17.0, 14.0, 21.0, 34.0, 34.0, 37.0, 72.0, 111.0, 123.0, 191.0, 283.0, 434.0, 616.0, 934.0, 1392.0, 2131.0, 3543.0, 5702.0, 10294.0, 19863.0, 43056.0, 120124.0, 455318.0, 247272.0, 72210.0, 29547.0, 14603.0, 7853.0, 4572.0, 2777.0, 1774.0, 1170.0, 744.0, 513.0, 322.0, 226.0, 178.0, 125.0, 95.0, 64.0, 52.0, 28.0, 20.0, 15.0, 14.0, 11.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0033512115478515625, -0.0032386481761932373, -0.003126084804534912, -0.003013521432876587, -0.0029009580612182617, -0.0027883946895599365, -0.0026758313179016113, -0.002563267946243286, -0.002450704574584961, -0.0023381412029266357, -0.0022255778312683105, -0.0021130144596099854, -0.00200045108795166, -0.001887887716293335, -0.0017753243446350098, -0.0016627609729766846, -0.0015501976013183594, -0.0014376342296600342, -0.001325070858001709, -0.0012125074863433838, -0.0010999441146850586, -0.0009873807430267334, -0.0008748173713684082, -0.000762253999710083, -0.0006496906280517578, -0.0005371272563934326, -0.0004245638847351074, -0.0003120005130767822, -0.00019943714141845703, -8.687376976013184e-05, 2.568960189819336e-05, 0.00013825297355651855, 0.00025081634521484375, 0.00036337971687316895, 0.00047594308853149414, 0.0005885064601898193, 0.0007010698318481445, 0.0008136332035064697, 0.0009261965751647949, 0.0010387599468231201, 0.0011513233184814453, 0.0012638866901397705, 0.0013764500617980957, 0.001489013433456421, 0.001601576805114746, 0.0017141401767730713, 0.0018267035484313965, 0.0019392669200897217, 0.002051830291748047, 0.002164393663406372, 0.0022769570350646973, 0.0023895204067230225, 0.0025020837783813477, 0.002614647150039673, 0.002727210521697998, 0.0028397738933563232, 0.0029523372650146484, 0.0030649006366729736, 0.003177464008331299, 0.003290027379989624, 0.0034025907516479492, 0.0035151541233062744, 0.0036277174949645996, 0.003740280866622925, 0.00385284423828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 14.0, 7.0, 10.0, 10.0, 16.0, 18.0, 23.0, 26.0, 38.0, 32.0, 29.0, 41.0, 38.0, 41.0, 41.0, 53.0, 38.0, 43.0, 31.0, 45.0, 52.0, 31.0, 45.0, 30.0, 37.0, 28.0, 31.0, 19.0, 24.0, 21.0, 18.0, 14.0, 13.0, 12.0, 12.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003604888916015625, -0.0034941136837005615, -0.003383338451385498, -0.0032725632190704346, -0.003161787986755371, -0.0030510127544403076, -0.002940237522125244, -0.0028294622898101807, -0.002718687057495117, -0.0026079118251800537, -0.0024971365928649902, -0.0023863613605499268, -0.0022755861282348633, -0.0021648108959198, -0.0020540356636047363, -0.0019432604312896729, -0.0018324851989746094, -0.001721709966659546, -0.0016109347343444824, -0.001500159502029419, -0.0013893842697143555, -0.001278609037399292, -0.0011678338050842285, -0.001057058572769165, -0.0009462833404541016, -0.0008355081081390381, -0.0007247328758239746, -0.0006139576435089111, -0.0005031824111938477, -0.0003924071788787842, -0.0002816319465637207, -0.00017085671424865723, -6.008148193359375e-05, 5.0693750381469727e-05, 0.0001614689826965332, 0.0002722442150115967, 0.00038301944732666016, 0.0004937946796417236, 0.0006045699119567871, 0.0007153451442718506, 0.0008261203765869141, 0.0009368956089019775, 0.001047670841217041, 0.0011584460735321045, 0.001269221305847168, 0.0013799965381622314, 0.001490771770477295, 0.0016015470027923584, 0.0017123222351074219, 0.0018230974674224854, 0.0019338726997375488, 0.0020446479320526123, 0.0021554231643676758, 0.0022661983966827393, 0.0023769736289978027, 0.002487748861312866, 0.0025985240936279297, 0.002709299325942993, 0.0028200745582580566, 0.00293084979057312, 0.0030416250228881836, 0.003152400255203247, 0.0032631754875183105, 0.003373950719833374, 0.0034847259521484375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 4.0, 5.0, 8.0, 12.0, 21.0, 16.0, 27.0, 36.0, 42.0, 50.0, 84.0, 154.0, 220.0, 302.0, 435.0, 643.0, 1213.0, 1872.0, 2918.0, 5455.0, 11779.0, 34670.0, 215258.0, 674902.0, 63740.0, 17543.0, 7335.0, 3723.0, 2133.0, 1425.0, 843.0, 506.0, 363.0, 274.0, 171.0, 102.0, 70.0, 47.0, 36.0, 35.0, 29.0, 19.0, 11.0, 1.0, 10.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0], "bins": [-0.00045299530029296875, -0.0004393532872200012, -0.0004257112741470337, -0.00041206926107406616, -0.00039842724800109863, -0.0003847852349281311, -0.0003711432218551636, -0.00035750120878219604, -0.0003438591957092285, -0.000330217182636261, -0.00031657516956329346, -0.00030293315649032593, -0.0002892911434173584, -0.00027564913034439087, -0.00026200711727142334, -0.0002483651041984558, -0.00023472309112548828, -0.00022108107805252075, -0.00020743906497955322, -0.0001937970519065857, -0.00018015503883361816, -0.00016651302576065063, -0.0001528710126876831, -0.00013922899961471558, -0.00012558698654174805, -0.00011194497346878052, -9.830296039581299e-05, -8.466094732284546e-05, -7.101893424987793e-05, -5.73769211769104e-05, -4.373490810394287e-05, -3.0092895030975342e-05, -1.6450881958007812e-05, -2.808868885040283e-06, 1.0833144187927246e-05, 2.4475157260894775e-05, 3.8117170333862305e-05, 5.1759183406829834e-05, 6.540119647979736e-05, 7.904320955276489e-05, 9.268522262573242e-05, 0.00010632723569869995, 0.00011996924877166748, 0.000133611261844635, 0.00014725327491760254, 0.00016089528799057007, 0.0001745373010635376, 0.00018817931413650513, 0.00020182132720947266, 0.00021546334028244019, 0.00022910535335540771, 0.00024274736642837524, 0.0002563893795013428, 0.0002700313925743103, 0.00028367340564727783, 0.00029731541872024536, 0.0003109574317932129, 0.0003245994448661804, 0.00033824145793914795, 0.0003518834710121155, 0.000365525484085083, 0.00037916749715805054, 0.00039280951023101807, 0.0004064515233039856, 0.0004200935363769531]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 4.0, 0.0, 14.0, 0.0, 3.0, 0.0, 25.0, 0.0, 34.0, 0.0, 35.0, 0.0, 52.0, 0.0, 50.0, 0.0, 71.0, 0.0, 75.0, 0.0, 83.0, 0.0, 110.0, 0.0, 92.0, 0.0, 96.0, 0.0, 58.0, 0.0, 50.0, 0.0, 51.0, 0.0, 24.0, 0.0, 24.0, 0.0, 22.0, 0.0, 11.0, 0.0, 10.0, 0.0, 8.0, 0.0, 8.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 18.0, 26.0, 24.0, 43.0, 51.0, 57.0, 96.0, 130.0, 202.0, 312.0, 426.0, 639.0, 979.0, 1486.0, 2530.0, 4001.0, 6592.0, 11339.0, 20188.0, 39182.0, 86467.0, 267947.0, 388230.0, 112596.0, 47674.0, 24222.0, 13182.0, 7509.0, 4668.0, 2698.0, 1697.0, 1149.0, 728.0, 474.0, 288.0, 195.0, 158.0, 99.0, 81.0, 53.0, 33.0, 29.0, 7.0, 19.0, 7.0, 10.0, 1.0, 5.0, 3.0, 3.0, 1.0], "bins": [-0.0005507469177246094, -0.0005350708961486816, -0.0005193948745727539, -0.0005037188529968262, -0.00048804283142089844, -0.0004723668098449707, -0.00045669078826904297, -0.00044101476669311523, -0.0004253387451171875, -0.00040966272354125977, -0.00039398670196533203, -0.0003783106803894043, -0.00036263465881347656, -0.00034695863723754883, -0.0003312826156616211, -0.00031560659408569336, -0.0002999305725097656, -0.0002842545509338379, -0.00026857852935791016, -0.0002529025077819824, -0.0002372264862060547, -0.00022155046463012695, -0.00020587444305419922, -0.00019019842147827148, -0.00017452239990234375, -0.00015884637832641602, -0.00014317035675048828, -0.00012749433517456055, -0.00011181831359863281, -9.614229202270508e-05, -8.046627044677734e-05, -6.479024887084961e-05, -4.9114227294921875e-05, -3.343820571899414e-05, -1.7762184143066406e-05, -2.086162567138672e-06, 1.3589859008789062e-05, 2.9265880584716797e-05, 4.494190216064453e-05, 6.0617923736572266e-05, 7.62939453125e-05, 9.196996688842773e-05, 0.00010764598846435547, 0.0001233220100402832, 0.00013899803161621094, 0.00015467405319213867, 0.0001703500747680664, 0.00018602609634399414, 0.00020170211791992188, 0.0002173781394958496, 0.00023305416107177734, 0.0002487301826477051, 0.0002644062042236328, 0.00028008222579956055, 0.0002957582473754883, 0.000311434268951416, 0.00032711029052734375, 0.0003427863121032715, 0.0003584623336791992, 0.00037413835525512695, 0.0003898143768310547, 0.0004054903984069824, 0.00042116641998291016, 0.0004368424415588379, 0.0004525184631347656]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 7.0, 2.0, 5.0, 2.0, 5.0, 4.0, 8.0, 4.0, 9.0, 12.0, 13.0, 13.0, 14.0, 17.0, 20.0, 20.0, 22.0, 20.0, 26.0, 32.0, 38.0, 53.0, 75.0, 62.0, 64.0, 71.0, 62.0, 46.0, 36.0, 38.0, 30.0, 32.0, 30.0, 20.0, 8.0, 8.0, 16.0, 8.0, 14.0, 8.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001277923583984375, -0.00012394599616527557, -0.00012009963393211365, -0.00011625327169895172, -0.0001124069094657898, -0.00010856054723262787, -0.00010471418499946594, -0.00010086782276630402, -9.702146053314209e-05, -9.317509829998016e-05, -8.932873606681824e-05, -8.548237383365631e-05, -8.163601160049438e-05, -7.778964936733246e-05, -7.394328713417053e-05, -7.00969249010086e-05, -6.625056266784668e-05, -6.240420043468475e-05, -5.855783820152283e-05, -5.47114759683609e-05, -5.0865113735198975e-05, -4.701875150203705e-05, -4.317238926887512e-05, -3.9326027035713196e-05, -3.547966480255127e-05, -3.163330256938934e-05, -2.7786940336227417e-05, -2.394057810306549e-05, -2.0094215869903564e-05, -1.6247853636741638e-05, -1.2401491403579712e-05, -8.555129170417786e-06, -4.708766937255859e-06, -8.624047040939331e-07, 2.983957529067993e-06, 6.8303197622299194e-06, 1.0676681995391846e-05, 1.4523044228553772e-05, 1.8369406461715698e-05, 2.2215768694877625e-05, 2.606213092803955e-05, 2.9908493161201477e-05, 3.37548553943634e-05, 3.760121762752533e-05, 4.1447579860687256e-05, 4.529394209384918e-05, 4.914030432701111e-05, 5.2986666560173035e-05, 5.683302879333496e-05, 6.067939102649689e-05, 6.452575325965881e-05, 6.837211549282074e-05, 7.221847772598267e-05, 7.606483995914459e-05, 7.991120219230652e-05, 8.375756442546844e-05, 8.760392665863037e-05, 9.14502888917923e-05, 9.529665112495422e-05, 9.914301335811615e-05, 0.00010298937559127808, 0.00010683573782444, 0.00011068210005760193, 0.00011452846229076385, 0.00011837482452392578]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 10.0, 18.0, 17.0, 34.0, 59.0, 96.0, 136.0, 129.0, 141.0, 112.0, 70.0, 52.0, 34.0, 21.0, 14.0, 16.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0158377792686224, -0.015469185076653957, -0.015100589953362942, -0.0147319957613945, -0.01436340156942606, -0.013994807377457619, -0.013626212254166603, -0.013257618062198162, -0.012889023870229721, -0.01252042967826128, -0.012151834554970264, -0.011783240363001823, -0.011414646171033382, -0.011046051979064941, -0.010677456855773926, -0.010308862663805485, -0.00994026754051447, -0.009571673348546028, -0.009203078225255013, -0.008834484033286572, -0.00846588984131813, -0.008097294718027115, -0.007728700526058674, -0.007360106334090233, -0.0069915116764605045, -0.006622917018830776, -0.006254322826862335, -0.005885728169232607, -0.005517133511602879, -0.0051485393196344376, -0.004779944662004709, -0.004411350004374981, -0.004042755346745253, -0.003674160921946168, -0.0033055664971470833, -0.002936971839517355, -0.0025683774147182703, -0.0021997829899191856, -0.0018311883322894573, -0.0014625939074903727, -0.001093999482691288, -0.0007254049996845424, -0.00035681051667779684, 1.178402453660965e-05, 0.0003803784493356943, 0.000748972874134779, 0.0011175675317645073, 0.001486161956563592, 0.0018547563813626766, 0.0022233508061617613, 0.002591945230960846, 0.0029605398885905743, 0.003329134313389659, 0.0036977287381887436, 0.004066323395818472, 0.0044349180534482, 0.004803512245416641, 0.0051721069030463696, 0.0055407010950148106, 0.005909295752644539, 0.00627788994461298, 0.006646484602242708, 0.0070150792598724365, 0.0073836734518408775, 0.007752268109470606]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 6.0, 13.0, 16.0, 9.0, 18.0, 14.0, 14.0, 22.0, 26.0, 29.0, 24.0, 32.0, 33.0, 44.0, 32.0, 35.0, 34.0, 55.0, 47.0, 42.0, 38.0, 35.0, 36.0, 35.0, 35.0, 24.0, 23.0, 42.0, 25.0, 23.0, 19.0, 14.0, 21.0, 11.0, 16.0, 14.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.005241374019533396, -0.005089537240564823, -0.0049377004615962505, -0.004785863682627678, -0.004634026437997818, -0.004482189659029245, -0.004330352880060673, -0.0041785161010921, -0.0040266793221235275, -0.003874842543154955, -0.0037230055313557386, -0.003571168752387166, -0.0034193319734185934, -0.003267494961619377, -0.0031156581826508045, -0.002963821403682232, -0.0028119843918830156, -0.002660147612914443, -0.0025083106011152267, -0.002356473822146654, -0.0022046370431780815, -0.002052800264209509, -0.0019009632524102926, -0.00174912647344172, -0.0015972895780578256, -0.0014454526826739311, -0.0012936159037053585, -0.001141779008321464, -0.0009899421129375696, -0.000838105333968997, -0.0006862684385851026, -0.0005344316596165299, -0.0003825947642326355, -0.00023075791250448674, -7.892106077633798e-05, 7.2915805503726e-05, 0.00022475264267995954, 0.00037658947985619307, 0.0005284263752400875, 0.0006802631542086601, 0.0008321000495925546, 0.000983936944976449, 0.0011357737239450216, 0.001287610619328916, 0.0014394475147128105, 0.0015912842936813831, 0.0017431211890652776, 0.0018949579680338502, 0.0020467948634177446, 0.0021986316423863173, 0.0023504686541855335, 0.002502305433154106, 0.0026541422121226788, 0.0028059789910912514, 0.0029578160028904676, 0.0031096527818590403, 0.0032614897936582565, 0.003413326572626829, 0.0035651635844260454, 0.003717000363394618, 0.0038688371423631907, 0.004020674154162407, 0.0041725109331309795, 0.004324347712099552, 0.004476184491068125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 18.0, 22.0, 45.0, 52.0, 76.0, 132.0, 177.0, 292.0, 422.0, 615.0, 926.0, 1396.0, 2153.0, 3280.0, 5030.0, 8000.0, 12441.0, 20308.0, 33432.0, 57313.0, 102226.0, 192382.0, 252234.0, 152593.0, 81673.0, 46569.0, 27676.0, 17028.0, 10793.0, 6620.0, 4367.0, 2866.0, 1884.0, 1148.0, 739.0, 512.0, 363.0, 240.0, 161.0, 125.0, 68.0, 53.0, 30.0, 18.0, 20.0, 7.0, 9.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00844573974609375, -0.008147478103637695, -0.00784921646118164, -0.007550954818725586, -0.007252693176269531, -0.0069544315338134766, -0.006656169891357422, -0.006357908248901367, -0.0060596466064453125, -0.005761384963989258, -0.005463123321533203, -0.0051648616790771484, -0.004866600036621094, -0.004568338394165039, -0.004270076751708984, -0.00397181510925293, -0.003673553466796875, -0.0033752918243408203, -0.0030770301818847656, -0.002778768539428711, -0.0024805068969726562, -0.0021822452545166016, -0.0018839836120605469, -0.0015857219696044922, -0.0012874603271484375, -0.0009891986846923828, -0.0006909370422363281, -0.00039267539978027344, -9.441375732421875e-05, 0.00020384788513183594, 0.0005021095275878906, 0.0008003711700439453, 0.0010986328125, 0.0013968944549560547, 0.0016951560974121094, 0.001993417739868164, 0.0022916793823242188, 0.0025899410247802734, 0.002888202667236328, 0.003186464309692383, 0.0034847259521484375, 0.003782987594604492, 0.004081249237060547, 0.0043795108795166016, 0.004677772521972656, 0.004976034164428711, 0.005274295806884766, 0.00557255744934082, 0.005870819091796875, 0.00616908073425293, 0.006467342376708984, 0.006765604019165039, 0.007063865661621094, 0.0073621273040771484, 0.007660388946533203, 0.007958650588989258, 0.008256912231445312, 0.008555173873901367, 0.008853435516357422, 0.009151697158813477, 0.009449958801269531, 0.009748220443725586, 0.01004648208618164, 0.010344743728637695, 0.01064300537109375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 9.0, 6.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 13.0, 16.0, 20.0, 19.0, 22.0, 24.0, 40.0, 29.0, 42.0, 36.0, 30.0, 41.0, 49.0, 52.0, 44.0, 47.0, 43.0, 32.0, 38.0, 37.0, 29.0, 31.0, 35.0, 28.0, 33.0, 17.0, 18.0, 12.0, 25.0, 15.0, 12.0, 2.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005077362060546875, -0.004934132099151611, -0.004790902137756348, -0.004647672176361084, -0.00450444221496582, -0.004361212253570557, -0.004217982292175293, -0.004074752330780029, -0.003931522369384766, -0.003788292407989502, -0.0036450624465942383, -0.0035018324851989746, -0.003358602523803711, -0.0032153725624084473, -0.0030721426010131836, -0.00292891263961792, -0.0027856826782226562, -0.0026424527168273926, -0.002499222755432129, -0.0023559927940368652, -0.0022127628326416016, -0.002069532871246338, -0.0019263029098510742, -0.0017830729484558105, -0.0016398429870605469, -0.0014966130256652832, -0.0013533830642700195, -0.0012101531028747559, -0.0010669231414794922, -0.0009236931800842285, -0.0007804632186889648, -0.0006372332572937012, -0.0004940032958984375, -0.00035077333450317383, -0.00020754337310791016, -6.431341171264648e-05, 7.891654968261719e-05, 0.00022214651107788086, 0.00036537647247314453, 0.0005086064338684082, 0.0006518363952636719, 0.0007950663566589355, 0.0009382963180541992, 0.0010815262794494629, 0.0012247562408447266, 0.0013679862022399902, 0.001511216163635254, 0.0016544461250305176, 0.0017976760864257812, 0.001940906047821045, 0.0020841360092163086, 0.0022273659706115723, 0.002370595932006836, 0.0025138258934020996, 0.0026570558547973633, 0.002800285816192627, 0.0029435157775878906, 0.0030867457389831543, 0.003229975700378418, 0.0033732056617736816, 0.0035164356231689453, 0.003659665584564209, 0.0038028955459594727, 0.003946125507354736, 0.00408935546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 18.0, 15.0, 43.0, 56.0, 56.0, 107.0, 155.0, 191.0, 298.0, 440.0, 621.0, 1007.0, 1574.0, 2358.0, 3525.0, 5370.0, 8145.0, 12489.0, 19603.0, 30804.0, 50713.0, 85828.0, 148672.0, 224772.0, 180598.0, 105373.0, 62563.0, 37409.0, 23295.0, 14608.0, 9398.0, 6094.0, 4123.0, 2741.0, 1808.0, 1178.0, 809.0, 551.0, 383.0, 247.0, 174.0, 113.0, 64.0, 42.0, 40.0, 25.0, 22.0, 9.0, 10.0, 10.0, 6.0, 1.0, 0.0, 4.0], "bins": [-0.009124755859375, -0.008853912353515625, -0.00858306884765625, -0.008312225341796875, -0.0080413818359375, -0.007770538330078125, -0.00749969482421875, -0.007228851318359375, -0.0069580078125, -0.006687164306640625, -0.00641632080078125, -0.006145477294921875, -0.0058746337890625, -0.005603790283203125, -0.00533294677734375, -0.005062103271484375, -0.004791259765625, -0.004520416259765625, -0.00424957275390625, -0.003978729248046875, -0.0037078857421875, -0.003437042236328125, -0.00316619873046875, -0.002895355224609375, -0.00262451171875, -0.002353668212890625, -0.00208282470703125, -0.001811981201171875, -0.0015411376953125, -0.001270294189453125, -0.00099945068359375, -0.000728607177734375, -0.000457763671875, -0.000186920166015625, 8.392333984375e-05, 0.000354766845703125, 0.0006256103515625, 0.000896453857421875, 0.00116729736328125, 0.001438140869140625, 0.001708984375, 0.001979827880859375, 0.00225067138671875, 0.002521514892578125, 0.0027923583984375, 0.003063201904296875, 0.00333404541015625, 0.003604888916015625, 0.003875732421875, 0.004146575927734375, 0.00441741943359375, 0.004688262939453125, 0.0049591064453125, 0.005229949951171875, 0.00550079345703125, 0.005771636962890625, 0.00604248046875, 0.006313323974609375, 0.00658416748046875, 0.006855010986328125, 0.0071258544921875, 0.007396697998046875, 0.00766754150390625, 0.007938385009765625, 0.008209228515625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 6.0, 10.0, 11.0, 7.0, 15.0, 15.0, 21.0, 26.0, 12.0, 26.0, 22.0, 20.0, 16.0, 31.0, 24.0, 22.0, 38.0, 42.0, 32.0, 35.0, 36.0, 44.0, 33.0, 30.0, 27.0, 38.0, 42.0, 36.0, 31.0, 24.0, 28.0, 23.0, 28.0, 22.0, 12.0, 19.0, 10.0, 9.0, 12.0, 9.0, 14.0, 1.0, 5.0, 8.0, 2.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0026874542236328125, -0.00260886549949646, -0.0025302767753601074, -0.002451688051223755, -0.0023730993270874023, -0.00229451060295105, -0.0022159218788146973, -0.0021373331546783447, -0.002058744430541992, -0.0019801557064056396, -0.0019015669822692871, -0.0018229782581329346, -0.001744389533996582, -0.0016658008098602295, -0.001587212085723877, -0.0015086233615875244, -0.0014300346374511719, -0.0013514459133148193, -0.0012728571891784668, -0.0011942684650421143, -0.0011156797409057617, -0.0010370910167694092, -0.0009585022926330566, -0.0008799135684967041, -0.0008013248443603516, -0.000722736120223999, -0.0006441473960876465, -0.0005655586719512939, -0.0004869699478149414, -0.00040838122367858887, -0.00032979249954223633, -0.0002512037754058838, -0.00017261505126953125, -9.402632713317871e-05, -1.5437602996826172e-05, 6.315112113952637e-05, 0.0001417398452758789, 0.00022032856941223145, 0.000298917293548584, 0.0003775060176849365, 0.00045609474182128906, 0.0005346834659576416, 0.0006132721900939941, 0.0006918609142303467, 0.0007704496383666992, 0.0008490383625030518, 0.0009276270866394043, 0.0010062158107757568, 0.0010848045349121094, 0.001163393259048462, 0.0012419819831848145, 0.001320570707321167, 0.0013991594314575195, 0.001477748155593872, 0.0015563368797302246, 0.0016349256038665771, 0.0017135143280029297, 0.0017921030521392822, 0.0018706917762756348, 0.0019492805004119873, 0.00202786922454834, 0.0021064579486846924, 0.002185046672821045, 0.0022636353969573975, 0.00234222412109375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 6.0, 13.0, 7.0, 27.0, 30.0, 41.0, 66.0, 86.0, 138.0, 164.0, 226.0, 350.0, 466.0, 618.0, 807.0, 1168.0, 1613.0, 2270.0, 3498.0, 5875.0, 11765.0, 28862.0, 97255.0, 526002.0, 264396.0, 59120.0, 19909.0, 8785.0, 4850.0, 2976.0, 1996.0, 1436.0, 1033.0, 731.0, 544.0, 410.0, 299.0, 213.0, 131.0, 110.0, 71.0, 55.0, 37.0, 28.0, 27.0, 8.0, 10.0, 12.0, 7.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0008411407470703125, -0.0008169785141944885, -0.0007928162813186646, -0.0007686540484428406, -0.0007444918155670166, -0.0007203295826911926, -0.0006961673498153687, -0.0006720051169395447, -0.0006478428840637207, -0.0006236806511878967, -0.0005995184183120728, -0.0005753561854362488, -0.0005511939525604248, -0.0005270317196846008, -0.0005028694868087769, -0.0004787072539329529, -0.0004545450210571289, -0.00043038278818130493, -0.00040622055530548096, -0.000382058322429657, -0.000357896089553833, -0.00033373385667800903, -0.00030957162380218506, -0.0002854093909263611, -0.0002612471580505371, -0.00023708492517471313, -0.00021292269229888916, -0.00018876045942306519, -0.0001645982265472412, -0.00014043599367141724, -0.00011627376079559326, -9.211152791976929e-05, -6.794929504394531e-05, -4.378706216812134e-05, -1.9624829292297363e-05, 4.537403583526611e-06, 2.8699636459350586e-05, 5.286186933517456e-05, 7.702410221099854e-05, 0.00010118633508682251, 0.00012534856796264648, 0.00014951080083847046, 0.00017367303371429443, 0.0001978352665901184, 0.00022199749946594238, 0.00024615973234176636, 0.00027032196521759033, 0.0002944841980934143, 0.0003186464309692383, 0.00034280866384506226, 0.00036697089672088623, 0.0003911331295967102, 0.0004152953624725342, 0.00043945759534835815, 0.00046361982822418213, 0.0004877820611000061, 0.0005119442939758301, 0.000536106526851654, 0.000560268759727478, 0.000584430992603302, 0.000608593225479126, 0.00063275545835495, 0.0006569176912307739, 0.0006810799241065979, 0.0007052421569824219]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 4.0, 0.0, 7.0, 0.0, 6.0, 0.0, 16.0, 0.0, 0.0, 19.0, 0.0, 42.0, 0.0, 82.0, 0.0, 89.0, 0.0, 161.0, 0.0, 0.0, 150.0, 0.0, 150.0, 0.0, 110.0, 0.0, 74.0, 0.0, 29.0, 0.0, 0.0, 29.0, 0.0, 19.0, 0.0, 12.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.940696716308594e-07, -8.670613169670105e-07, -8.400529623031616e-07, -8.130446076393127e-07, -7.860362529754639e-07, -7.59027898311615e-07, -7.320195436477661e-07, -7.050111889839172e-07, -6.780028343200684e-07, -6.509944796562195e-07, -6.239861249923706e-07, -5.969777703285217e-07, -5.699694156646729e-07, -5.42961061000824e-07, -5.159527063369751e-07, -4.889443516731262e-07, -4.6193599700927734e-07, -4.3492764234542847e-07, -4.079192876815796e-07, -3.809109330177307e-07, -3.5390257835388184e-07, -3.2689422369003296e-07, -2.998858690261841e-07, -2.728775143623352e-07, -2.4586915969848633e-07, -2.1886080503463745e-07, -1.9185245037078857e-07, -1.648440957069397e-07, -1.3783574104309082e-07, -1.1082738637924194e-07, -8.381903171539307e-08, -5.681067705154419e-08, -2.9802322387695312e-08, -2.7939677238464355e-09, 2.421438694000244e-08, 5.122274160385132e-08, 7.82310962677002e-08, 1.0523945093154907e-07, 1.3224780559539795e-07, 1.5925616025924683e-07, 1.862645149230957e-07, 2.1327286958694458e-07, 2.4028122425079346e-07, 2.6728957891464233e-07, 2.942979335784912e-07, 3.213062882423401e-07, 3.4831464290618896e-07, 3.7532299757003784e-07, 4.023313522338867e-07, 4.293397068977356e-07, 4.5634806156158447e-07, 4.833564162254333e-07, 5.103647708892822e-07, 5.373731255531311e-07, 5.6438148021698e-07, 5.913898348808289e-07, 6.183981895446777e-07, 6.454065442085266e-07, 6.724148988723755e-07, 6.994232535362244e-07, 7.264316082000732e-07, 7.534399628639221e-07, 7.80448317527771e-07, 8.074566721916199e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 15.0, 32.0, 42.0, 74.0, 99.0, 152.0, 237.0, 329.0, 576.0, 907.0, 1523.0, 2610.0, 4735.0, 9507.0, 24013.0, 99155.0, 660206.0, 184297.0, 34423.0, 12077.0, 5721.0, 3044.0, 1800.0, 1056.0, 687.0, 413.0, 281.0, 182.0, 125.0, 82.0, 46.0, 40.0, 21.0, 17.0, 10.0, 7.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011205673217773438, -0.0010862499475479126, -0.0010519325733184814, -0.0010176151990890503, -0.0009832978248596191, -0.000948980450630188, -0.0009146630764007568, -0.0008803457021713257, -0.0008460283279418945, -0.0008117109537124634, -0.0007773935794830322, -0.0007430762052536011, -0.0007087588310241699, -0.0006744414567947388, -0.0006401240825653076, -0.0006058067083358765, -0.0005714893341064453, -0.0005371719598770142, -0.000502854585647583, -0.00046853721141815186, -0.0004342198371887207, -0.00039990246295928955, -0.0003655850887298584, -0.00033126771450042725, -0.0002969503402709961, -0.00026263296604156494, -0.0002283155918121338, -0.00019399821758270264, -0.00015968084335327148, -0.00012536346912384033, -9.104609489440918e-05, -5.672872066497803e-05, -2.2411346435546875e-05, 1.1906027793884277e-05, 4.622340202331543e-05, 8.054077625274658e-05, 0.00011485815048217773, 0.0001491755247116089, 0.00018349289894104004, 0.0002178102731704712, 0.00025212764739990234, 0.0002864450216293335, 0.00032076239585876465, 0.0003550797700881958, 0.00038939714431762695, 0.0004237145185470581, 0.00045803189277648926, 0.0004923492670059204, 0.0005266666412353516, 0.0005609840154647827, 0.0005953013896942139, 0.000629618763923645, 0.0006639361381530762, 0.0006982535123825073, 0.0007325708866119385, 0.0007668882608413696, 0.0008012056350708008, 0.0008355230093002319, 0.0008698403835296631, 0.0009041577577590942, 0.0009384751319885254, 0.0009727925062179565, 0.0010071098804473877, 0.0010414272546768188, 0.00107574462890625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 10.0, 11.0, 15.0, 26.0, 33.0, 85.0, 124.0, 215.0, 174.0, 106.0, 63.0, 34.0, 20.0, 20.0, 10.0, 4.0, 7.0, 6.0, 5.0, 9.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003266334533691406, -0.00031667202711105347, -0.0003067106008529663, -0.00029674917459487915, -0.000286787748336792, -0.00027682632207870483, -0.0002668648958206177, -0.0002569034695625305, -0.00024694204330444336, -0.0002369806170463562, -0.00022701919078826904, -0.00021705776453018188, -0.00020709633827209473, -0.00019713491201400757, -0.0001871734857559204, -0.00017721205949783325, -0.0001672506332397461, -0.00015728920698165894, -0.00014732778072357178, -0.00013736635446548462, -0.00012740492820739746, -0.0001174435019493103, -0.00010748207569122314, -9.752064943313599e-05, -8.755922317504883e-05, -7.759779691696167e-05, -6.763637065887451e-05, -5.7674944400787354e-05, -4.7713518142700195e-05, -3.775209188461304e-05, -2.779066562652588e-05, -1.782923936843872e-05, -7.867813110351562e-06, 2.0936131477355957e-06, 1.2055039405822754e-05, 2.2016465663909912e-05, 3.197789192199707e-05, 4.193931818008423e-05, 5.190074443817139e-05, 6.186217069625854e-05, 7.18235969543457e-05, 8.178502321243286e-05, 9.174644947052002e-05, 0.00010170787572860718, 0.00011166930198669434, 0.0001216307282447815, 0.00013159215450286865, 0.0001415535807609558, 0.00015151500701904297, 0.00016147643327713013, 0.00017143785953521729, 0.00018139928579330444, 0.0001913607120513916, 0.00020132213830947876, 0.00021128356456756592, 0.00022124499082565308, 0.00023120641708374023, 0.0002411678433418274, 0.00025112926959991455, 0.0002610906958580017, 0.00027105212211608887, 0.000281013548374176, 0.0002909749746322632, 0.00030093640089035034, 0.0003108978271484375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 6.0, 8.0, 20.0, 20.0, 35.0, 70.0, 121.0, 131.0, 166.0, 138.0, 99.0, 65.0, 40.0, 24.0, 15.0, 14.0, 14.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016416918486356735, -0.016030171886086464, -0.015643423423171043, -0.015256675891578197, -0.014869928359985352, -0.01448318175971508, -0.01409643329679966, -0.013709686696529388, -0.013322939164936543, -0.012936191633343697, -0.01254944410175085, -0.012162696570158005, -0.011775949038565159, -0.011389201506972313, -0.011002454906702042, -0.010615707375109196, -0.01022895984351635, -0.009842212311923504, -0.009455464780330658, -0.009068717248737812, -0.008681969717144966, -0.008295223116874695, -0.007908474653959274, -0.007521728053689003, -0.0071349795907735825, -0.0067482320591807365, -0.006361484527587891, -0.005974736995995045, -0.005587989930063486, -0.00520124239847064, -0.004814494866877794, -0.004427747800946236, -0.00404100026935339, -0.003654252737760544, -0.0032675054389983416, -0.0028807579074054956, -0.0024940106086432934, -0.0021072630770504475, -0.0017205155454576015, -0.0013337682466953993, -0.0009470207151025534, -0.0005602732999250293, -0.00017352582653984427, 0.00021322164684534073, 0.0005999690620228648, 0.000986716477200389, 0.0013734640087932348, 0.001760211307555437, 0.002146958839148283, 0.002533706370741129, 0.002920453669503331, 0.003307201201096177, 0.0036939484998583794, 0.004080696031451225, 0.004467443563044071, 0.004854191094636917, 0.005240938626229763, 0.005627686157822609, 0.006014433689415455, 0.006401181221008301, 0.006787928286939859, 0.007174675818532705, 0.007561423350125551, 0.00794817041605711, 0.008334917947649956]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 11.0, 7.0, 9.0, 17.0, 16.0, 17.0, 14.0, 18.0, 19.0, 25.0, 27.0, 27.0, 36.0, 31.0, 28.0, 42.0, 34.0, 31.0, 37.0, 42.0, 37.0, 49.0, 42.0, 36.0, 29.0, 36.0, 27.0, 26.0, 35.0, 26.0, 21.0, 29.0, 21.0, 7.0, 19.0, 15.0, 8.0, 9.0, 6.0, 7.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.004762752912938595, -0.004628139082342386, -0.004493525251746178, -0.004358911421149969, -0.0042242975905537605, -0.004089683294296265, -0.003955069463700056, -0.0038204556331038475, -0.003685841802507639, -0.0035512279719114304, -0.003416614141315222, -0.0032820000778883696, -0.003147386247292161, -0.0030127724166959524, -0.0028781583532691, -0.0027435445226728916, -0.002608930692076683, -0.0024743168614804745, -0.002339703030884266, -0.0022050889674574137, -0.002070475136861205, -0.0019358613062649965, -0.0018012473592534661, -0.0016666334122419357, -0.0015320195816457272, -0.0013974057510495186, -0.0012627918040379882, -0.0011281778570264578, -0.0009935640264302492, -0.0008589501376263797, -0.0007243362488225102, -0.0005897223600186408, -0.0004551082383841276, -0.00032049434958025813, -0.00018588046077638865, -5.126657197251916e-05, 8.334731683135033e-05, 0.0002179612056352198, 0.0003525750944390893, 0.0004871889832429588, 0.0006218028720468283, 0.0007564167608506978, 0.0008910306496545672, 0.0010256445966660976, 0.0011602584272623062, 0.0012948722578585148, 0.0014294862048700452, 0.0015641001518815756, 0.0016987139824777842, 0.0018333278130739927, 0.001967941876500845, 0.0021025557070970535, 0.002237169537693262, 0.0023717833682894707, 0.0025063971988856792, 0.0026410112623125315, 0.00277562509290874, 0.0029102389235049486, 0.003044852986931801, 0.0031794668175280094, 0.003314080648124218, 0.0034486944787204266, 0.003583308309316635, 0.0037179223727434874, 0.003852536203339696]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 14.0, 7.0, 10.0, 19.0, 33.0, 35.0, 58.0, 79.0, 112.0, 155.0, 248.0, 387.0, 571.0, 868.0, 1395.0, 2195.0, 3431.0, 5718.0, 9672.0, 16944.0, 31610.0, 65089.0, 153083.0, 516692.0, 1853893.0, 1066170.0, 261860.0, 100792.0, 46657.0, 24310.0, 13228.0, 7487.0, 4368.0, 2627.0, 1644.0, 1004.0, 644.0, 425.0, 260.0, 173.0, 106.0, 79.0, 50.0, 30.0, 19.0, 11.0, 11.0, 4.0, 4.0, 6.0, 0.0, 2.0], "bins": [-0.010162353515625, -0.009885787963867188, -0.009609222412109375, -0.009332656860351562, -0.00905609130859375, -0.008779525756835938, -0.008502960205078125, -0.008226394653320312, -0.0079498291015625, -0.0076732635498046875, -0.007396697998046875, -0.0071201324462890625, -0.00684356689453125, -0.0065670013427734375, -0.006290435791015625, -0.0060138702392578125, -0.0057373046875, -0.0054607391357421875, -0.005184173583984375, -0.0049076080322265625, -0.00463104248046875, -0.0043544769287109375, -0.004077911376953125, -0.0038013458251953125, -0.0035247802734375, -0.0032482147216796875, -0.002971649169921875, -0.0026950836181640625, -0.00241851806640625, -0.0021419525146484375, -0.001865386962890625, -0.0015888214111328125, -0.001312255859375, -0.0010356903076171875, -0.000759124755859375, -0.0004825592041015625, -0.00020599365234375, 7.05718994140625e-05, 0.000347137451171875, 0.0006237030029296875, 0.0009002685546875, 0.0011768341064453125, 0.001453399658203125, 0.0017299652099609375, 0.00200653076171875, 0.0022830963134765625, 0.002559661865234375, 0.0028362274169921875, 0.00311279296875, 0.0033893585205078125, 0.003665924072265625, 0.0039424896240234375, 0.00421905517578125, 0.0044956207275390625, 0.004772186279296875, 0.0050487518310546875, 0.0053253173828125, 0.0056018829345703125, 0.005878448486328125, 0.0061550140380859375, 0.00643157958984375, 0.0067081451416015625, 0.006984710693359375, 0.0072612762451171875, 0.007537841796875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 9.0, 7.0, 9.0, 11.0, 10.0, 15.0, 18.0, 23.0, 18.0, 32.0, 17.0, 24.0, 29.0, 39.0, 44.0, 38.0, 29.0, 31.0, 46.0, 35.0, 37.0, 47.0, 40.0, 48.0, 34.0, 40.0, 27.0, 29.0, 24.0, 20.0, 34.0, 23.0, 21.0, 20.0, 11.0, 10.0, 14.0, 9.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0], "bins": [-0.004108428955078125, -0.003996789455413818, -0.0038851499557495117, -0.003773510456085205, -0.0036618709564208984, -0.003550231456756592, -0.003438591957092285, -0.0033269524574279785, -0.003215312957763672, -0.0031036734580993652, -0.0029920339584350586, -0.002880394458770752, -0.0027687549591064453, -0.0026571154594421387, -0.002545475959777832, -0.0024338364601135254, -0.0023221969604492188, -0.002210557460784912, -0.0020989179611206055, -0.001987278461456299, -0.0018756389617919922, -0.0017639994621276855, -0.001652359962463379, -0.0015407204627990723, -0.0014290809631347656, -0.001317441463470459, -0.0012058019638061523, -0.0010941624641418457, -0.000982522964477539, -0.0008708834648132324, -0.0007592439651489258, -0.0006476044654846191, -0.0005359649658203125, -0.00042432546615600586, -0.0003126859664916992, -0.00020104646682739258, -8.940696716308594e-05, 2.2232532501220703e-05, 0.00013387203216552734, 0.000245511531829834, 0.0003571510314941406, 0.00046879053115844727, 0.0005804300308227539, 0.0006920695304870605, 0.0008037090301513672, 0.0009153485298156738, 0.0010269880294799805, 0.0011386275291442871, 0.0012502670288085938, 0.0013619065284729004, 0.001473546028137207, 0.0015851855278015137, 0.0016968250274658203, 0.001808464527130127, 0.0019201040267944336, 0.0020317435264587402, 0.002143383026123047, 0.0022550225257873535, 0.00236666202545166, 0.002478301525115967, 0.0025899410247802734, 0.00270158052444458, 0.0028132200241088867, 0.0029248595237731934, 0.0030364990234375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 9.0, 13.0, 20.0, 35.0, 45.0, 85.0, 121.0, 185.0, 268.0, 467.0, 762.0, 1173.0, 1891.0, 3306.0, 5454.0, 9266.0, 16138.0, 29687.0, 56162.0, 116422.0, 270864.0, 771380.0, 1765331.0, 677519.0, 244376.0, 106543.0, 52008.0, 27418.0, 15356.0, 8803.0, 5264.0, 3060.0, 1803.0, 1127.0, 725.0, 445.0, 266.0, 187.0, 112.0, 64.0, 44.0, 32.0, 16.0, 10.0, 5.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007663726806640625, -0.007420003414154053, -0.0071762800216674805, -0.006932556629180908, -0.006688833236694336, -0.006445109844207764, -0.006201386451721191, -0.005957663059234619, -0.005713939666748047, -0.005470216274261475, -0.005226492881774902, -0.00498276948928833, -0.004739046096801758, -0.0044953227043151855, -0.004251599311828613, -0.004007875919342041, -0.0037641525268554688, -0.0035204291343688965, -0.0032767057418823242, -0.003032982349395752, -0.0027892589569091797, -0.0025455355644226074, -0.002301812171936035, -0.002058088779449463, -0.0018143653869628906, -0.0015706419944763184, -0.001326918601989746, -0.0010831952095031738, -0.0008394718170166016, -0.0005957484245300293, -0.00035202503204345703, -0.00010830163955688477, 0.0001354217529296875, 0.00037914514541625977, 0.000622868537902832, 0.0008665919303894043, 0.0011103153228759766, 0.0013540387153625488, 0.001597762107849121, 0.0018414855003356934, 0.0020852088928222656, 0.002328932285308838, 0.00257265567779541, 0.0028163790702819824, 0.0030601024627685547, 0.003303825855255127, 0.0035475492477416992, 0.0037912726402282715, 0.004034996032714844, 0.004278719425201416, 0.004522442817687988, 0.0047661662101745605, 0.005009889602661133, 0.005253612995147705, 0.005497336387634277, 0.00574105978012085, 0.005984783172607422, 0.006228506565093994, 0.006472229957580566, 0.006715953350067139, 0.006959676742553711, 0.007203400135040283, 0.0074471235275268555, 0.007690846920013428, 0.0079345703125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 6.0, 2.0, 17.0, 9.0, 24.0, 22.0, 24.0, 28.0, 41.0, 55.0, 62.0, 71.0, 95.0, 121.0, 147.0, 191.0, 222.0, 248.0, 326.0, 387.0, 377.0, 274.0, 262.0, 208.0, 152.0, 126.0, 114.0, 98.0, 77.0, 54.0, 40.0, 59.0, 27.0, 22.0, 20.0, 8.0, 6.0, 14.0, 11.0, 6.0, 6.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0023059844970703125, -0.002237468957901001, -0.0021689534187316895, -0.002100437879562378, -0.0020319223403930664, -0.001963406801223755, -0.0018948912620544434, -0.0018263757228851318, -0.0017578601837158203, -0.0016893446445465088, -0.0016208291053771973, -0.0015523135662078857, -0.0014837980270385742, -0.0014152824878692627, -0.0013467669486999512, -0.0012782514095306396, -0.0012097358703613281, -0.0011412203311920166, -0.001072704792022705, -0.0010041892528533936, -0.000935673713684082, -0.0008671581745147705, -0.000798642635345459, -0.0007301270961761475, -0.0006616115570068359, -0.0005930960178375244, -0.0005245804786682129, -0.00045606493949890137, -0.00038754940032958984, -0.0003190338611602783, -0.0002505183219909668, -0.00018200278282165527, -0.00011348724365234375, -4.4971704483032227e-05, 2.3543834686279297e-05, 9.205937385559082e-05, 0.00016057491302490234, 0.00022909045219421387, 0.0002976059913635254, 0.0003661215305328369, 0.00043463706970214844, 0.00050315260887146, 0.0005716681480407715, 0.000640183687210083, 0.0007086992263793945, 0.0007772147655487061, 0.0008457303047180176, 0.0009142458438873291, 0.0009827613830566406, 0.0010512769222259521, 0.0011197924613952637, 0.0011883080005645752, 0.0012568235397338867, 0.0013253390789031982, 0.0013938546180725098, 0.0014623701572418213, 0.0015308856964111328, 0.0015994012355804443, 0.0016679167747497559, 0.0017364323139190674, 0.001804947853088379, 0.0018734633922576904, 0.001941978931427002, 0.0020104944705963135, 0.002079010009765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 12.0, 15.0, 20.0, 26.0, 27.0, 34.0, 50.0, 58.0, 77.0, 91.0, 99.0, 82.0, 77.0, 58.0, 52.0, 39.0, 33.0, 29.0, 18.0, 14.0, 12.0, 13.0, 10.0, 8.0, 4.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007178177125751972, -0.006970182526856661, -0.0067621879279613495, -0.006554193329066038, -0.006346198730170727, -0.006138204131275415, -0.005930209532380104, -0.00572221539914608, -0.005514220334589481, -0.00530622573569417, -0.005098231136798859, -0.004890236537903547, -0.004682241939008236, -0.004474247340112925, -0.004266252741217613, -0.004058258607983589, -0.003850264009088278, -0.0036422694101929665, -0.003434274811297655, -0.0032262802124023438, -0.0030182856135070324, -0.002810291014611721, -0.0026022966485470533, -0.002394302049651742, -0.0021863074507564306, -0.0019783128518611193, -0.001770318252965808, -0.0015623237704858184, -0.001354329171590507, -0.0011463345726951957, -0.0009383400902152061, -0.0007303454913198948, -0.0005223513580858707, -0.00031435678829438984, -0.00010636221850290895, 0.0001016323221847415, 0.00030962692108005285, 0.0005176215199753642, 0.0007256160024553537, 0.0009336106013506651, 0.0011416052002459764, 0.0013495997991412878, 0.0015575943980365992, 0.0017655888805165887, 0.001973583362996578, 0.0021815779618918896, 0.002389572560787201, 0.0025975671596825123, 0.0028055617585778236, 0.003013556357473135, 0.0032215509563684464, 0.0034295455552637577, 0.003637540154159069, 0.0038455347530543804, 0.004053529351949692, 0.004261523485183716, 0.0044695185497403145, 0.004677513148635626, 0.004885507747530937, 0.0050935023464262486, 0.00530149694532156, 0.005509491544216871, 0.005717486143112183, 0.005925480276346207, 0.006133474875241518]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 8.0, 4.0, 14.0, 4.0, 12.0, 7.0, 8.0, 15.0, 15.0, 23.0, 13.0, 22.0, 27.0, 26.0, 27.0, 33.0, 31.0, 38.0, 38.0, 36.0, 33.0, 32.0, 35.0, 46.0, 39.0, 43.0, 31.0, 34.0, 26.0, 31.0, 34.0, 21.0, 29.0, 25.0, 31.0, 15.0, 16.0, 16.0, 13.0, 10.0, 6.0, 6.0, 10.0, 9.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004247389268130064, -0.004127685911953449, -0.0040079825557768345, -0.0038882791996002197, -0.003768575843423605, -0.00364887248724699, -0.0035291691310703754, -0.0034094657748937607, -0.003289762418717146, -0.003170059062540531, -0.0030503557063639164, -0.0029306523501873016, -0.002810948994010687, -0.002691245637834072, -0.0025715422816574574, -0.0024518389254808426, -0.002332135336473584, -0.0022124319802969694, -0.0020927286241203547, -0.00197302526794374, -0.0018533219117671251, -0.0017336185555905104, -0.0016139150829985738, -0.001494211726821959, -0.0013745083706453443, -0.0012548050144687295, -0.0011351016582921147, -0.0010153981857001781, -0.0008956948877312243, -0.0007759915315546095, -0.0006562881171703339, -0.0005365847609937191, -0.000416881637647748, -0.00029717828147113323, -0.00017747489619068801, -5.7771510910242796e-05, 6.193184526637197e-05, 0.00018163520144298673, 0.0003013386158272624, 0.00042104197200387716, 0.0005407453281804919, 0.0006604486843571067, 0.0007801520405337214, 0.0008998554549179971, 0.0010195588693022728, 0.0011392622254788876, 0.0012589655816555023, 0.001378668937832117, 0.0014983722940087318, 0.0016180756501853466, 0.0017377790063619614, 0.0018574823625385761, 0.001977185718715191, 0.0020968890748918056, 0.0022165924310684204, 0.002336295787245035, 0.00245599914342165, 0.0025757024995982647, 0.0026954058557748795, 0.0028151092119514942, 0.002934812568128109, 0.0030545159243047237, 0.0031742192804813385, 0.0032939226366579533, 0.0034136262256652117]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 2.0, 11.0, 11.0, 19.0, 34.0, 41.0, 63.0, 89.0, 123.0, 171.0, 255.0, 412.0, 542.0, 845.0, 1162.0, 1823.0, 2634.0, 3874.0, 5654.0, 8750.0, 13636.0, 21853.0, 36367.0, 65200.0, 125982.0, 253810.0, 236568.0, 115273.0, 60493.0, 34389.0, 20395.0, 12960.0, 8185.0, 5585.0, 3669.0, 2392.0, 1665.0, 1072.0, 809.0, 535.0, 376.0, 248.0, 200.0, 123.0, 86.0, 56.0, 34.0, 26.0, 16.0, 15.0, 11.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0017452239990234375, -0.0016905814409255981, -0.0016359388828277588, -0.0015812963247299194, -0.00152665376663208, -0.0014720112085342407, -0.0014173686504364014, -0.001362726092338562, -0.0013080835342407227, -0.0012534409761428833, -0.001198798418045044, -0.0011441558599472046, -0.0010895133018493652, -0.0010348707437515259, -0.0009802281856536865, -0.0009255856275558472, -0.0008709430694580078, -0.0008163005113601685, -0.0007616579532623291, -0.0007070153951644897, -0.0006523728370666504, -0.000597730278968811, -0.0005430877208709717, -0.0004884451627731323, -0.00043380260467529297, -0.0003791600465774536, -0.00032451748847961426, -0.0002698749303817749, -0.00021523237228393555, -0.0001605898141860962, -0.00010594725608825684, -5.130469799041748e-05, 3.337860107421875e-06, 5.798041820526123e-05, 0.00011262297630310059, 0.00016726553440093994, 0.0002219080924987793, 0.00027655065059661865, 0.000331193208694458, 0.00038583576679229736, 0.0004404783248901367, 0.0004951208829879761, 0.0005497634410858154, 0.0006044059991836548, 0.0006590485572814941, 0.0007136911153793335, 0.0007683336734771729, 0.0008229762315750122, 0.0008776187896728516, 0.0009322613477706909, 0.0009869039058685303, 0.0010415464639663696, 0.001096189022064209, 0.0011508315801620483, 0.0012054741382598877, 0.001260116696357727, 0.0013147592544555664, 0.0013694018125534058, 0.0014240443706512451, 0.0014786869287490845, 0.0015333294868469238, 0.0015879720449447632, 0.0016426146030426025, 0.001697257161140442, 0.0017518997192382812]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 6.0, 8.0, 6.0, 8.0, 17.0, 14.0, 21.0, 26.0, 18.0, 24.0, 27.0, 26.0, 37.0, 36.0, 26.0, 44.0, 41.0, 46.0, 32.0, 45.0, 35.0, 34.0, 40.0, 36.0, 45.0, 31.0, 28.0, 35.0, 27.0, 20.0, 21.0, 23.0, 16.0, 15.0, 12.0, 9.0, 8.0, 8.0, 7.0, 8.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004421234130859375, -0.004292100667953491, -0.004162967205047607, -0.004033833742141724, -0.00390470027923584, -0.003775566816329956, -0.0036464333534240723, -0.0035172998905181885, -0.0033881664276123047, -0.003259032964706421, -0.003129899501800537, -0.0030007660388946533, -0.0028716325759887695, -0.0027424991130828857, -0.002613365650177002, -0.002484232187271118, -0.0023550987243652344, -0.0022259652614593506, -0.002096831798553467, -0.001967698335647583, -0.0018385648727416992, -0.0017094314098358154, -0.0015802979469299316, -0.0014511644840240479, -0.001322031021118164, -0.0011928975582122803, -0.0010637640953063965, -0.0009346306324005127, -0.0008054971694946289, -0.0006763637065887451, -0.0005472302436828613, -0.00041809678077697754, -0.00028896331787109375, -0.00015982985496520996, -3.069639205932617e-05, 9.843707084655762e-05, 0.0002275705337524414, 0.0003567039966583252, 0.000485837459564209, 0.0006149709224700928, 0.0007441043853759766, 0.0008732378482818604, 0.0010023713111877441, 0.001131504774093628, 0.0012606382369995117, 0.0013897716999053955, 0.0015189051628112793, 0.001648038625717163, 0.0017771720886230469, 0.0019063055515289307, 0.0020354390144348145, 0.0021645724773406982, 0.002293705940246582, 0.002422839403152466, 0.0025519728660583496, 0.0026811063289642334, 0.002810239791870117, 0.002939373254776001, 0.0030685067176818848, 0.0031976401805877686, 0.0033267736434936523, 0.003455907106399536, 0.00358504056930542, 0.0037141740322113037, 0.0038433074951171875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 7.0, 11.0, 10.0, 22.0, 32.0, 55.0, 80.0, 170.0, 319.0, 545.0, 986.0, 1838.0, 3541.0, 7480.0, 15920.0, 38600.0, 118719.0, 492456.0, 254584.0, 66513.0, 24797.0, 10915.0, 5288.0, 2535.0, 1339.0, 772.0, 427.0, 237.0, 143.0, 69.0, 52.0, 24.0, 18.0, 9.0, 14.0, 11.0, 6.0, 2.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027446746826171875, -0.0026381313800811768, -0.002531588077545166, -0.0024250447750091553, -0.0023185014724731445, -0.002211958169937134, -0.002105414867401123, -0.0019988715648651123, -0.0018923282623291016, -0.0017857849597930908, -0.00167924165725708, -0.0015726983547210693, -0.0014661550521850586, -0.0013596117496490479, -0.0012530684471130371, -0.0011465251445770264, -0.0010399818420410156, -0.0009334385395050049, -0.0008268952369689941, -0.0007203519344329834, -0.0006138086318969727, -0.0005072653293609619, -0.00040072202682495117, -0.00029417872428894043, -0.0001876354217529297, -8.109211921691895e-05, 2.5451183319091797e-05, 0.00013199448585510254, 0.00023853778839111328, 0.000345081090927124, 0.00045162439346313477, 0.0005581676959991455, 0.0006647109985351562, 0.000771254301071167, 0.0008777976036071777, 0.0009843409061431885, 0.0010908842086791992, 0.00119742751121521, 0.0013039708137512207, 0.0014105141162872314, 0.0015170574188232422, 0.001623600721359253, 0.0017301440238952637, 0.0018366873264312744, 0.0019432306289672852, 0.002049773931503296, 0.0021563172340393066, 0.0022628605365753174, 0.002369403839111328, 0.002475947141647339, 0.0025824904441833496, 0.0026890337467193604, 0.002795577049255371, 0.002902120351791382, 0.0030086636543273926, 0.0031152069568634033, 0.003221750259399414, 0.003328293561935425, 0.0034348368644714355, 0.0035413801670074463, 0.003647923469543457, 0.0037544667720794678, 0.0038610100746154785, 0.003967553377151489, 0.0040740966796875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 2.0, 10.0, 7.0, 10.0, 13.0, 14.0, 23.0, 21.0, 16.0, 27.0, 40.0, 19.0, 45.0, 35.0, 41.0, 24.0, 34.0, 44.0, 44.0, 32.0, 36.0, 45.0, 38.0, 37.0, 39.0, 30.0, 28.0, 21.0, 28.0, 17.0, 26.0, 23.0, 12.0, 20.0, 18.0, 20.0, 3.0, 10.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00232696533203125, -0.0022462308406829834, -0.002165496349334717, -0.00208476185798645, -0.0020040273666381836, -0.001923292875289917, -0.0018425583839416504, -0.0017618238925933838, -0.0016810894012451172, -0.0016003549098968506, -0.001519620418548584, -0.0014388859272003174, -0.0013581514358520508, -0.0012774169445037842, -0.0011966824531555176, -0.001115947961807251, -0.0010352134704589844, -0.0009544789791107178, -0.0008737444877624512, -0.0007930099964141846, -0.000712275505065918, -0.0006315410137176514, -0.0005508065223693848, -0.00047007203102111816, -0.00038933753967285156, -0.00030860304832458496, -0.00022786855697631836, -0.00014713406562805176, -6.639957427978516e-05, 1.4334917068481445e-05, 9.506940841674805e-05, 0.00017580389976501465, 0.00025653839111328125, 0.00033727288246154785, 0.00041800737380981445, 0.0004987418651580811, 0.0005794763565063477, 0.0006602108478546143, 0.0007409453392028809, 0.0008216798305511475, 0.0009024143218994141, 0.0009831488132476807, 0.0010638833045959473, 0.0011446177959442139, 0.0012253522872924805, 0.001306086778640747, 0.0013868212699890137, 0.0014675557613372803, 0.0015482902526855469, 0.0016290247440338135, 0.00170975923538208, 0.0017904937267303467, 0.0018712282180786133, 0.0019519627094268799, 0.0020326972007751465, 0.002113431692123413, 0.0021941661834716797, 0.0022749006748199463, 0.002355635166168213, 0.0024363696575164795, 0.002517104148864746, 0.0025978386402130127, 0.0026785731315612793, 0.002759307622909546, 0.0028400421142578125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 11.0, 27.0, 23.0, 45.0, 83.0, 125.0, 183.0, 243.0, 405.0, 626.0, 971.0, 1548.0, 2562.0, 4549.0, 8595.0, 17658.0, 45165.0, 191152.0, 619166.0, 95937.0, 30039.0, 13212.0, 6703.0, 3649.0, 2159.0, 1323.0, 777.0, 536.0, 389.0, 237.0, 146.0, 93.0, 65.0, 56.0, 33.0, 19.0, 10.0, 7.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020599365234375, -0.00019871443510055542, -0.00019143521785736084, -0.00018415600061416626, -0.00017687678337097168, -0.0001695975661277771, -0.00016231834888458252, -0.00015503913164138794, -0.00014775991439819336, -0.00014048069715499878, -0.0001332014799118042, -0.00012592226266860962, -0.00011864304542541504, -0.00011136382818222046, -0.00010408461093902588, -9.68053936958313e-05, -8.952617645263672e-05, -8.224695920944214e-05, -7.496774196624756e-05, -6.768852472305298e-05, -6.04093074798584e-05, -5.313009023666382e-05, -4.585087299346924e-05, -3.857165575027466e-05, -3.129243850708008e-05, -2.4013221263885498e-05, -1.6734004020690918e-05, -9.454786777496338e-06, -2.175569534301758e-06, 5.103647708892822e-06, 1.2382864952087402e-05, 1.9662082195281982e-05, 2.6941299438476562e-05, 3.422051668167114e-05, 4.149973392486572e-05, 4.87789511680603e-05, 5.605816841125488e-05, 6.333738565444946e-05, 7.061660289764404e-05, 7.789582014083862e-05, 8.51750373840332e-05, 9.245425462722778e-05, 9.973347187042236e-05, 0.00010701268911361694, 0.00011429190635681152, 0.0001215711236000061, 0.00012885034084320068, 0.00013612955808639526, 0.00014340877532958984, 0.00015068799257278442, 0.000157967209815979, 0.00016524642705917358, 0.00017252564430236816, 0.00017980486154556274, 0.00018708407878875732, 0.0001943632960319519, 0.00020164251327514648, 0.00020892173051834106, 0.00021620094776153564, 0.00022348016500473022, 0.0002307593822479248, 0.00023803859949111938, 0.00024531781673431396, 0.00025259703397750854, 0.0002598762512207031]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 11.0, 3.0, 6.0, 10.0, 10.0, 11.0, 23.0, 15.0, 63.0, 40.0, 42.0, 47.0, 55.0, 55.0, 66.0, 86.0, 111.0, 43.0, 47.0, 42.0, 42.0, 30.0, 30.0, 15.0, 19.0, 8.0, 7.0, 8.0, 4.0, 7.0, 3.0, 5.0, 8.0, 3.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.086162567138672e-06, -2.0191073417663574e-06, -1.952052116394043e-06, -1.8849968910217285e-06, -1.817941665649414e-06, -1.7508864402770996e-06, -1.6838312149047852e-06, -1.6167759895324707e-06, -1.5497207641601562e-06, -1.4826655387878418e-06, -1.4156103134155273e-06, -1.3485550880432129e-06, -1.2814998626708984e-06, -1.214444637298584e-06, -1.1473894119262695e-06, -1.080334186553955e-06, -1.0132789611816406e-06, -9.462237358093262e-07, -8.791685104370117e-07, -8.121132850646973e-07, -7.450580596923828e-07, -6.780028343200684e-07, -6.109476089477539e-07, -5.438923835754395e-07, -4.76837158203125e-07, -4.0978193283081055e-07, -3.427267074584961e-07, -2.7567148208618164e-07, -2.086162567138672e-07, -1.4156103134155273e-07, -7.450580596923828e-08, -7.450580596923828e-09, 5.960464477539063e-08, 1.2665987014770508e-07, 1.9371509552001953e-07, 2.60770320892334e-07, 3.2782554626464844e-07, 3.948807716369629e-07, 4.6193599700927734e-07, 5.289912223815918e-07, 5.960464477539062e-07, 6.631016731262207e-07, 7.301568984985352e-07, 7.972121238708496e-07, 8.642673492431641e-07, 9.313225746154785e-07, 9.98377799987793e-07, 1.0654330253601074e-06, 1.1324882507324219e-06, 1.1995434761047363e-06, 1.2665987014770508e-06, 1.3336539268493652e-06, 1.4007091522216797e-06, 1.4677643775939941e-06, 1.5348196029663086e-06, 1.601874828338623e-06, 1.6689300537109375e-06, 1.735985279083252e-06, 1.8030405044555664e-06, 1.8700957298278809e-06, 1.9371509552001953e-06, 2.0042061805725098e-06, 2.0712614059448242e-06, 2.1383166313171387e-06, 2.205371856689453e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 10.0, 24.0, 29.0, 45.0, 60.0, 92.0, 146.0, 214.0, 321.0, 514.0, 769.0, 1211.0, 1860.0, 2939.0, 4711.0, 7622.0, 12557.0, 21041.0, 36572.0, 69547.0, 144442.0, 355391.0, 193569.0, 86912.0, 44340.0, 25023.0, 14690.0, 8891.0, 5529.0, 3385.0, 2139.0, 1378.0, 878.0, 557.0, 416.0, 240.0, 150.0, 104.0, 81.0, 58.0, 37.0, 23.0, 6.0, 13.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020241737365722656, -0.00019535422325134277, -0.00018829107284545898, -0.0001812279224395752, -0.0001741647720336914, -0.00016710162162780762, -0.00016003847122192383, -0.00015297532081604004, -0.00014591217041015625, -0.00013884902000427246, -0.00013178586959838867, -0.00012472271919250488, -0.0001176595687866211, -0.0001105964183807373, -0.00010353326797485352, -9.647011756896973e-05, -8.940696716308594e-05, -8.234381675720215e-05, -7.528066635131836e-05, -6.821751594543457e-05, -6.115436553955078e-05, -5.409121513366699e-05, -4.70280647277832e-05, -3.9964914321899414e-05, -3.2901763916015625e-05, -2.5838613510131836e-05, -1.8775463104248047e-05, -1.1712312698364258e-05, -4.649162292480469e-06, 2.4139881134033203e-06, 9.47713851928711e-06, 1.65402889251709e-05, 2.3603439331054688e-05, 3.0666589736938477e-05, 3.7729740142822266e-05, 4.4792890548706055e-05, 5.1856040954589844e-05, 5.891919136047363e-05, 6.598234176635742e-05, 7.304549217224121e-05, 8.0108642578125e-05, 8.717179298400879e-05, 9.423494338989258e-05, 0.00010129809379577637, 0.00010836124420166016, 0.00011542439460754395, 0.00012248754501342773, 0.00012955069541931152, 0.0001366138458251953, 0.0001436769962310791, 0.0001507401466369629, 0.00015780329704284668, 0.00016486644744873047, 0.00017192959785461426, 0.00017899274826049805, 0.00018605589866638184, 0.00019311904907226562, 0.00020018219947814941, 0.0002072453498840332, 0.000214308500289917, 0.00022137165069580078, 0.00022843480110168457, 0.00023549795150756836, 0.00024256110191345215, 0.00024962425231933594]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 11.0, 5.0, 6.0, 10.0, 8.0, 11.0, 20.0, 14.0, 19.0, 23.0, 25.0, 25.0, 41.0, 36.0, 56.0, 57.0, 70.0, 69.0, 66.0, 74.0, 42.0, 34.0, 39.0, 36.0, 26.0, 29.0, 24.0, 24.0, 17.0, 21.0, 11.0, 4.0, 7.0, 9.0, 13.0, 5.0, 2.0, 1.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.1484832763671875e-05, -4.0158629417419434e-05, -3.883242607116699e-05, -3.750622272491455e-05, -3.618001937866211e-05, -3.485381603240967e-05, -3.3527612686157227e-05, -3.2201409339904785e-05, -3.0875205993652344e-05, -2.9549002647399902e-05, -2.822279930114746e-05, -2.689659595489502e-05, -2.5570392608642578e-05, -2.4244189262390137e-05, -2.2917985916137695e-05, -2.1591782569885254e-05, -2.0265579223632812e-05, -1.893937587738037e-05, -1.761317253112793e-05, -1.6286969184875488e-05, -1.4960765838623047e-05, -1.3634562492370605e-05, -1.2308359146118164e-05, -1.0982155799865723e-05, -9.655952453613281e-06, -8.32974910736084e-06, -7.0035457611083984e-06, -5.677342414855957e-06, -4.351139068603516e-06, -3.0249357223510742e-06, -1.6987323760986328e-06, -3.725290298461914e-07, 9.5367431640625e-07, 2.2798776626586914e-06, 3.606081008911133e-06, 4.932284355163574e-06, 6.258487701416016e-06, 7.584691047668457e-06, 8.910894393920898e-06, 1.023709774017334e-05, 1.1563301086425781e-05, 1.2889504432678223e-05, 1.4215707778930664e-05, 1.5541911125183105e-05, 1.6868114471435547e-05, 1.8194317817687988e-05, 1.952052116394043e-05, 2.084672451019287e-05, 2.2172927856445312e-05, 2.3499131202697754e-05, 2.4825334548950195e-05, 2.6151537895202637e-05, 2.7477741241455078e-05, 2.880394458770752e-05, 3.013014793395996e-05, 3.14563512802124e-05, 3.2782554626464844e-05, 3.4108757972717285e-05, 3.5434961318969727e-05, 3.676116466522217e-05, 3.808736801147461e-05, 3.941357135772705e-05, 4.073977470397949e-05, 4.2065978050231934e-05, 4.3392181396484375e-05]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 7.0, 9.0, 12.0, 16.0, 18.0, 32.0, 24.0, 48.0, 52.0, 70.0, 80.0, 92.0, 102.0, 78.0, 75.0, 58.0, 30.0, 48.0, 30.0, 17.0, 19.0, 14.0, 11.0, 14.0, 4.0, 7.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007445210590958595, -0.007232679519802332, -0.007020148914307356, -0.0068076178431510925, -0.0065950872376561165, -0.006382556166499853, -0.00617002509534359, -0.005957494489848614, -0.00574496341869235, -0.005532432347536087, -0.005319901742041111, -0.005107370670884848, -0.004894840065389872, -0.004682308994233608, -0.004469778388738632, -0.004257247317582369, -0.0040447162464261055, -0.003832185408100486, -0.003619654569774866, -0.0034071234986186028, -0.003194592660292983, -0.0029820618219673634, -0.0027695309836417437, -0.002557000145316124, -0.002344469539821148, -0.0021319387014955282, -0.0019194077467545867, -0.001706876908428967, -0.0014943459536880255, -0.0012818151153624058, -0.001069284277036786, -0.0008567533222958446, -0.000644222367554903, -0.0004316914710216224, -0.00021916060359217227, -6.629736162722111e-06, 0.0002059011603705585, 0.0004184320569038391, 0.0006309628952294588, 0.0008434938499704003, 0.00105602468829602, 0.0012685555266216397, 0.0014810864813625813, 0.001693617319688201, 0.0019061481580138206, 0.002118679229170084, 0.00233120983466506, 0.0025437409058213234, 0.002756271744146943, 0.002968802582472563, 0.0031813334207981825, 0.003393864259123802, 0.0036063953302800655, 0.0038189261686056852, 0.004031457006931305, 0.004243988078087568, 0.004456518683582544, 0.004669049754738808, 0.004881580360233784, 0.005094111431390047, 0.005306642036885023, 0.0055191731080412865, 0.0057317037135362625, 0.005944234784692526, 0.006156765855848789]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 7.0, 10.0, 10.0, 5.0, 11.0, 8.0, 6.0, 17.0, 14.0, 22.0, 14.0, 22.0, 29.0, 27.0, 25.0, 33.0, 36.0, 36.0, 39.0, 32.0, 30.0, 36.0, 41.0, 44.0, 40.0, 39.0, 31.0, 37.0, 25.0, 31.0, 32.0, 19.0, 28.0, 26.0, 28.0, 17.0, 16.0, 17.0, 13.0, 9.0, 5.0, 7.0, 10.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004233601037412882, -0.004113647621124983, -0.003993694204837084, -0.003873740788549185, -0.0037537873722612858, -0.0036338339559733868, -0.0035138805396854877, -0.0033939271233975887, -0.0032739737071096897, -0.0031540202908217907, -0.0030340668745338917, -0.0029141134582459927, -0.0027941600419580936, -0.0026742066256701946, -0.0025542532093822956, -0.0024342997930943966, -0.0023143466096371412, -0.002194393193349242, -0.002074439777061343, -0.001954486360773444, -0.0018345329444855452, -0.0017145795281976461, -0.001594626228325069, -0.00147467281203717, -0.001354719395749271, -0.001234765979461372, -0.0011148125631734729, -0.0009948592633008957, -0.0008749057888053358, -0.0007549523725174367, -0.0006349990144371986, -0.0005150455981492996, -0.00039509241469204426, -0.00027513899840414524, -0.00015518561122007668, -3.523222403600812e-05, 8.47211922518909e-05, 0.00020467460853978992, 0.000324627966620028, 0.00044458138290792704, 0.000564534799195826, 0.0006844882154837251, 0.0008044416317716241, 0.0009243949898518622, 0.0010443483479321003, 0.0011643017642199993, 0.0012842551805078983, 0.0014042085967957973, 0.0015241620130836964, 0.0016441154293715954, 0.0017640688456594944, 0.0018840222619473934, 0.0020039756782352924, 0.0021239290945231915, 0.0022438825108110905, 0.0023638359270989895, 0.0024837893433868885, 0.0026037427596747875, 0.0027236961759626865, 0.0028436495922505856, 0.0029636030085384846, 0.0030835564248263836, 0.0032035098411142826, 0.0033234632574021816, 0.003443416440859437]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 6.0, 7.0, 15.0, 28.0, 31.0, 31.0, 71.0, 84.0, 118.0, 172.0, 242.0, 401.0, 551.0, 808.0, 1130.0, 1790.0, 2512.0, 3947.0, 5855.0, 8934.0, 13793.0, 20810.0, 33736.0, 54610.0, 89026.0, 145929.0, 198015.0, 172578.0, 111185.0, 66594.0, 41433.0, 25672.0, 16485.0, 10686.0, 7118.0, 4634.0, 3060.0, 2011.0, 1422.0, 929.0, 622.0, 460.0, 317.0, 209.0, 127.0, 124.0, 72.0, 53.0, 34.0, 27.0, 19.0, 15.0, 5.0, 9.0, 4.0, 4.0, 1.0, 4.0, 2.0], "bins": [-0.00742340087890625, -0.007189333438873291, -0.006955265998840332, -0.006721198558807373, -0.006487131118774414, -0.006253063678741455, -0.006018996238708496, -0.005784928798675537, -0.005550861358642578, -0.005316793918609619, -0.00508272647857666, -0.004848659038543701, -0.004614591598510742, -0.004380524158477783, -0.004146456718444824, -0.003912389278411865, -0.0036783218383789062, -0.0034442543983459473, -0.0032101869583129883, -0.0029761195182800293, -0.0027420520782470703, -0.0025079846382141113, -0.0022739171981811523, -0.0020398497581481934, -0.0018057823181152344, -0.0015717148780822754, -0.0013376474380493164, -0.0011035799980163574, -0.0008695125579833984, -0.0006354451179504395, -0.00040137767791748047, -0.00016731023788452148, 6.67572021484375e-05, 0.0003008246421813965, 0.0005348920822143555, 0.0007689595222473145, 0.0010030269622802734, 0.0012370944023132324, 0.0014711618423461914, 0.0017052292823791504, 0.0019392967224121094, 0.0021733641624450684, 0.0024074316024780273, 0.0026414990425109863, 0.0028755664825439453, 0.0031096339225769043, 0.0033437013626098633, 0.0035777688026428223, 0.0038118362426757812, 0.00404590368270874, 0.004279971122741699, 0.004514038562774658, 0.004748106002807617, 0.004982173442840576, 0.005216240882873535, 0.005450308322906494, 0.005684375762939453, 0.005918443202972412, 0.006152510643005371, 0.00638657808303833, 0.006620645523071289, 0.006854712963104248, 0.007088780403137207, 0.007322847843170166, 0.007556915283203125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 7.0, 4.0, 6.0, 2.0, 13.0, 10.0, 6.0, 14.0, 13.0, 19.0, 27.0, 23.0, 25.0, 31.0, 32.0, 26.0, 37.0, 32.0, 37.0, 33.0, 41.0, 38.0, 50.0, 31.0, 39.0, 43.0, 44.0, 32.0, 24.0, 30.0, 29.0, 28.0, 23.0, 26.0, 25.0, 13.0, 9.0, 15.0, 8.0, 14.0, 8.0, 11.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003936767578125, -0.003818124532699585, -0.00369948148727417, -0.003580838441848755, -0.00346219539642334, -0.003343552350997925, -0.0032249093055725098, -0.0031062662601470947, -0.0029876232147216797, -0.0028689801692962646, -0.0027503371238708496, -0.0026316940784454346, -0.0025130510330200195, -0.0023944079875946045, -0.0022757649421691895, -0.0021571218967437744, -0.0020384788513183594, -0.0019198358058929443, -0.0018011927604675293, -0.0016825497150421143, -0.0015639066696166992, -0.0014452636241912842, -0.0013266205787658691, -0.001207977533340454, -0.001089334487915039, -0.000970691442489624, -0.000852048397064209, -0.0007334053516387939, -0.0006147623062133789, -0.0004961192607879639, -0.00037747621536254883, -0.0002588331699371338, -0.00014019012451171875, -2.154707908630371e-05, 9.709596633911133e-05, 0.00021573901176452637, 0.0003343820571899414, 0.00045302510261535645, 0.0005716681480407715, 0.0006903111934661865, 0.0008089542388916016, 0.0009275972843170166, 0.0010462403297424316, 0.0011648833751678467, 0.0012835264205932617, 0.0014021694660186768, 0.0015208125114440918, 0.0016394555568695068, 0.0017580986022949219, 0.001876741647720337, 0.001995384693145752, 0.002114027738571167, 0.002232670783996582, 0.002351313829421997, 0.002469956874847412, 0.002588599920272827, 0.002707242965698242, 0.0028258860111236572, 0.0029445290565490723, 0.0030631721019744873, 0.0031818151473999023, 0.0033004581928253174, 0.0034191012382507324, 0.0035377442836761475, 0.0036563873291015625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 5.0, 6.0, 8.0, 12.0, 15.0, 27.0, 29.0, 74.0, 93.0, 129.0, 204.0, 262.0, 361.0, 513.0, 791.0, 1144.0, 1799.0, 2598.0, 3989.0, 5837.0, 8815.0, 14015.0, 22515.0, 37001.0, 61873.0, 106759.0, 176745.0, 222292.0, 151580.0, 89670.0, 52681.0, 31497.0, 19563.0, 12119.0, 7897.0, 5176.0, 3357.0, 2243.0, 1552.0, 1066.0, 698.0, 484.0, 332.0, 234.0, 175.0, 111.0, 74.0, 57.0, 30.0, 22.0, 18.0, 10.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00818634033203125, -0.007925152778625488, -0.0076639652252197266, -0.007402777671813965, -0.007141590118408203, -0.006880402565002441, -0.00661921501159668, -0.006358027458190918, -0.006096839904785156, -0.0058356523513793945, -0.005574464797973633, -0.005313277244567871, -0.005052089691162109, -0.004790902137756348, -0.004529714584350586, -0.004268527030944824, -0.0040073394775390625, -0.0037461519241333008, -0.003484964370727539, -0.0032237768173217773, -0.0029625892639160156, -0.002701401710510254, -0.002440214157104492, -0.0021790266036987305, -0.0019178390502929688, -0.001656651496887207, -0.0013954639434814453, -0.0011342763900756836, -0.0008730888366699219, -0.0006119012832641602, -0.00035071372985839844, -8.952617645263672e-05, 0.000171661376953125, 0.0004328489303588867, 0.0006940364837646484, 0.0009552240371704102, 0.0012164115905761719, 0.0014775991439819336, 0.0017387866973876953, 0.001999974250793457, 0.0022611618041992188, 0.0025223493576049805, 0.002783536911010742, 0.003044724464416504, 0.0033059120178222656, 0.0035670995712280273, 0.003828287124633789, 0.004089474678039551, 0.0043506622314453125, 0.004611849784851074, 0.004873037338256836, 0.005134224891662598, 0.005395412445068359, 0.005656599998474121, 0.005917787551879883, 0.0061789751052856445, 0.006440162658691406, 0.006701350212097168, 0.00696253776550293, 0.007223725318908691, 0.007484912872314453, 0.007746100425720215, 0.008007287979125977, 0.008268475532531738, 0.0085296630859375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 4.0, 7.0, 8.0, 9.0, 10.0, 11.0, 14.0, 16.0, 13.0, 19.0, 35.0, 36.0, 32.0, 43.0, 36.0, 52.0, 51.0, 52.0, 34.0, 48.0, 41.0, 50.0, 44.0, 29.0, 37.0, 40.0, 30.0, 35.0, 23.0, 20.0, 20.0, 23.0, 13.0, 13.0, 12.0, 7.0, 8.0, 6.0, 3.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026798248291015625, -0.0025913119316101074, -0.0025027990341186523, -0.0024142861366271973, -0.002325773239135742, -0.002237260341644287, -0.002148747444152832, -0.002060234546661377, -0.001971721649169922, -0.0018832087516784668, -0.0017946958541870117, -0.0017061829566955566, -0.0016176700592041016, -0.0015291571617126465, -0.0014406442642211914, -0.0013521313667297363, -0.0012636184692382812, -0.0011751055717468262, -0.001086592674255371, -0.000998079776763916, -0.0009095668792724609, -0.0008210539817810059, -0.0007325410842895508, -0.0006440281867980957, -0.0005555152893066406, -0.00046700239181518555, -0.00037848949432373047, -0.0002899765968322754, -0.0002014636993408203, -0.00011295080184936523, -2.4437904357910156e-05, 6.407499313354492e-05, 0.000152587890625, 0.00024110078811645508, 0.00032961368560791016, 0.00041812658309936523, 0.0005066394805908203, 0.0005951523780822754, 0.0006836652755737305, 0.0007721781730651855, 0.0008606910705566406, 0.0009492039680480957, 0.0010377168655395508, 0.0011262297630310059, 0.001214742660522461, 0.001303255558013916, 0.001391768455505371, 0.0014802813529968262, 0.0015687942504882812, 0.0016573071479797363, 0.0017458200454711914, 0.0018343329429626465, 0.0019228458404541016, 0.0020113587379455566, 0.0020998716354370117, 0.002188384532928467, 0.002276897430419922, 0.002365410327911377, 0.002453923225402832, 0.002542436122894287, 0.002630949020385742, 0.0027194619178771973, 0.0028079748153686523, 0.0028964877128601074, 0.0029850006103515625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 7.0, 10.0, 21.0, 22.0, 54.0, 74.0, 110.0, 164.0, 262.0, 385.0, 538.0, 867.0, 1437.0, 2207.0, 3519.0, 5985.0, 10182.0, 19585.0, 42369.0, 124199.0, 524886.0, 199973.0, 56473.0, 24480.0, 12660.0, 6898.0, 4135.0, 2581.0, 1598.0, 1006.0, 634.0, 423.0, 289.0, 180.0, 110.0, 85.0, 51.0, 34.0, 20.0, 10.0, 3.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0036163330078125, -0.0035055875778198242, -0.0033948421478271484, -0.0032840967178344727, -0.003173351287841797, -0.003062605857849121, -0.0029518604278564453, -0.0028411149978637695, -0.0027303695678710938, -0.002619624137878418, -0.002508878707885742, -0.0023981332778930664, -0.0022873878479003906, -0.002176642417907715, -0.002065896987915039, -0.0019551515579223633, -0.0018444061279296875, -0.0017336606979370117, -0.001622915267944336, -0.0015121698379516602, -0.0014014244079589844, -0.0012906789779663086, -0.0011799335479736328, -0.001069188117980957, -0.0009584426879882812, -0.0008476972579956055, -0.0007369518280029297, -0.0006262063980102539, -0.0005154609680175781, -0.00040471553802490234, -0.00029397010803222656, -0.00018322467803955078, -7.2479248046875e-05, 3.826618194580078e-05, 0.00014901161193847656, 0.00025975704193115234, 0.0003705024719238281, 0.0004812479019165039, 0.0005919933319091797, 0.0007027387619018555, 0.0008134841918945312, 0.000924229621887207, 0.0010349750518798828, 0.0011457204818725586, 0.0012564659118652344, 0.0013672113418579102, 0.001477956771850586, 0.0015887022018432617, 0.0016994476318359375, 0.0018101930618286133, 0.001920938491821289, 0.002031683921813965, 0.0021424293518066406, 0.0022531747817993164, 0.002363920211791992, 0.002474665641784668, 0.0025854110717773438, 0.0026961565017700195, 0.0028069019317626953, 0.002917647361755371, 0.003028392791748047, 0.0031391382217407227, 0.0032498836517333984, 0.0033606290817260742, 0.00347137451171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 19.0, 0.0, 0.0, 21.0, 0.0, 0.0, 39.0, 0.0, 0.0, 59.0, 0.0, 0.0, 110.0, 0.0, 0.0, 84.0, 0.0, 0.0, 117.0, 0.0, 0.0, 121.0, 0.0, 0.0, 125.0, 0.0, 106.0, 0.0, 0.0, 74.0, 0.0, 0.0, 57.0, 0.0, 0.0, 38.0, 0.0, 0.0, 18.0, 0.0, 0.0, 6.0, 0.0, 0.0, 8.0, 0.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.755573511123657e-07, -5.550682544708252e-07, -5.345791578292847e-07, -5.140900611877441e-07, -4.936009645462036e-07, -4.731118679046631e-07, -4.5262277126312256e-07, -4.3213367462158203e-07, -4.116445779800415e-07, -3.91155481338501e-07, -3.7066638469696045e-07, -3.501772880554199e-07, -3.296881914138794e-07, -3.0919909477233887e-07, -2.8870999813079834e-07, -2.682209014892578e-07, -2.477318048477173e-07, -2.2724270820617676e-07, -2.0675361156463623e-07, -1.862645149230957e-07, -1.6577541828155518e-07, -1.4528632164001465e-07, -1.2479722499847412e-07, -1.043081283569336e-07, -8.381903171539307e-08, -6.332993507385254e-08, -4.284083843231201e-08, -2.2351741790771484e-08, -1.862645149230957e-09, 1.862645149230957e-08, 3.91155481338501e-08, 5.960464477539063e-08, 8.009374141693115e-08, 1.0058283805847168e-07, 1.210719347000122e-07, 1.4156103134155273e-07, 1.6205012798309326e-07, 1.825392246246338e-07, 2.0302832126617432e-07, 2.2351741790771484e-07, 2.4400651454925537e-07, 2.644956111907959e-07, 2.849847078323364e-07, 3.0547380447387695e-07, 3.259629011154175e-07, 3.46451997756958e-07, 3.6694109439849854e-07, 3.8743019104003906e-07, 4.079192876815796e-07, 4.284083843231201e-07, 4.4889748096466064e-07, 4.6938657760620117e-07, 4.898756742477417e-07, 5.103647708892822e-07, 5.308538675308228e-07, 5.513429641723633e-07, 5.718320608139038e-07, 5.923211574554443e-07, 6.128102540969849e-07, 6.332993507385254e-07, 6.537884473800659e-07, 6.742775440216064e-07, 6.94766640663147e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 14.0, 12.0, 20.0, 32.0, 29.0, 48.0, 62.0, 109.0, 137.0, 180.0, 270.0, 402.0, 525.0, 765.0, 1060.0, 1466.0, 2085.0, 3113.0, 4603.0, 7296.0, 12300.0, 21977.0, 45452.0, 124325.0, 529708.0, 173085.0, 55094.0, 25883.0, 13876.0, 8193.0, 5177.0, 3396.0, 2352.0, 1563.0, 1151.0, 775.0, 559.0, 387.0, 298.0, 218.0, 167.0, 102.0, 81.0, 61.0, 42.0, 30.0, 15.0, 13.0, 14.0, 10.0, 11.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0036983489990234375, -0.0035813748836517334, -0.0034644007682800293, -0.003347426652908325, -0.003230452537536621, -0.003113478422164917, -0.002996504306793213, -0.002879530191421509, -0.0027625560760498047, -0.0026455819606781006, -0.0025286078453063965, -0.0024116337299346924, -0.0022946596145629883, -0.002177685499191284, -0.00206071138381958, -0.001943737268447876, -0.0018267631530761719, -0.0017097890377044678, -0.0015928149223327637, -0.0014758408069610596, -0.0013588666915893555, -0.0012418925762176514, -0.0011249184608459473, -0.0010079443454742432, -0.0008909702301025391, -0.000773996114730835, -0.0006570219993591309, -0.0005400478839874268, -0.00042307376861572266, -0.00030609965324401855, -0.00018912553787231445, -7.215142250061035e-05, 4.482269287109375e-05, 0.00016179680824279785, 0.00027877092361450195, 0.00039574503898620605, 0.0005127191543579102, 0.0006296932697296143, 0.0007466673851013184, 0.0008636415004730225, 0.0009806156158447266, 0.0010975897312164307, 0.0012145638465881348, 0.0013315379619598389, 0.001448512077331543, 0.001565486192703247, 0.0016824603080749512, 0.0017994344234466553, 0.0019164085388183594, 0.0020333826541900635, 0.0021503567695617676, 0.0022673308849334717, 0.0023843050003051758, 0.00250127911567688, 0.002618253231048584, 0.002735227346420288, 0.002852201461791992, 0.0029691755771636963, 0.0030861496925354004, 0.0032031238079071045, 0.0033200979232788086, 0.0034370720386505127, 0.003554046154022217, 0.003671020269393921, 0.003787994384765625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 5.0, 7.0, 4.0, 5.0, 11.0, 9.0, 14.0, 12.0, 20.0, 26.0, 33.0, 51.0, 55.0, 92.0, 125.0, 111.0, 84.0, 73.0, 45.0, 45.0, 37.0, 24.0, 21.0, 23.0, 8.0, 9.0, 6.0, 3.0, 7.0, 5.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001186370849609375, -0.0011497139930725098, -0.0011130571365356445, -0.0010764002799987793, -0.001039743423461914, -0.0010030865669250488, -0.0009664297103881836, -0.0009297728538513184, -0.0008931159973144531, -0.0008564591407775879, -0.0008198022842407227, -0.0007831454277038574, -0.0007464885711669922, -0.000709831714630127, -0.0006731748580932617, -0.0006365180015563965, -0.0005998611450195312, -0.000563204288482666, -0.0005265474319458008, -0.0004898905754089355, -0.0004532337188720703, -0.0004165768623352051, -0.00037992000579833984, -0.0003432631492614746, -0.0003066062927246094, -0.00026994943618774414, -0.0002332925796508789, -0.00019663572311401367, -0.00015997886657714844, -0.0001233220100402832, -8.666515350341797e-05, -5.0008296966552734e-05, -1.33514404296875e-05, 2.3305416107177734e-05, 5.996227264404297e-05, 9.66191291809082e-05, 0.00013327598571777344, 0.00016993284225463867, 0.0002065896987915039, 0.00024324655532836914, 0.0002799034118652344, 0.0003165602684020996, 0.00035321712493896484, 0.0003898739814758301, 0.0004265308380126953, 0.00046318769454956055, 0.0004998445510864258, 0.000536501407623291, 0.0005731582641601562, 0.0006098151206970215, 0.0006464719772338867, 0.000683128833770752, 0.0007197856903076172, 0.0007564425468444824, 0.0007930994033813477, 0.0008297562599182129, 0.0008664131164550781, 0.0009030699729919434, 0.0009397268295288086, 0.0009763836860656738, 0.001013040542602539, 0.0010496973991394043, 0.0010863542556762695, 0.0011230111122131348, 0.00115966796875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 6.0, 6.0, 4.0, 10.0, 10.0, 11.0, 12.0, 14.0, 30.0, 45.0, 55.0, 48.0, 57.0, 75.0, 77.0, 86.0, 76.0, 64.0, 60.0, 38.0, 48.0, 31.0, 25.0, 23.0, 13.0, 13.0, 14.0, 9.0, 6.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007378107402473688, -0.007154962047934532, -0.006931816227734089, -0.006708670407533646, -0.00648552505299449, -0.006262379698455334, -0.0060392338782548904, -0.005816088058054447, -0.005592942703515291, -0.005369797348976135, -0.005146651528775692, -0.004923505708575249, -0.004700360354036093, -0.004477214999496937, -0.0042540691792964935, -0.00403092335909605, -0.0038077780045568943, -0.0035846324171870947, -0.003361486829817295, -0.0031383412424474955, -0.002915195655077696, -0.0026920500677078962, -0.0024689044803380966, -0.002245758892968297, -0.0020226133055984974, -0.0017994677182286978, -0.0015763221308588982, -0.0013531765434890985, -0.001130030956119299, -0.0009068853687494993, -0.0006837397813796997, -0.0004605941940099001, -0.0002374490723013878, -1.4303484931588173e-05, 0.00020884210243821144, 0.00043198768980801105, 0.0006551332771778107, 0.0008782788645476103, 0.00110142445191741, 0.0013245700392872095, 0.0015477156266570091, 0.0017708612140268087, 0.0019940068013966084, 0.002217152388766408, 0.0024402979761362076, 0.002663443563506007, 0.002886589150875807, 0.0031097347382456064, 0.003332880325615406, 0.0035560259129852057, 0.0037791715003550053, 0.004002316854894161, 0.0042254626750946045, 0.004448608495295048, 0.004671753849834204, 0.00489489920437336, 0.005118045024573803, 0.005341190844774246, 0.005564336199313402, 0.005787481553852558, 0.006010627374053001, 0.006233773194253445, 0.006456918548792601, 0.006680063903331757, 0.0069032097235322]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 3.0, 6.0, 6.0, 7.0, 11.0, 9.0, 4.0, 12.0, 14.0, 14.0, 20.0, 24.0, 32.0, 27.0, 32.0, 30.0, 31.0, 36.0, 44.0, 34.0, 28.0, 45.0, 38.0, 37.0, 47.0, 38.0, 35.0, 38.0, 39.0, 36.0, 36.0, 30.0, 28.0, 24.0, 17.0, 14.0, 10.0, 11.0, 9.0, 10.0, 9.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004350780975073576, -0.0042036292143166065, -0.004056477919220924, -0.003909326158463955, -0.0037621748633682728, -0.0036150231026113033, -0.0034678715746849775, -0.0033207200467586517, -0.003173568518832326, -0.003026416990906, -0.0028792654629796743, -0.0027321139350533485, -0.002584962174296379, -0.002437810879200697, -0.0022906591184437275, -0.0021435075905174017, -0.001996356062591076, -0.00184920453466475, -0.0017020530067384243, -0.0015549013623967767, -0.0014077498344704509, -0.001260598306544125, -0.0011134466622024775, -0.0009662951342761517, -0.0008191436063498259, -0.0006719920784235001, -0.0005248404922895133, -0.0003776889352593571, -0.00023053737822920084, -8.338585030287504e-05, 6.376573583111167e-05, 0.00021091732196509838, 0.0003580693155527115, 0.0005052208434790373, 0.000652372429613024, 0.0007995240157470107, 0.0009466755436733365, 0.0010938270715996623, 0.00124097871594131, 0.0013881302438676357, 0.0015352817717939615, 0.0016824332997202873, 0.0018295848276466131, 0.001976736355572939, 0.0021238881163299084, 0.0022710394114255905, 0.00241819117218256, 0.0025653427001088858, 0.0027124942280352116, 0.0028596457559615374, 0.003006797283887863, 0.003153948811814189, 0.0033011003397405148, 0.003448252100497484, 0.00359540362842381, 0.003742555156350136, 0.0038897066842764616, 0.004036858212202787, 0.004184009972959757, 0.004331161268055439, 0.0044783130288124084, 0.004625464323908091, 0.00477261608466506, 0.004919767379760742, 0.005066919140517712]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 7.0, 7.0, 3.0, 4.0, 5.0, 6.0, 7.0, 11.0, 7.0, 23.0, 23.0, 26.0, 29.0, 33.0, 34.0, 35.0, 43.0, 54.0, 63.0, 64.0, 73.0, 86.0, 137.0, 253.0, 789.0, 2348.0, 517891.0, 1075.0, 312.0, 139.0, 102.0, 75.0, 61.0, 66.0, 46.0, 65.0, 52.0, 55.0, 24.0, 26.0, 25.0, 24.0, 19.0, 9.0, 7.0, 8.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10932926088571548, -0.10569936037063599, -0.10206946730613708, -0.09843956679105759, -0.09480966627597809, -0.09117977321147919, -0.08754987269639969, -0.08391997218132019, -0.08029007911682129, -0.07666017860174179, -0.07303028553724289, -0.06940038502216339, -0.06577049195766449, -0.06214059144258499, -0.05851069092750549, -0.05488079413771629, -0.051250897347927094, -0.047621000558137894, -0.043991103768348694, -0.040361203253269196, -0.036731306463479996, -0.033101409673690796, -0.029471511021256447, -0.025841612368822098, -0.022211715579032898, -0.018581818789243698, -0.014951920136809349, -0.011322022415697575, -0.0076921246945858, -0.0040622279047966, -0.0004323292523622513, 0.0031975694000720978, 0.006827458739280701, 0.010457356460392475, 0.01408725418150425, 0.0177171528339386, 0.0213470496237278, 0.024976946413517, 0.028606845065951347, 0.032236743718385696, 0.035866640508174896, 0.039496537297964096, 0.043126434087753296, 0.046756334602832794, 0.050386231392621994, 0.054016128182411194, 0.05764602869749069, 0.06127592548727989, 0.06490582227706909, 0.06853572279214859, 0.07216561585664749, 0.07579551637172699, 0.07942540943622589, 0.08305530995130539, 0.08668521046638489, 0.09031510353088379, 0.09394500404596329, 0.09757490456104279, 0.10120479762554169, 0.10483469814062119, 0.10846459865570068, 0.11209449172019958, 0.11572439223527908, 0.11935429275035858, 0.12298418581485748]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 9.0, 3.0, 12.0, 6.0, 11.0, 9.0, 19.0, 17.0, 15.0, 17.0, 37.0, 37.0, 27.0, 34.0, 33.0, 43.0, 33.0, 32.0, 43.0, 32.0, 1060.0, 42.0, 41.0, 44.0, 35.0, 45.0, 38.0, 25.0, 33.0, 31.0, 28.0, 22.0, 15.0, 14.0, 14.0, 9.0, 10.0, 5.0, 8.0, 9.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12247154116630554, -0.11824946105480194, -0.11402738094329834, -0.10980530083179474, -0.10558322072029114, -0.10136114060878754, -0.09713905304670334, -0.09291697293519974, -0.08869489282369614, -0.08447281271219254, -0.08025073260068893, -0.07602865248918533, -0.07180656492710114, -0.06758448481559753, -0.06336240470409393, -0.05914032459259033, -0.05491824448108673, -0.05069616436958313, -0.04647408425807953, -0.04225200042128563, -0.03802992030978203, -0.03380784019827843, -0.029585758224129677, -0.025363676249980927, -0.021141596138477325, -0.016919516026973724, -0.012697434052824974, -0.008475353009998798, -0.004253271967172623, -3.1191855669021606e-05, 0.004190890118479729, 0.008412972092628479, 0.012635067105293274, 0.016857147216796875, 0.021079229190945625, 0.025301311165094376, 0.029523391276597977, 0.03374547138810158, 0.03796755522489548, 0.04218963533639908, 0.04641171544790268, 0.05063379555940628, 0.05485587567090988, 0.05907795950770378, 0.06330004334449768, 0.06752212345600128, 0.07174420356750488, 0.07596628367900848, 0.08018836379051208, 0.08441044390201569, 0.08863252401351929, 0.09285460412502289, 0.09707668423652649, 0.10129876434803009, 0.10552085191011429, 0.10974293202161789, 0.11396501213312149, 0.11818709224462509, 0.12240917235612869, 0.1266312599182129, 0.1308533400297165, 0.1350754201412201, 0.1392975002527237, 0.1435195803642273, 0.1477416604757309]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0, 7.0, 5.0, 4.0, 3.0, 7.0, 4.0, 3.0, 6.0, 15.0, 24.0, 32.0, 31.0, 60.0, 95.0, 141.0, 215.0, 306.0, 457.0, 671.0, 829.0, 957.0, 1275.0, 1332.0, 2985.0, 24800.0, 31198388.0, 8836.0, 11081.0, 571.0, 622.0, 125.0, 168.0, 359.0, 16.0, 15.0, 11.0, 8.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-28560.0, -27913.25, -27266.5, -26619.75, -25973.0, -25326.25, -24679.5, -24032.75, -23386.0, -22739.25, -22092.5, -21445.75, -20799.0, -20152.25, -19505.5, -18858.75, -18212.0, -17565.25, -16918.5, -16271.75, -15625.0, -14978.25, -14331.5, -13684.75, -13038.0, -12391.25, -11744.5, -11097.75, -10451.0, -9804.25, -9157.5, -8510.75, -7864.0, -7217.25, -6570.5, -5923.75, -5277.0, -4630.25, -3983.5, -3336.75, -2690.0, -2043.25, -1396.5, -749.75, -103.0, 543.75, 1190.5, 1837.25, 2484.0, 3130.75, 3777.5, 4424.25, 5071.0, 5717.75, 6364.5, 7011.25, 7658.0, 8304.75, 8951.5, 9598.25, 10245.0, 10891.75, 11538.5, 12185.25, 12832.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 8.0, 22.0, 19.0, 27.0, 45.0, 68.0, 81.0, 134.0, 182.0, 275.0, 438.0, 590.0, 807.0, 1369.0, 2274.0, 3563.0, 6140.0, 10666.0, 20237.0, 40434.0, 93162.0, 253119.0, 1103175.0, 4038178.0, 451116.0, 144631.0, 58728.0, 27423.0, 14154.0, 7836.0, 4621.0, 2840.0, 1704.0, 1145.0, 710.0, 460.0, 306.0, 242.0, 156.0, 93.0, 70.0, 50.0, 34.0, 24.0, 22.0, 15.0, 14.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-63.71875, -61.67919921875, -59.6396484375, -57.60009765625, -55.560546875, -53.52099609375, -51.4814453125, -49.44189453125, -47.40234375, -45.36279296875, -43.3232421875, -41.28369140625, -39.244140625, -37.20458984375, -35.1650390625, -33.12548828125, -31.0859375, -29.04638671875, -27.0068359375, -24.96728515625, -22.927734375, -20.88818359375, -18.8486328125, -16.80908203125, -14.76953125, -12.72998046875, -10.6904296875, -8.65087890625, -6.611328125, -4.57177734375, -2.5322265625, -0.49267578125, 1.546875, 3.58642578125, 5.6259765625, 7.66552734375, 9.705078125, 11.74462890625, 13.7841796875, 15.82373046875, 17.86328125, 19.90283203125, 21.9423828125, 23.98193359375, 26.021484375, 28.06103515625, 30.1005859375, 32.14013671875, 34.1796875, 36.21923828125, 38.2587890625, 40.29833984375, 42.337890625, 44.37744140625, 46.4169921875, 48.45654296875, 50.49609375, 52.53564453125, 54.5751953125, 56.61474609375, 58.654296875, 60.69384765625, 62.7333984375, 64.77294921875, 66.8125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 3.0, 7.0, 7.0, 10.0, 16.0, 21.0, 20.0, 23.0, 26.0, 25.0, 32.0, 44.0, 35.0, 54.0, 83.0, 93.0, 145.0, 306.0, 337.0, 165.0, 94.0, 85.0, 60.0, 56.0, 38.0, 42.0, 33.0, 24.0, 24.0, 17.0, 15.0, 6.0, 16.0, 12.0, 10.0, 5.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-55.28125, -53.6083984375, -51.935546875, -50.2626953125, -48.58984375, -46.9169921875, -45.244140625, -43.5712890625, -41.8984375, -40.2255859375, -38.552734375, -36.8798828125, -35.20703125, -33.5341796875, -31.861328125, -30.1884765625, -28.515625, -26.8427734375, -25.169921875, -23.4970703125, -21.82421875, -20.1513671875, -18.478515625, -16.8056640625, -15.1328125, -13.4599609375, -11.787109375, -10.1142578125, -8.44140625, -6.7685546875, -5.095703125, -3.4228515625, -1.75, -0.0771484375, 1.595703125, 3.2685546875, 4.94140625, 6.6142578125, 8.287109375, 9.9599609375, 11.6328125, 13.3056640625, 14.978515625, 16.6513671875, 18.32421875, 19.9970703125, 21.669921875, 23.3427734375, 25.015625, 26.6884765625, 28.361328125, 30.0341796875, 31.70703125, 33.3798828125, 35.052734375, 36.7255859375, 38.3984375, 40.0712890625, 41.744140625, 43.4169921875, 45.08984375, 46.7626953125, 48.435546875, 50.1083984375, 51.78125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 13.0, 19.0, 34.0, 36.0, 52.0, 70.0, 105.0, 141.0, 272.0, 520.0, 984.0, 1704.0, 3301.0, 6712.0, 13957.0, 31247.0, 77852.0, 238785.0, 1240555.0, 4079368.0, 399706.0, 115728.0, 43897.0, 18288.0, 8614.0, 4259.0, 2169.0, 1213.0, 736.0, 427.0, 234.0, 137.0, 100.0, 73.0, 29.0, 27.0, 14.0, 17.0, 21.0, 12.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0], "bins": [-78.9375, -76.6279296875, -74.318359375, -72.0087890625, -69.69921875, -67.3896484375, -65.080078125, -62.7705078125, -60.4609375, -58.1513671875, -55.841796875, -53.5322265625, -51.22265625, -48.9130859375, -46.603515625, -44.2939453125, -41.984375, -39.6748046875, -37.365234375, -35.0556640625, -32.74609375, -30.4365234375, -28.126953125, -25.8173828125, -23.5078125, -21.1982421875, -18.888671875, -16.5791015625, -14.26953125, -11.9599609375, -9.650390625, -7.3408203125, -5.03125, -2.7216796875, -0.412109375, 1.8974609375, 4.20703125, 6.5166015625, 8.826171875, 11.1357421875, 13.4453125, 15.7548828125, 18.064453125, 20.3740234375, 22.68359375, 24.9931640625, 27.302734375, 29.6123046875, 31.921875, 34.2314453125, 36.541015625, 38.8505859375, 41.16015625, 43.4697265625, 45.779296875, 48.0888671875, 50.3984375, 52.7080078125, 55.017578125, 57.3271484375, 59.63671875, 61.9462890625, 64.255859375, 66.5654296875, 68.875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 2.0, 6.0, 10.0, 12.0, 16.0, 21.0, 32.0, 69.0, 87.0, 122.0, 175.0, 294.0, 569.0, 184.0, 110.0, 68.0, 61.0, 56.0, 43.0, 13.0, 13.0, 9.0, 9.0, 3.0, 4.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-83.3125, -80.8154296875, -78.318359375, -75.8212890625, -73.32421875, -70.8271484375, -68.330078125, -65.8330078125, -63.3359375, -60.8388671875, -58.341796875, -55.8447265625, -53.34765625, -50.8505859375, -48.353515625, -45.8564453125, -43.359375, -40.8623046875, -38.365234375, -35.8681640625, -33.37109375, -30.8740234375, -28.376953125, -25.8798828125, -23.3828125, -20.8857421875, -18.388671875, -15.8916015625, -13.39453125, -10.8974609375, -8.400390625, -5.9033203125, -3.40625, -0.9091796875, 1.587890625, 4.0849609375, 6.58203125, 9.0791015625, 11.576171875, 14.0732421875, 16.5703125, 19.0673828125, 21.564453125, 24.0615234375, 26.55859375, 29.0556640625, 31.552734375, 34.0498046875, 36.546875, 39.0439453125, 41.541015625, 44.0380859375, 46.53515625, 49.0322265625, 51.529296875, 54.0263671875, 56.5234375, 59.0205078125, 61.517578125, 64.0146484375, 66.51171875, 69.0087890625, 71.505859375, 74.0029296875, 76.5]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 8.0, 6.0, 5.0, 3.0, 8.0, 7.0, 3.0, 9.0, 9.0, 23.0, 24.0, 43.0, 61.0, 73.0, 81.0, 91.0, 147.0, 210.0, 263.0, 401.0, 599.0, 965.0, 1606.0, 3002.0, 6370.0, 18987.0, 119643.0, 6069191.0, 46903.0, 11884.0, 4687.0, 2302.0, 1245.0, 763.0, 517.0, 351.0, 268.0, 175.0, 124.0, 77.0, 66.0, 55.0, 41.0, 41.0, 31.0, 25.0, 13.0, 5.0, 8.0, 3.0, 8.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-476.75, -461.01171875, -445.2734375, -429.53515625, -413.796875, -398.05859375, -382.3203125, -366.58203125, -350.84375, -335.10546875, -319.3671875, -303.62890625, -287.890625, -272.15234375, -256.4140625, -240.67578125, -224.9375, -209.19921875, -193.4609375, -177.72265625, -161.984375, -146.24609375, -130.5078125, -114.76953125, -99.03125, -83.29296875, -67.5546875, -51.81640625, -36.078125, -20.33984375, -4.6015625, 11.13671875, 26.875, 42.61328125, 58.3515625, 74.08984375, 89.828125, 105.56640625, 121.3046875, 137.04296875, 152.78125, 168.51953125, 184.2578125, 199.99609375, 215.734375, 231.47265625, 247.2109375, 262.94921875, 278.6875, 294.42578125, 310.1640625, 325.90234375, 341.640625, 357.37890625, 373.1171875, 388.85546875, 404.59375, 420.33203125, 436.0703125, 451.80859375, 467.546875, 483.28515625, 499.0234375, 514.76171875, 530.5]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 10.0, 8.0, 14.0, 21.0, 32.0, 55.0, 91.0, 162.0, 302.0, 759.0, 222.0, 103.0, 72.0, 35.0, 22.0, 19.0, 7.0, 8.0, 8.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.25, -113.521484375, -109.79296875, -106.064453125, -102.3359375, -98.607421875, -94.87890625, -91.150390625, -87.421875, -83.693359375, -79.96484375, -76.236328125, -72.5078125, -68.779296875, -65.05078125, -61.322265625, -57.59375, -53.865234375, -50.13671875, -46.408203125, -42.6796875, -38.951171875, -35.22265625, -31.494140625, -27.765625, -24.037109375, -20.30859375, -16.580078125, -12.8515625, -9.123046875, -5.39453125, -1.666015625, 2.0625, 5.791015625, 9.51953125, 13.248046875, 16.9765625, 20.705078125, 24.43359375, 28.162109375, 31.890625, 35.619140625, 39.34765625, 43.076171875, 46.8046875, 50.533203125, 54.26171875, 57.990234375, 61.71875, 65.447265625, 69.17578125, 72.904296875, 76.6328125, 80.361328125, 84.08984375, 87.818359375, 91.546875, 95.275390625, 99.00390625, 102.732421875, 106.4609375, 110.189453125, 113.91796875, 117.646484375, 121.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 12.0, 17.0, 27.0, 60.0, 815.0, 42.0, 18.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1196.569580078125, -1147.4462890625, -1098.3228759765625, -1049.1995849609375, -1000.076171875, -950.952880859375, -901.8295288085938, -852.7061767578125, -803.5828247070312, -754.45947265625, -705.3361206054688, -656.2127685546875, -607.0894775390625, -557.966064453125, -508.8427734375, -459.71942138671875, -410.5960693359375, -361.47271728515625, -312.349365234375, -263.2260437011719, -214.10269165039062, -164.97933959960938, -115.85601806640625, -66.732666015625, -17.60931396484375, 31.51403045654297, 80.63737487792969, 129.76071166992188, 178.88406372070312, 228.00741577148438, 277.1307373046875, 326.25408935546875, 375.3773193359375, 424.50067138671875, 473.6240234375, 522.747314453125, 571.8707275390625, 620.9940185546875, 670.1173706054688, 719.24072265625, 768.3640747070312, 817.4874267578125, 866.6107788085938, 915.734130859375, 964.857421875, 1013.9808349609375, 1063.1041259765625, 1112.2275390625, 1161.350830078125, 1210.47412109375, 1259.5975341796875, 1308.7208251953125, 1357.84423828125, 1406.967529296875, 1456.0908203125, 1505.2142333984375, 1554.337646484375, 1603.4609375, 1652.5843505859375, 1701.7076416015625, 1750.8310546875, 1799.954345703125, 1849.07763671875, 1898.2010498046875, 1947.3243408203125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 7.0, 15.0, 11.0, 12.0, 42.0, 158.0, 367.0, 248.0, 60.0, 19.0, 14.0, 14.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-622.4904174804688, -607.1726684570312, -591.85498046875, -576.5372314453125, -561.2195434570312, -545.9017944335938, -530.5841064453125, -515.266357421875, -499.94866943359375, -484.6309509277344, -469.313232421875, -453.9955139160156, -438.67779541015625, -423.3600769042969, -408.0423583984375, -392.7246398925781, -377.40692138671875, -362.0892028808594, -346.771484375, -331.4537658691406, -316.13604736328125, -300.8183288574219, -285.5006103515625, -270.1828918457031, -254.86514282226562, -239.54742431640625, -224.22970581054688, -208.9119873046875, -193.59426879882812, -178.27655029296875, -162.95883178710938, -147.64111328125, -132.32339477539062, -117.00567626953125, -101.68795776367188, -86.3702392578125, -71.05252075195312, -55.73479461669922, -40.417076110839844, -25.09935760498047, -9.781639099121094, 5.536080360412598, 20.85379981994629, 36.1715202331543, 51.48923873901367, 66.80696105957031, 82.12467956542969, 97.44239807128906, 112.76011657714844, 128.0778350830078, 143.3955535888672, 158.71327209472656, 174.03099060058594, 189.34872436523438, 204.66644287109375, 219.98416137695312, 235.3018798828125, 250.61959838867188, 265.93731689453125, 281.2550354003906, 296.57275390625, 311.8904724121094, 327.20819091796875, 342.5259094238281, 357.8436279296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 12.0, 16.0, 26.0, 28.0, 37.0, 54.0, 78.0, 81.0, 128.0, 149.0, 207.0, 237.0, 327.0, 471.0, 649.0, 1007.0, 1801.0, 3709.0, 9257.0, 35293.0, 423218.0, 3622716.0, 67462.0, 14292.0, 5977.0, 2946.0, 1575.0, 827.0, 477.0, 301.0, 195.0, 127.0, 97.0, 74.0, 75.0, 65.0, 38.0, 45.0, 28.0, 31.0, 29.0, 17.0, 21.0, 9.0, 10.0, 15.0, 7.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0], "bins": [-17.453125, -16.833984375, -16.21484375, -15.595703125, -14.9765625, -14.357421875, -13.73828125, -13.119140625, -12.5, -11.880859375, -11.26171875, -10.642578125, -10.0234375, -9.404296875, -8.78515625, -8.166015625, -7.546875, -6.927734375, -6.30859375, -5.689453125, -5.0703125, -4.451171875, -3.83203125, -3.212890625, -2.59375, -1.974609375, -1.35546875, -0.736328125, -0.1171875, 0.501953125, 1.12109375, 1.740234375, 2.359375, 2.978515625, 3.59765625, 4.216796875, 4.8359375, 5.455078125, 6.07421875, 6.693359375, 7.3125, 7.931640625, 8.55078125, 9.169921875, 9.7890625, 10.408203125, 11.02734375, 11.646484375, 12.265625, 12.884765625, 13.50390625, 14.123046875, 14.7421875, 15.361328125, 15.98046875, 16.599609375, 17.21875, 17.837890625, 18.45703125, 19.076171875, 19.6953125, 20.314453125, 20.93359375, 21.552734375, 22.171875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 9.0, 29.0, 66.0, 156.0, 266.0, 240.0, 139.0, 48.0, 11.0, 8.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3349609375, -1.288665771484375, -1.24237060546875, -1.196075439453125, -1.1497802734375, -1.103485107421875, -1.05718994140625, -1.010894775390625, -0.964599609375, -0.918304443359375, -0.87200927734375, -0.825714111328125, -0.7794189453125, -0.733123779296875, -0.68682861328125, -0.640533447265625, -0.59423828125, -0.547943115234375, -0.50164794921875, -0.455352783203125, -0.4090576171875, -0.362762451171875, -0.31646728515625, -0.270172119140625, -0.223876953125, -0.177581787109375, -0.13128662109375, -0.084991455078125, -0.0386962890625, 0.007598876953125, 0.05389404296875, 0.100189208984375, 0.146484375, 0.192779541015625, 0.23907470703125, 0.285369873046875, 0.3316650390625, 0.377960205078125, 0.42425537109375, 0.470550537109375, 0.516845703125, 0.563140869140625, 0.60943603515625, 0.655731201171875, 0.7020263671875, 0.748321533203125, 0.79461669921875, 0.840911865234375, 0.88720703125, 0.933502197265625, 0.97979736328125, 1.026092529296875, 1.0723876953125, 1.118682861328125, 1.16497802734375, 1.211273193359375, 1.257568359375, 1.303863525390625, 1.35015869140625, 1.396453857421875, 1.4427490234375, 1.489044189453125, 1.53533935546875, 1.581634521484375, 1.6279296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 9.0, 13.0, 21.0, 22.0, 33.0, 47.0, 88.0, 109.0, 163.0, 267.0, 550.0, 1299.0, 4750.0, 27977.0, 492886.0, 3602016.0, 53573.0, 7021.0, 1827.0, 631.0, 333.0, 197.0, 106.0, 86.0, 63.0, 50.0, 32.0, 23.0, 17.0, 11.0, 11.0, 10.0, 5.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.796875, -20.05859375, -19.3203125, -18.58203125, -17.84375, -17.10546875, -16.3671875, -15.62890625, -14.890625, -14.15234375, -13.4140625, -12.67578125, -11.9375, -11.19921875, -10.4609375, -9.72265625, -8.984375, -8.24609375, -7.5078125, -6.76953125, -6.03125, -5.29296875, -4.5546875, -3.81640625, -3.078125, -2.33984375, -1.6015625, -0.86328125, -0.125, 0.61328125, 1.3515625, 2.08984375, 2.828125, 3.56640625, 4.3046875, 5.04296875, 5.78125, 6.51953125, 7.2578125, 7.99609375, 8.734375, 9.47265625, 10.2109375, 10.94921875, 11.6875, 12.42578125, 13.1640625, 13.90234375, 14.640625, 15.37890625, 16.1171875, 16.85546875, 17.59375, 18.33203125, 19.0703125, 19.80859375, 20.546875, 21.28515625, 22.0234375, 22.76171875, 23.5, 24.23828125, 24.9765625, 25.71484375, 26.453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 10.0, 8.0, 8.0, 13.0, 17.0, 15.0, 29.0, 32.0, 36.0, 54.0, 46.0, 68.0, 117.0, 95.0, 105.0, 150.0, 182.0, 260.0, 960.0, 799.0, 307.0, 194.0, 149.0, 105.0, 65.0, 57.0, 38.0, 38.0, 33.0, 16.0, 22.0, 7.0, 4.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.779296875, -2.7097015380859375, -2.640106201171875, -2.5705108642578125, -2.50091552734375, -2.4313201904296875, -2.361724853515625, -2.2921295166015625, -2.2225341796875, -2.1529388427734375, -2.083343505859375, -2.0137481689453125, -1.94415283203125, -1.8745574951171875, -1.804962158203125, -1.7353668212890625, -1.665771484375, -1.5961761474609375, -1.526580810546875, -1.4569854736328125, -1.38739013671875, -1.3177947998046875, -1.248199462890625, -1.1786041259765625, -1.1090087890625, -1.0394134521484375, -0.969818115234375, -0.9002227783203125, -0.83062744140625, -0.7610321044921875, -0.691436767578125, -0.6218414306640625, -0.55224609375, -0.4826507568359375, -0.413055419921875, -0.3434600830078125, -0.27386474609375, -0.2042694091796875, -0.134674072265625, -0.0650787353515625, 0.0045166015625, 0.0741119384765625, 0.143707275390625, 0.2133026123046875, 0.28289794921875, 0.3524932861328125, 0.422088623046875, 0.4916839599609375, 0.561279296875, 0.6308746337890625, 0.700469970703125, 0.7700653076171875, 0.83966064453125, 0.9092559814453125, 0.978851318359375, 1.0484466552734375, 1.1180419921875, 1.1876373291015625, 1.257232666015625, 1.3268280029296875, 1.39642333984375, 1.4660186767578125, 1.535614013671875, 1.6052093505859375, 1.6748046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 14.0, 24.0, 105.0, 352.0, 493.0, 18.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.35906982421875, -262.137451171875, -255.91586303710938, -249.6942596435547, -243.47265625, -237.2510528564453, -231.02944946289062, -224.80783081054688, -218.58624267578125, -212.36463928222656, -206.14303588867188, -199.9214324951172, -193.6998291015625, -187.4782257080078, -181.25662231445312, -175.03500366210938, -168.8134002685547, -162.591796875, -156.3701934814453, -150.14859008789062, -143.92698669433594, -137.70538330078125, -131.4837646484375, -125.26216888427734, -119.04056549072266, -112.81896209716797, -106.59735870361328, -100.37574768066406, -94.15414428710938, -87.93254089355469, -81.7109375, -75.48933410644531, -69.26773071289062, -63.04612731933594, -56.82452392578125, -50.6029167175293, -44.38131332397461, -38.15970993041992, -31.93810272216797, -25.71649932861328, -19.494895935058594, -13.27329158782959, -7.051687240600586, -0.8300819396972656, 5.391521453857422, 11.61312484741211, 17.834732055664062, 24.05633544921875, 30.277938842773438, 36.499542236328125, 42.72114562988281, 48.942752838134766, 55.16435623168945, 61.38595962524414, 67.6075668334961, 73.82917022705078, 80.05077362060547, 86.27237701416016, 92.49398040771484, 98.71559143066406, 104.93719482421875, 111.15879821777344, 117.38040161132812, 123.60200500488281, 129.8236083984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 14.0, 21.0, 24.0, 23.0, 30.0, 49.0, 49.0, 71.0, 79.0, 80.0, 92.0, 71.0, 76.0, 75.0, 56.0, 43.0, 38.0, 26.0, 22.0, 17.0, 10.0, 9.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.748382568359375, -35.693641662597656, -34.63890075683594, -33.58415985107422, -32.5294189453125, -31.474679946899414, -30.419939041137695, -29.365198135375977, -28.31045913696289, -27.255718231201172, -26.200977325439453, -25.146236419677734, -24.09149742126465, -23.03675651550293, -21.98201560974121, -20.927274703979492, -19.872533798217773, -18.817792892456055, -17.763051986694336, -16.70831298828125, -15.653572082519531, -14.598831176757812, -13.544090270996094, -12.489349365234375, -11.434609413146973, -10.379868507385254, -9.325128555297852, -8.270387649536133, -7.215647220611572, -6.160906791687012, -5.106165885925293, -4.051425457000732, -2.996685028076172, -1.9419444799423218, -0.8872039318084717, 0.16753673553466797, 1.2222771644592285, 2.277017593383789, 3.331758499145508, 4.386498928070068, 5.441239356994629, 6.4959797859191895, 7.55072021484375, 8.605461120605469, 9.660202026367188, 10.71494197845459, 11.769682884216309, 12.824422836303711, 13.87916374206543, 14.933904647827148, 15.98864459991455, 17.043384552001953, 18.098125457763672, 19.15286636352539, 20.20760726928711, 21.262348175048828, 22.317089080810547, 23.371829986572266, 24.426570892333984, 25.481311798095703, 26.53605079650879, 27.590791702270508, 28.645532608032227, 29.700273513793945, 30.75501251220703]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 10.0, 12.0, 15.0, 26.0, 22.0, 30.0, 38.0, 80.0, 99.0, 143.0, 207.0, 292.0, 515.0, 844.0, 1335.0, 2635.0, 5745.0, 21604.0, 197490.0, 746690.0, 52485.0, 9945.0, 3621.0, 1829.0, 1041.0, 585.0, 373.0, 248.0, 175.0, 127.0, 92.0, 57.0, 33.0, 27.0, 20.0, 15.0, 13.0, 12.0, 8.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.2578125, -9.9395751953125, -9.621337890625, -9.3031005859375, -8.98486328125, -8.6666259765625, -8.348388671875, -8.0301513671875, -7.7119140625, -7.3936767578125, -7.075439453125, -6.7572021484375, -6.43896484375, -6.1207275390625, -5.802490234375, -5.4842529296875, -5.166015625, -4.8477783203125, -4.529541015625, -4.2113037109375, -3.89306640625, -3.5748291015625, -3.256591796875, -2.9383544921875, -2.6201171875, -2.3018798828125, -1.983642578125, -1.6654052734375, -1.34716796875, -1.0289306640625, -0.710693359375, -0.3924560546875, -0.07421875, 0.2440185546875, 0.562255859375, 0.8804931640625, 1.19873046875, 1.5169677734375, 1.835205078125, 2.1534423828125, 2.4716796875, 2.7899169921875, 3.108154296875, 3.4263916015625, 3.74462890625, 4.0628662109375, 4.381103515625, 4.6993408203125, 5.017578125, 5.3358154296875, 5.654052734375, 5.9722900390625, 6.29052734375, 6.6087646484375, 6.927001953125, 7.2452392578125, 7.5634765625, 7.8817138671875, 8.199951171875, 8.5181884765625, 8.83642578125, 9.1546630859375, 9.472900390625, 9.7911376953125, 10.109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 11.0, 13.0, 37.0, 74.0, 115.0, 151.0, 183.0, 148.0, 118.0, 52.0, 38.0, 20.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4990234375, -1.46185302734375, -1.4246826171875, -1.38751220703125, -1.350341796875, -1.31317138671875, -1.2760009765625, -1.23883056640625, -1.20166015625, -1.16448974609375, -1.1273193359375, -1.09014892578125, -1.052978515625, -1.01580810546875, -0.9786376953125, -0.94146728515625, -0.904296875, -0.86712646484375, -0.8299560546875, -0.79278564453125, -0.755615234375, -0.71844482421875, -0.6812744140625, -0.64410400390625, -0.60693359375, -0.56976318359375, -0.5325927734375, -0.49542236328125, -0.458251953125, -0.42108154296875, -0.3839111328125, -0.34674072265625, -0.3095703125, -0.27239990234375, -0.2352294921875, -0.19805908203125, -0.160888671875, -0.12371826171875, -0.0865478515625, -0.04937744140625, -0.01220703125, 0.02496337890625, 0.0621337890625, 0.09930419921875, 0.136474609375, 0.17364501953125, 0.2108154296875, 0.24798583984375, 0.28515625, 0.32232666015625, 0.3594970703125, 0.39666748046875, 0.433837890625, 0.47100830078125, 0.5081787109375, 0.54534912109375, 0.58251953125, 0.61968994140625, 0.6568603515625, 0.69403076171875, 0.731201171875, 0.76837158203125, 0.8055419921875, 0.84271240234375, 0.8798828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 3.0, 11.0, 12.0, 20.0, 38.0, 80.0, 140.0, 337.0, 908.0, 3482.0, 29637.0, 933529.0, 72807.0, 5440.0, 1281.0, 429.0, 165.0, 86.0, 45.0, 30.0, 16.0, 14.0, 11.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.59375, -34.64794921875, -33.7021484375, -32.75634765625, -31.810546875, -30.86474609375, -29.9189453125, -28.97314453125, -28.02734375, -27.08154296875, -26.1357421875, -25.18994140625, -24.244140625, -23.29833984375, -22.3525390625, -21.40673828125, -20.4609375, -19.51513671875, -18.5693359375, -17.62353515625, -16.677734375, -15.73193359375, -14.7861328125, -13.84033203125, -12.89453125, -11.94873046875, -11.0029296875, -10.05712890625, -9.111328125, -8.16552734375, -7.2197265625, -6.27392578125, -5.328125, -4.38232421875, -3.4365234375, -2.49072265625, -1.544921875, -0.59912109375, 0.3466796875, 1.29248046875, 2.23828125, 3.18408203125, 4.1298828125, 5.07568359375, 6.021484375, 6.96728515625, 7.9130859375, 8.85888671875, 9.8046875, 10.75048828125, 11.6962890625, 12.64208984375, 13.587890625, 14.53369140625, 15.4794921875, 16.42529296875, 17.37109375, 18.31689453125, 19.2626953125, 20.20849609375, 21.154296875, 22.10009765625, 23.0458984375, 23.99169921875, 24.9375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 7.0, 9.0, 19.0, 19.0, 26.0, 20.0, 32.0, 42.0, 35.0, 40.0, 52.0, 49.0, 52.0, 54.0, 74.0, 56.0, 53.0, 46.0, 50.0, 51.0, 37.0, 30.0, 22.0, 29.0, 18.0, 18.0, 16.0, 7.0, 3.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.48565673828125, -4.3072509765625, -4.12884521484375, -3.950439453125, -3.77203369140625, -3.5936279296875, -3.41522216796875, -3.23681640625, -3.05841064453125, -2.8800048828125, -2.70159912109375, -2.523193359375, -2.34478759765625, -2.1663818359375, -1.98797607421875, -1.8095703125, -1.63116455078125, -1.4527587890625, -1.27435302734375, -1.095947265625, -0.91754150390625, -0.7391357421875, -0.56072998046875, -0.38232421875, -0.20391845703125, -0.0255126953125, 0.15289306640625, 0.331298828125, 0.50970458984375, 0.6881103515625, 0.86651611328125, 1.044921875, 1.22332763671875, 1.4017333984375, 1.58013916015625, 1.758544921875, 1.93695068359375, 2.1153564453125, 2.29376220703125, 2.47216796875, 2.65057373046875, 2.8289794921875, 3.00738525390625, 3.185791015625, 3.36419677734375, 3.5426025390625, 3.72100830078125, 3.8994140625, 4.07781982421875, 4.2562255859375, 4.43463134765625, 4.613037109375, 4.79144287109375, 4.9698486328125, 5.14825439453125, 5.32666015625, 5.50506591796875, 5.6834716796875, 5.86187744140625, 6.040283203125, 6.21868896484375, 6.3970947265625, 6.57550048828125, 6.75390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 11.0, 6.0, 11.0, 17.0, 20.0, 39.0, 59.0, 169.0, 379.0, 1185.0, 12474.0, 1027937.0, 4844.0, 847.0, 279.0, 121.0, 62.0, 32.0, 19.0, 10.0, 14.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.75, -178.455078125, -172.16015625, -165.865234375, -159.5703125, -153.275390625, -146.98046875, -140.685546875, -134.390625, -128.095703125, -121.80078125, -115.505859375, -109.2109375, -102.916015625, -96.62109375, -90.326171875, -84.03125, -77.736328125, -71.44140625, -65.146484375, -58.8515625, -52.556640625, -46.26171875, -39.966796875, -33.671875, -27.376953125, -21.08203125, -14.787109375, -8.4921875, -2.197265625, 4.09765625, 10.392578125, 16.6875, 22.982421875, 29.27734375, 35.572265625, 41.8671875, 48.162109375, 54.45703125, 60.751953125, 67.046875, 73.341796875, 79.63671875, 85.931640625, 92.2265625, 98.521484375, 104.81640625, 111.111328125, 117.40625, 123.701171875, 129.99609375, 136.291015625, 142.5859375, 148.880859375, 155.17578125, 161.470703125, 167.765625, 174.060546875, 180.35546875, 186.650390625, 192.9453125, 199.240234375, 205.53515625, 211.830078125, 218.125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 7.0, 11.0, 20.0, 51.0, 134.0, 516.0, 156.0, 46.0, 21.0, 12.0, 9.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002105712890625, -0.002052396535873413, -0.001999080181121826, -0.0019457638263702393, -0.0018924474716186523, -0.0018391311168670654, -0.0017858147621154785, -0.0017324984073638916, -0.0016791820526123047, -0.0016258656978607178, -0.0015725493431091309, -0.001519232988357544, -0.001465916633605957, -0.0014126002788543701, -0.0013592839241027832, -0.0013059675693511963, -0.0012526512145996094, -0.0011993348598480225, -0.0011460185050964355, -0.0010927021503448486, -0.0010393857955932617, -0.0009860694408416748, -0.0009327530860900879, -0.000879436731338501, -0.0008261203765869141, -0.0007728040218353271, -0.0007194876670837402, -0.0006661713123321533, -0.0006128549575805664, -0.0005595386028289795, -0.0005062222480773926, -0.00045290589332580566, -0.00039958953857421875, -0.00034627318382263184, -0.0002929568290710449, -0.000239640474319458, -0.0001863241195678711, -0.00013300776481628418, -7.969141006469727e-05, -2.637505531311035e-05, 2.6941299438476562e-05, 8.025765419006348e-05, 0.0001335740089416504, 0.0001868903636932373, 0.00024020671844482422, 0.00029352307319641113, 0.00034683942794799805, 0.00040015578269958496, 0.0004534721374511719, 0.0005067884922027588, 0.0005601048469543457, 0.0006134212017059326, 0.0006667375564575195, 0.0007200539112091064, 0.0007733702659606934, 0.0008266866207122803, 0.0008800029754638672, 0.0009333193302154541, 0.000986635684967041, 0.001039952039718628, 0.0010932683944702148, 0.0011465847492218018, 0.0011999011039733887, 0.0012532174587249756, 0.0013065338134765625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 6.0, 6.0, 3.0, 13.0, 17.0, 28.0, 28.0, 43.0, 70.0, 108.0, 166.0, 278.0, 564.0, 1057.0, 2487.0, 7060.0, 36359.0, 967373.0, 23151.0, 5485.0, 2124.0, 946.0, 471.0, 273.0, 129.0, 93.0, 73.0, 41.0, 38.0, 14.0, 16.0, 12.0, 9.0, 4.0, 2.0, 9.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.15625, -46.7958984375, -45.435546875, -44.0751953125, -42.71484375, -41.3544921875, -39.994140625, -38.6337890625, -37.2734375, -35.9130859375, -34.552734375, -33.1923828125, -31.83203125, -30.4716796875, -29.111328125, -27.7509765625, -26.390625, -25.0302734375, -23.669921875, -22.3095703125, -20.94921875, -19.5888671875, -18.228515625, -16.8681640625, -15.5078125, -14.1474609375, -12.787109375, -11.4267578125, -10.06640625, -8.7060546875, -7.345703125, -5.9853515625, -4.625, -3.2646484375, -1.904296875, -0.5439453125, 0.81640625, 2.1767578125, 3.537109375, 4.8974609375, 6.2578125, 7.6181640625, 8.978515625, 10.3388671875, 11.69921875, 13.0595703125, 14.419921875, 15.7802734375, 17.140625, 18.5009765625, 19.861328125, 21.2216796875, 22.58203125, 23.9423828125, 25.302734375, 26.6630859375, 28.0234375, 29.3837890625, 30.744140625, 32.1044921875, 33.46484375, 34.8251953125, 36.185546875, 37.5458984375, 38.90625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 3.0, 2.0, 5.0, 6.0, 6.0, 11.0, 17.0, 28.0, 75.0, 426.0, 268.0, 45.0, 25.0, 18.0, 11.0, 9.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.296875, -16.676025390625, -16.05517578125, -15.434326171875, -14.8134765625, -14.192626953125, -13.57177734375, -12.950927734375, -12.330078125, -11.709228515625, -11.08837890625, -10.467529296875, -9.8466796875, -9.225830078125, -8.60498046875, -7.984130859375, -7.36328125, -6.742431640625, -6.12158203125, -5.500732421875, -4.8798828125, -4.259033203125, -3.63818359375, -3.017333984375, -2.396484375, -1.775634765625, -1.15478515625, -0.533935546875, 0.0869140625, 0.707763671875, 1.32861328125, 1.949462890625, 2.5703125, 3.191162109375, 3.81201171875, 4.432861328125, 5.0537109375, 5.674560546875, 6.29541015625, 6.916259765625, 7.537109375, 8.157958984375, 8.77880859375, 9.399658203125, 10.0205078125, 10.641357421875, 11.26220703125, 11.883056640625, 12.50390625, 13.124755859375, 13.74560546875, 14.366455078125, 14.9873046875, 15.608154296875, 16.22900390625, 16.849853515625, 17.470703125, 18.091552734375, 18.71240234375, 19.333251953125, 19.9541015625, 20.574951171875, 21.19580078125, 21.816650390625, 22.4375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 22.0, 53.0, 196.0, 511.0, 164.0, 34.0, 9.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.5936279296875, -250.91433715820312, -240.23504638671875, -229.55575561523438, -218.87646484375, -208.19717407226562, -197.51788330078125, -186.83859252929688, -176.1593017578125, -165.48001098632812, -154.80072021484375, -144.12142944335938, -133.442138671875, -122.76284790039062, -112.08356475830078, -101.4042739868164, -90.72499084472656, -80.04570007324219, -69.36640930175781, -58.6871223449707, -48.00783157348633, -37.32854080200195, -26.649253845214844, -15.969963073730469, -5.290672302246094, 5.388617515563965, 16.067907333374023, 26.747196197509766, 37.42648696899414, 48.105777740478516, 58.785064697265625, 69.46435546875, 80.14364624023438, 90.82293701171875, 101.50222778320312, 112.1815185546875, 122.86080932617188, 133.54010009765625, 144.21939086914062, 154.898681640625, 165.57797241210938, 176.25726318359375, 186.93655395507812, 197.6158447265625, 208.29513549804688, 218.97442626953125, 229.65371704101562, 240.3330078125, 251.0122833251953, 261.6915588378906, 272.370849609375, 283.0501403808594, 293.72943115234375, 304.4087219238281, 315.0880126953125, 325.7673034667969, 336.44659423828125, 347.1258850097656, 357.80517578125, 368.4844665527344, 379.16375732421875, 389.8430480957031, 400.5223388671875, 411.2016296386719, 421.88092041015625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 10.0, 10.0, 14.0, 36.0, 43.0, 70.0, 82.0, 114.0, 106.0, 100.0, 105.0, 76.0, 68.0, 53.0, 36.0, 22.0, 14.0, 11.0, 7.0, 8.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.97468566894531, -82.91608428955078, -79.85747528076172, -76.79887390136719, -73.74026489257812, -70.6816635131836, -67.62306213378906, -64.564453125, -61.5058479309082, -58.447242736816406, -55.38863754272461, -52.33003234863281, -49.27143096923828, -46.21282196044922, -43.15422058105469, -40.09561538696289, -37.037010192871094, -33.9784049987793, -30.9197998046875, -27.861196517944336, -24.80259132385254, -21.743986129760742, -18.685382843017578, -15.626777648925781, -12.568172454833984, -9.509567260742188, -6.450963020324707, -3.3923587799072266, -0.3337535858154297, 2.724851608276367, 5.783454895019531, 8.842060089111328, 11.900657653808594, 14.95926284790039, 18.017868041992188, 21.07647132873535, 24.13507652282715, 27.193681716918945, 30.25228500366211, 33.310890197753906, 36.3694953918457, 39.4281005859375, 42.4867057800293, 45.545310974121094, 48.603912353515625, 51.66252136230469, 54.72112274169922, 57.779727935791016, 60.83833312988281, 63.89693832397461, 66.9555435180664, 70.01414489746094, 73.07275390625, 76.13135528564453, 79.18995666503906, 82.24856567382812, 85.30717468261719, 88.36577606201172, 91.42438507080078, 94.48298645019531, 97.54159545898438, 100.6001968383789, 103.65879821777344, 106.7174072265625, 109.77600860595703]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 10.0, 14.0, 26.0, 57.0, 240.0, 4182.0, 4188591.0, 1018.0, 71.0, 31.0, 19.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-508.5, -496.2109375, -483.921875, -471.6328125, -459.34375, -447.0546875, -434.765625, -422.4765625, -410.1875, -397.8984375, -385.609375, -373.3203125, -361.03125, -348.7421875, -336.453125, -324.1640625, -311.875, -299.5859375, -287.296875, -275.0078125, -262.71875, -250.4296875, -238.140625, -225.8515625, -213.5625, -201.2734375, -188.984375, -176.6953125, -164.40625, -152.1171875, -139.828125, -127.5390625, -115.25, -102.9609375, -90.671875, -78.3828125, -66.09375, -53.8046875, -41.515625, -29.2265625, -16.9375, -4.6484375, 7.640625, 19.9296875, 32.21875, 44.5078125, 56.796875, 69.0859375, 81.375, 93.6640625, 105.953125, 118.2421875, 130.53125, 142.8203125, 155.109375, 167.3984375, 179.6875, 191.9765625, 204.265625, 216.5546875, 228.84375, 241.1328125, 253.421875, 265.7109375, 278.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 5.0, 11.0, 8.0, 21.0, 27.0, 34.0, 35.0, 91.0, 74.0, 92.0, 120.0, 99.0, 91.0, 75.0, 59.0, 51.0, 36.0, 23.0, 17.0, 6.0, 5.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0452728271484375, -1.013397216796875, -0.9815216064453125, -0.94964599609375, -0.9177703857421875, -0.885894775390625, -0.8540191650390625, -0.8221435546875, -0.7902679443359375, -0.758392333984375, -0.7265167236328125, -0.69464111328125, -0.6627655029296875, -0.630889892578125, -0.5990142822265625, -0.567138671875, -0.5352630615234375, -0.503387451171875, -0.4715118408203125, -0.43963623046875, -0.4077606201171875, -0.375885009765625, -0.3440093994140625, -0.3121337890625, -0.2802581787109375, -0.248382568359375, -0.2165069580078125, -0.18463134765625, -0.1527557373046875, -0.120880126953125, -0.0890045166015625, -0.05712890625, -0.0252532958984375, 0.006622314453125, 0.0384979248046875, 0.07037353515625, 0.1022491455078125, 0.134124755859375, 0.1660003662109375, 0.1978759765625, 0.2297515869140625, 0.261627197265625, 0.2935028076171875, 0.32537841796875, 0.3572540283203125, 0.389129638671875, 0.4210052490234375, 0.452880859375, 0.4847564697265625, 0.516632080078125, 0.5485076904296875, 0.58038330078125, 0.6122589111328125, 0.644134521484375, 0.6760101318359375, 0.7078857421875, 0.7397613525390625, 0.771636962890625, 0.8035125732421875, 0.83538818359375, 0.8672637939453125, 0.899139404296875, 0.9310150146484375, 0.962890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 11.0, 45.0, 90.0, 194.0, 656.0, 4254.0, 182927.0, 3992377.0, 11389.0, 1234.0, 379.0, 205.0, 142.0, 131.0, 76.0, 51.0, 34.0, 25.0, 16.0, 10.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.125, -23.3515625, -21.578125, -19.8046875, -18.03125, -16.2578125, -14.484375, -12.7109375, -10.9375, -9.1640625, -7.390625, -5.6171875, -3.84375, -2.0703125, -0.296875, 1.4765625, 3.25, 5.0234375, 6.796875, 8.5703125, 10.34375, 12.1171875, 13.890625, 15.6640625, 17.4375, 19.2109375, 20.984375, 22.7578125, 24.53125, 26.3046875, 28.078125, 29.8515625, 31.625, 33.3984375, 35.171875, 36.9453125, 38.71875, 40.4921875, 42.265625, 44.0390625, 45.8125, 47.5859375, 49.359375, 51.1328125, 52.90625, 54.6796875, 56.453125, 58.2265625, 60.0, 61.7734375, 63.546875, 65.3203125, 67.09375, 68.8671875, 70.640625, 72.4140625, 74.1875, 75.9609375, 77.734375, 79.5078125, 81.28125, 83.0546875, 84.828125, 86.6015625, 88.375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 17.0, 8.0, 15.0, 28.0, 40.0, 47.0, 78.0, 125.0, 298.0, 2054.0, 810.0, 256.0, 114.0, 52.0, 28.0, 26.0, 17.0, 11.0, 18.0, 8.0, 5.0, 2.0, 5.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.826171875, -2.7510986328125, -2.676025390625, -2.6009521484375, -2.52587890625, -2.4508056640625, -2.375732421875, -2.3006591796875, -2.2255859375, -2.1505126953125, -2.075439453125, -2.0003662109375, -1.92529296875, -1.8502197265625, -1.775146484375, -1.7000732421875, -1.625, -1.5499267578125, -1.474853515625, -1.3997802734375, -1.32470703125, -1.2496337890625, -1.174560546875, -1.0994873046875, -1.0244140625, -0.9493408203125, -0.874267578125, -0.7991943359375, -0.72412109375, -0.6490478515625, -0.573974609375, -0.4989013671875, -0.423828125, -0.3487548828125, -0.273681640625, -0.1986083984375, -0.12353515625, -0.0484619140625, 0.026611328125, 0.1016845703125, 0.1767578125, 0.2518310546875, 0.326904296875, 0.4019775390625, 0.47705078125, 0.5521240234375, 0.627197265625, 0.7022705078125, 0.77734375, 0.8524169921875, 0.927490234375, 1.0025634765625, 1.07763671875, 1.1527099609375, 1.227783203125, 1.3028564453125, 1.3779296875, 1.4530029296875, 1.528076171875, 1.6031494140625, 1.67822265625, 1.7532958984375, 1.828369140625, 1.9034423828125, 1.978515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 16.0, 893.0, 92.0, 17.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.146678924560547, -12.90083122253418, -4.6549835205078125, 3.5908641815185547, 11.836711883544922, 20.082561492919922, 28.328407287597656, 36.57425308227539, 44.82010269165039, 53.065948486328125, 61.311798095703125, 69.55764770507812, 77.80349731445312, 86.04934692382812, 94.2951889038086, 102.54103088378906, 110.78688049316406, 119.03273010253906, 127.27857971191406, 135.52442932128906, 143.770263671875, 152.01611328125, 160.261962890625, 168.5078125, 176.753662109375, 184.99951171875, 193.245361328125, 201.4912109375, 209.737060546875, 217.98291015625, 226.22874450683594, 234.47459411621094, 242.720458984375, 250.96630859375, 259.212158203125, 267.4580078125, 275.703857421875, 283.94970703125, 292.195556640625, 300.44140625, 308.687255859375, 316.93310546875, 325.178955078125, 333.4248046875, 341.670654296875, 349.91650390625, 358.162353515625, 366.408203125, 374.6540222167969, 382.8998718261719, 391.1457214355469, 399.3915710449219, 407.6374206542969, 415.8832702636719, 424.1291198730469, 432.37493896484375, 440.62078857421875, 448.86663818359375, 457.11248779296875, 465.35833740234375, 473.60418701171875, 481.85003662109375, 490.09588623046875, 498.34173583984375, 506.58758544921875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 18.0, 32.0, 48.0, 60.0, 71.0, 96.0, 107.0, 119.0, 109.0, 100.0, 78.0, 59.0, 34.0, 30.0, 15.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.513940811157227, -8.975436210632324, -8.436930656433105, -7.898426055908203, -7.359920978546143, -6.821415901184082, -6.28291130065918, -5.744406223297119, -5.205901145935059, -4.667396068572998, -4.1288909912109375, -3.590386390686035, -3.0518813133239746, -2.513376235961914, -1.9748713970184326, -1.4363665580749512, -0.8978614807128906, -0.35935652256011963, 0.17914843559265137, 0.7176533937454224, 1.2561583518981934, 1.794663429260254, 2.3331682682037354, 2.871673107147217, 3.4101781845092773, 3.948683261871338, 4.487188339233398, 5.025692939758301, 5.564198017120361, 6.102703094482422, 6.641207695007324, 7.179712772369385, 7.7182159423828125, 8.256720542907715, 8.795226097106934, 9.333730697631836, 9.872236251831055, 10.410740852355957, 10.94924545288086, 11.487751007080078, 12.02625560760498, 12.564760208129883, 13.103265762329102, 13.641770362854004, 14.180274963378906, 14.718780517578125, 15.257285118103027, 15.79578971862793, 16.33429527282715, 16.872800827026367, 17.411304473876953, 17.949810028076172, 18.48831558227539, 19.02682113647461, 19.565324783325195, 20.103830337524414, 20.642333984375, 21.18083953857422, 21.719343185424805, 22.257848739624023, 22.796354293823242, 23.334857940673828, 23.873363494873047, 24.411869049072266, 24.950374603271484]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 13.0, 19.0, 20.0, 28.0, 45.0, 58.0, 109.0, 137.0, 219.0, 397.0, 629.0, 1231.0, 2198.0, 4183.0, 8581.0, 18935.0, 46311.0, 143126.0, 542040.0, 183290.0, 55138.0, 21688.0, 9724.0, 4699.0, 2418.0, 1313.0, 766.0, 427.0, 254.0, 169.0, 95.0, 75.0, 49.0, 38.0, 21.0, 19.0, 20.0, 17.0, 7.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-9.0859375, -8.83062744140625, -8.5753173828125, -8.32000732421875, -8.064697265625, -7.80938720703125, -7.5540771484375, -7.29876708984375, -7.04345703125, -6.78814697265625, -6.5328369140625, -6.27752685546875, -6.022216796875, -5.76690673828125, -5.5115966796875, -5.25628662109375, -5.0009765625, -4.74566650390625, -4.4903564453125, -4.23504638671875, -3.979736328125, -3.72442626953125, -3.4691162109375, -3.21380615234375, -2.95849609375, -2.70318603515625, -2.4478759765625, -2.19256591796875, -1.937255859375, -1.68194580078125, -1.4266357421875, -1.17132568359375, -0.916015625, -0.66070556640625, -0.4053955078125, -0.15008544921875, 0.105224609375, 0.36053466796875, 0.6158447265625, 0.87115478515625, 1.12646484375, 1.38177490234375, 1.6370849609375, 1.89239501953125, 2.147705078125, 2.40301513671875, 2.6583251953125, 2.91363525390625, 3.1689453125, 3.42425537109375, 3.6795654296875, 3.93487548828125, 4.190185546875, 4.44549560546875, 4.7008056640625, 4.95611572265625, 5.21142578125, 5.46673583984375, 5.7220458984375, 5.97735595703125, 6.232666015625, 6.48797607421875, 6.7432861328125, 6.99859619140625, 7.25390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 12.0, 9.0, 12.0, 17.0, 23.0, 31.0, 35.0, 51.0, 69.0, 57.0, 78.0, 67.0, 80.0, 73.0, 78.0, 58.0, 58.0, 43.0, 43.0, 27.0, 21.0, 14.0, 14.0, 11.0, 9.0, 2.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0068359375, -0.9805755615234375, -0.954315185546875, -0.9280548095703125, -0.90179443359375, -0.8755340576171875, -0.849273681640625, -0.8230133056640625, -0.7967529296875, -0.7704925537109375, -0.744232177734375, -0.7179718017578125, -0.69171142578125, -0.6654510498046875, -0.639190673828125, -0.6129302978515625, -0.586669921875, -0.5604095458984375, -0.534149169921875, -0.5078887939453125, -0.48162841796875, -0.4553680419921875, -0.429107666015625, -0.4028472900390625, -0.3765869140625, -0.3503265380859375, -0.324066162109375, -0.2978057861328125, -0.27154541015625, -0.2452850341796875, -0.219024658203125, -0.1927642822265625, -0.16650390625, -0.1402435302734375, -0.113983154296875, -0.0877227783203125, -0.06146240234375, -0.0352020263671875, -0.008941650390625, 0.0173187255859375, 0.0435791015625, 0.0698394775390625, 0.096099853515625, 0.1223602294921875, 0.14862060546875, 0.1748809814453125, 0.201141357421875, 0.2274017333984375, 0.253662109375, 0.2799224853515625, 0.306182861328125, 0.3324432373046875, 0.35870361328125, 0.3849639892578125, 0.411224365234375, 0.4374847412109375, 0.4637451171875, 0.4900054931640625, 0.516265869140625, 0.5425262451171875, 0.56878662109375, 0.5950469970703125, 0.621307373046875, 0.6475677490234375, 0.673828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 14.0, 10.0, 18.0, 17.0, 24.0, 48.0, 165.0, 2005.0, 365091.0, 678146.0, 2596.0, 217.0, 58.0, 27.0, 16.0, 18.0, 15.0, 10.0, 9.0, 11.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.41162109375, -30.1044921875, -28.79736328125, -27.490234375, -26.18310546875, -24.8759765625, -23.56884765625, -22.26171875, -20.95458984375, -19.6474609375, -18.34033203125, -17.033203125, -15.72607421875, -14.4189453125, -13.11181640625, -11.8046875, -10.49755859375, -9.1904296875, -7.88330078125, -6.576171875, -5.26904296875, -3.9619140625, -2.65478515625, -1.34765625, -0.04052734375, 1.2666015625, 2.57373046875, 3.880859375, 5.18798828125, 6.4951171875, 7.80224609375, 9.109375, 10.41650390625, 11.7236328125, 13.03076171875, 14.337890625, 15.64501953125, 16.9521484375, 18.25927734375, 19.56640625, 20.87353515625, 22.1806640625, 23.48779296875, 24.794921875, 26.10205078125, 27.4091796875, 28.71630859375, 30.0234375, 31.33056640625, 32.6376953125, 33.94482421875, 35.251953125, 36.55908203125, 37.8662109375, 39.17333984375, 40.48046875, 41.78759765625, 43.0947265625, 44.40185546875, 45.708984375, 47.01611328125, 48.3232421875, 49.63037109375, 50.9375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 11.0, 10.0, 14.0, 17.0, 22.0, 27.0, 18.0, 33.0, 29.0, 33.0, 58.0, 35.0, 44.0, 38.0, 44.0, 50.0, 49.0, 54.0, 43.0, 44.0, 31.0, 33.0, 29.0, 24.0, 27.0, 32.0, 18.0, 23.0, 12.0, 15.0, 8.0, 17.0, 11.0, 7.0, 8.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.659942626953125, -2.56402587890625, -2.468109130859375, -2.3721923828125, -2.276275634765625, -2.18035888671875, -2.084442138671875, -1.988525390625, -1.892608642578125, -1.79669189453125, -1.700775146484375, -1.6048583984375, -1.508941650390625, -1.41302490234375, -1.317108154296875, -1.22119140625, -1.125274658203125, -1.02935791015625, -0.933441162109375, -0.8375244140625, -0.741607666015625, -0.64569091796875, -0.549774169921875, -0.453857421875, -0.357940673828125, -0.26202392578125, -0.166107177734375, -0.0701904296875, 0.025726318359375, 0.12164306640625, 0.217559814453125, 0.3134765625, 0.409393310546875, 0.50531005859375, 0.601226806640625, 0.6971435546875, 0.793060302734375, 0.88897705078125, 0.984893798828125, 1.080810546875, 1.176727294921875, 1.27264404296875, 1.368560791015625, 1.4644775390625, 1.560394287109375, 1.65631103515625, 1.752227783203125, 1.84814453125, 1.944061279296875, 2.03997802734375, 2.135894775390625, 2.2318115234375, 2.327728271484375, 2.42364501953125, 2.519561767578125, 2.615478515625, 2.711395263671875, 2.80731201171875, 2.903228759765625, 2.9991455078125, 3.095062255859375, 3.19097900390625, 3.286895751953125, 3.3828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 11.0, 6.0, 11.0, 29.0, 74.0, 342.0, 8544.0, 1037641.0, 1627.0, 156.0, 46.0, 20.0, 8.0, 6.0, 5.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.625, -198.2890625, -191.953125, -185.6171875, -179.28125, -172.9453125, -166.609375, -160.2734375, -153.9375, -147.6015625, -141.265625, -134.9296875, -128.59375, -122.2578125, -115.921875, -109.5859375, -103.25, -96.9140625, -90.578125, -84.2421875, -77.90625, -71.5703125, -65.234375, -58.8984375, -52.5625, -46.2265625, -39.890625, -33.5546875, -27.21875, -20.8828125, -14.546875, -8.2109375, -1.875, 4.4609375, 10.796875, 17.1328125, 23.46875, 29.8046875, 36.140625, 42.4765625, 48.8125, 55.1484375, 61.484375, 67.8203125, 74.15625, 80.4921875, 86.828125, 93.1640625, 99.5, 105.8359375, 112.171875, 118.5078125, 124.84375, 131.1796875, 137.515625, 143.8515625, 150.1875, 156.5234375, 162.859375, 169.1953125, 175.53125, 181.8671875, 188.203125, 194.5390625, 200.875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 9.0, 20.0, 33.0, 53.0, 92.0, 164.0, 233.0, 170.0, 98.0, 42.0, 25.0, 14.0, 15.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005803108215332031, -0.0005605444312095642, -0.0005407780408859253, -0.0005210116505622864, -0.0005012452602386475, -0.00048147886991500854, -0.00046171247959136963, -0.0004419460892677307, -0.0004221796989440918, -0.0004024133086204529, -0.00038264691829681396, -0.00036288052797317505, -0.00034311413764953613, -0.0003233477473258972, -0.0003035813570022583, -0.0002838149666786194, -0.00026404857635498047, -0.00024428218603134155, -0.00022451579570770264, -0.00020474940538406372, -0.0001849830150604248, -0.0001652166247367859, -0.00014545023441314697, -0.00012568384408950806, -0.00010591745376586914, -8.615106344223022e-05, -6.638467311859131e-05, -4.661828279495239e-05, -2.6851892471313477e-05, -7.0855021476745605e-06, 1.2680888175964355e-05, 3.244727849960327e-05, 5.221366882324219e-05, 7.19800591468811e-05, 9.174644947052002e-05, 0.00011151283979415894, 0.00013127923011779785, 0.00015104562044143677, 0.00017081201076507568, 0.0001905784010887146, 0.00021034479141235352, 0.00023011118173599243, 0.00024987757205963135, 0.00026964396238327026, 0.0002894103527069092, 0.0003091767430305481, 0.000328943133354187, 0.00034870952367782593, 0.00036847591400146484, 0.00038824230432510376, 0.0004080086946487427, 0.0004277750849723816, 0.0004475414752960205, 0.0004673078656196594, 0.00048707425594329834, 0.0005068406462669373, 0.0005266070365905762, 0.0005463734269142151, 0.000566139817237854, 0.0005859062075614929, 0.0006056725978851318, 0.0006254389882087708, 0.0006452053785324097, 0.0006649717688560486, 0.0006847381591796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 14.0, 7.0, 6.0, 8.0, 24.0, 44.0, 61.0, 107.0, 136.0, 284.0, 434.0, 787.0, 1507.0, 3276.0, 8756.0, 55648.0, 940128.0, 26440.0, 5978.0, 2298.0, 1108.0, 633.0, 349.0, 194.0, 112.0, 75.0, 57.0, 33.0, 13.0, 14.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -38.92919921875, -37.4521484375, -35.97509765625, -34.498046875, -33.02099609375, -31.5439453125, -30.06689453125, -28.58984375, -27.11279296875, -25.6357421875, -24.15869140625, -22.681640625, -21.20458984375, -19.7275390625, -18.25048828125, -16.7734375, -15.29638671875, -13.8193359375, -12.34228515625, -10.865234375, -9.38818359375, -7.9111328125, -6.43408203125, -4.95703125, -3.47998046875, -2.0029296875, -0.52587890625, 0.951171875, 2.42822265625, 3.9052734375, 5.38232421875, 6.859375, 8.33642578125, 9.8134765625, 11.29052734375, 12.767578125, 14.24462890625, 15.7216796875, 17.19873046875, 18.67578125, 20.15283203125, 21.6298828125, 23.10693359375, 24.583984375, 26.06103515625, 27.5380859375, 29.01513671875, 30.4921875, 31.96923828125, 33.4462890625, 34.92333984375, 36.400390625, 37.87744140625, 39.3544921875, 40.83154296875, 42.30859375, 43.78564453125, 45.2626953125, 46.73974609375, 48.216796875, 49.69384765625, 51.1708984375, 52.64794921875, 54.125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 11.0, 7.0, 7.0, 15.0, 39.0, 114.0, 477.0, 211.0, 50.0, 19.0, 12.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.3125, -30.457763671875, -29.60302734375, -28.748291015625, -27.8935546875, -27.038818359375, -26.18408203125, -25.329345703125, -24.474609375, -23.619873046875, -22.76513671875, -21.910400390625, -21.0556640625, -20.200927734375, -19.34619140625, -18.491455078125, -17.63671875, -16.781982421875, -15.92724609375, -15.072509765625, -14.2177734375, -13.363037109375, -12.50830078125, -11.653564453125, -10.798828125, -9.944091796875, -9.08935546875, -8.234619140625, -7.3798828125, -6.525146484375, -5.67041015625, -4.815673828125, -3.9609375, -3.106201171875, -2.25146484375, -1.396728515625, -0.5419921875, 0.312744140625, 1.16748046875, 2.022216796875, 2.876953125, 3.731689453125, 4.58642578125, 5.441162109375, 6.2958984375, 7.150634765625, 8.00537109375, 8.860107421875, 9.71484375, 10.569580078125, 11.42431640625, 12.279052734375, 13.1337890625, 13.988525390625, 14.84326171875, 15.697998046875, 16.552734375, 17.407470703125, 18.26220703125, 19.116943359375, 19.9716796875, 20.826416015625, 21.68115234375, 22.535888671875, 23.390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 13.0, 100.0, 651.0, 212.0, 31.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.75907135009766, -64.02366638183594, -54.28826904296875, -44.55286407470703, -34.81746292114258, -25.082061767578125, -15.346656799316406, -5.611259460449219, 4.1241455078125, 13.85954761505127, 23.59494972229004, 33.330352783203125, 43.06575393676758, 52.80115509033203, 62.53656005859375, 72.27195739746094, 82.00736236572266, 91.74276733398438, 101.47816467285156, 111.21356964111328, 120.948974609375, 130.6843719482422, 140.41976928710938, 150.15518188476562, 159.8905792236328, 169.6259765625, 179.36138916015625, 189.09678649902344, 198.83218383789062, 208.56759643554688, 218.30299377441406, 228.03839111328125, 237.77377319335938, 247.50917053222656, 257.24456787109375, 266.97998046875, 276.71539306640625, 286.4507751464844, 296.1861877441406, 305.92156982421875, 315.656982421875, 325.39239501953125, 335.1277770996094, 344.8631896972656, 354.5986022949219, 364.333984375, 374.06939697265625, 383.8048095703125, 393.54022216796875, 403.275634765625, 413.0110168457031, 422.7464294433594, 432.4818420410156, 442.21722412109375, 451.95263671875, 461.68804931640625, 471.4234313964844, 481.1588439941406, 490.89422607421875, 500.629638671875, 510.36505126953125, 520.1004638671875, 529.8358154296875, 539.5712280273438, 549.306640625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 13.0, 13.0, 19.0, 28.0, 40.0, 35.0, 49.0, 63.0, 67.0, 72.0, 81.0, 75.0, 78.0, 61.0, 61.0, 49.0, 47.0, 40.0, 27.0, 19.0, 16.0, 5.0, 9.0, 9.0, 8.0, 6.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.36708068847656, -42.0186882019043, -40.6702995300293, -39.32190704345703, -37.973514556884766, -36.6251220703125, -35.2767333984375, -33.928340911865234, -32.57994842529297, -31.231557846069336, -29.88316535949707, -28.534774780273438, -27.186382293701172, -25.83799171447754, -24.489601135253906, -23.14120864868164, -21.792818069458008, -20.444427490234375, -19.09603500366211, -17.747644424438477, -16.39925193786621, -15.050861358642578, -13.702469825744629, -12.35407829284668, -11.00568675994873, -9.657295227050781, -8.308903694152832, -6.960512638092041, -5.612121105194092, -4.263729572296143, -2.9153385162353516, -1.5669469833374023, -0.21855545043945312, 1.1298359632492065, 2.478227376937866, 3.8266186714172363, 5.1750102043151855, 6.523401737213135, 7.871792793273926, 9.220184326171875, 10.568575859069824, 11.916967391967773, 13.265358924865723, 14.613750457763672, 15.962141036987305, 17.31053352355957, 18.658924102783203, 20.00731658935547, 21.3557071685791, 22.704097747802734, 24.052490234375, 25.400880813598633, 26.7492733001709, 28.09766387939453, 29.446056365966797, 30.79444694519043, 32.14283752441406, 33.49123001098633, 34.83961868286133, 36.188011169433594, 37.53640365600586, 38.884796142578125, 40.233184814453125, 41.58157730102539, 42.929969787597656]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 4.0, 8.0, 6.0, 6.0, 6.0, 12.0, 8.0, 6.0, 13.0, 16.0, 32.0, 62.0, 126.0, 296.0, 1242.0, 11860.0, 4075714.0, 98870.0, 4697.0, 783.0, 209.0, 88.0, 68.0, 35.0, 18.0, 24.0, 22.0, 15.0, 5.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-67.6875, -65.337890625, -62.98828125, -60.638671875, -58.2890625, -55.939453125, -53.58984375, -51.240234375, -48.890625, -46.541015625, -44.19140625, -41.841796875, -39.4921875, -37.142578125, -34.79296875, -32.443359375, -30.09375, -27.744140625, -25.39453125, -23.044921875, -20.6953125, -18.345703125, -15.99609375, -13.646484375, -11.296875, -8.947265625, -6.59765625, -4.248046875, -1.8984375, 0.451171875, 2.80078125, 5.150390625, 7.5, 9.849609375, 12.19921875, 14.548828125, 16.8984375, 19.248046875, 21.59765625, 23.947265625, 26.296875, 28.646484375, 30.99609375, 33.345703125, 35.6953125, 38.044921875, 40.39453125, 42.744140625, 45.09375, 47.443359375, 49.79296875, 52.142578125, 54.4921875, 56.841796875, 59.19140625, 61.541015625, 63.890625, 66.240234375, 68.58984375, 70.939453125, 73.2890625, 75.638671875, 77.98828125, 80.337890625, 82.6875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 8.0, 16.0, 33.0, 48.0, 56.0, 65.0, 76.0, 98.0, 101.0, 115.0, 91.0, 85.0, 74.0, 41.0, 27.0, 26.0, 11.0, 13.0, 10.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0270843505859375, -0.985809326171875, -0.9445343017578125, -0.90325927734375, -0.8619842529296875, -0.820709228515625, -0.7794342041015625, -0.7381591796875, -0.6968841552734375, -0.655609130859375, -0.6143341064453125, -0.57305908203125, -0.5317840576171875, -0.490509033203125, -0.4492340087890625, -0.407958984375, -0.3666839599609375, -0.325408935546875, -0.2841339111328125, -0.24285888671875, -0.2015838623046875, -0.160308837890625, -0.1190338134765625, -0.0777587890625, -0.0364837646484375, 0.004791259765625, 0.0460662841796875, 0.08734130859375, 0.1286163330078125, 0.169891357421875, 0.2111663818359375, 0.25244140625, 0.2937164306640625, 0.334991455078125, 0.3762664794921875, 0.41754150390625, 0.4588165283203125, 0.500091552734375, 0.5413665771484375, 0.5826416015625, 0.6239166259765625, 0.665191650390625, 0.7064666748046875, 0.74774169921875, 0.7890167236328125, 0.830291748046875, 0.8715667724609375, 0.912841796875, 0.9541168212890625, 0.995391845703125, 1.0366668701171875, 1.07794189453125, 1.1192169189453125, 1.160491943359375, 1.2017669677734375, 1.2430419921875, 1.2843170166015625, 1.325592041015625, 1.3668670654296875, 1.40814208984375, 1.4494171142578125, 1.490692138671875, 1.5319671630859375, 1.5732421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 8.0, 75.0, 2935.0, 4187101.0, 4053.0, 106.0, 13.0, 5.0], "bins": [-315.5, -310.2001953125, -304.900390625, -299.6005859375, -294.30078125, -289.0009765625, -283.701171875, -278.4013671875, -273.1015625, -267.8017578125, -262.501953125, -257.2021484375, -251.90234375, -246.6025390625, -241.302734375, -236.0029296875, -230.703125, -225.4033203125, -220.103515625, -214.8037109375, -209.50390625, -204.2041015625, -198.904296875, -193.6044921875, -188.3046875, -183.0048828125, -177.705078125, -172.4052734375, -167.10546875, -161.8056640625, -156.505859375, -151.2060546875, -145.90625, -140.6064453125, -135.306640625, -130.0068359375, -124.70703125, -119.4072265625, -114.107421875, -108.8076171875, -103.5078125, -98.2080078125, -92.908203125, -87.6083984375, -82.30859375, -77.0087890625, -71.708984375, -66.4091796875, -61.109375, -55.8095703125, -50.509765625, -45.2099609375, -39.91015625, -34.6103515625, -29.310546875, -24.0107421875, -18.7109375, -13.4111328125, -8.111328125, -2.8115234375, 2.48828125, 7.7880859375, 13.087890625, 18.3876953125, 23.6875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 10.0, 10.0, 7.0, 13.0, 23.0, 32.0, 45.0, 63.0, 102.0, 261.0, 2634.0, 495.0, 165.0, 62.0, 40.0, 27.0, 16.0, 10.0, 11.0, 10.0, 14.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.001953125, -2.90692138671875, -2.8118896484375, -2.71685791015625, -2.621826171875, -2.52679443359375, -2.4317626953125, -2.33673095703125, -2.24169921875, -2.14666748046875, -2.0516357421875, -1.95660400390625, -1.861572265625, -1.76654052734375, -1.6715087890625, -1.57647705078125, -1.4814453125, -1.38641357421875, -1.2913818359375, -1.19635009765625, -1.101318359375, -1.00628662109375, -0.9112548828125, -0.81622314453125, -0.72119140625, -0.62615966796875, -0.5311279296875, -0.43609619140625, -0.341064453125, -0.24603271484375, -0.1510009765625, -0.05596923828125, 0.0390625, 0.13409423828125, 0.2291259765625, 0.32415771484375, 0.419189453125, 0.51422119140625, 0.6092529296875, 0.70428466796875, 0.79931640625, 0.89434814453125, 0.9893798828125, 1.08441162109375, 1.179443359375, 1.27447509765625, 1.3695068359375, 1.46453857421875, 1.5595703125, 1.65460205078125, 1.7496337890625, 1.84466552734375, 1.939697265625, 2.03472900390625, 2.1297607421875, 2.22479248046875, 2.31982421875, 2.41485595703125, 2.5098876953125, 2.60491943359375, 2.699951171875, 2.79498291015625, 2.8900146484375, 2.98504638671875, 3.080078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 855.0, 157.0, 5.0], "bins": [-755.0245361328125, -742.81396484375, -730.6033935546875, -718.3927612304688, -706.1821899414062, -693.9716186523438, -681.760986328125, -669.5504150390625, -657.33984375, -645.1292724609375, -632.918701171875, -620.7080688476562, -608.4974975585938, -596.2869262695312, -584.0762939453125, -571.86572265625, -559.6551513671875, -547.444580078125, -535.2340087890625, -523.0233764648438, -510.81280517578125, -498.60223388671875, -486.3916320800781, -474.1810302734375, -461.970458984375, -449.7598876953125, -437.5492858886719, -425.33868408203125, -413.12811279296875, -400.91754150390625, -388.7069396972656, -376.496337890625, -364.2857360839844, -352.07513427734375, -339.86456298828125, -327.65399169921875, -315.4433898925781, -303.2327880859375, -291.022216796875, -278.8116455078125, -266.6010437011719, -254.3904571533203, -242.17987060546875, -229.9692840576172, -217.75869750976562, -205.54811096191406, -193.3375244140625, -181.12693786621094, -168.91635131835938, -156.7057647705078, -144.49517822265625, -132.2845916748047, -120.07400512695312, -107.86341857910156, -95.65283203125, -83.44224548339844, -71.2316665649414, -59.021080017089844, -46.81049346923828, -34.59990692138672, -22.389320373535156, -10.178733825683594, 2.0318527221679688, 14.242439270019531, 26.453025817871094]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 19.0, 34.0, 50.0, 72.0, 120.0, 137.0, 145.0, 109.0, 116.0, 85.0, 69.0, 23.0, 16.0, 11.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-47.301273345947266, -46.367698669433594, -45.43412399291992, -44.50054931640625, -43.56697463989258, -42.633399963378906, -41.699825286865234, -40.76625061035156, -39.83267593383789, -38.89910125732422, -37.96552658081055, -37.031951904296875, -36.0983772277832, -35.16480255126953, -34.23122787475586, -33.29765319824219, -32.36407470703125, -31.430500030517578, -30.496925354003906, -29.563350677490234, -28.629776000976562, -27.69620132446289, -26.76262664794922, -25.829050064086914, -24.895477294921875, -23.961902618408203, -23.02832794189453, -22.09475326538086, -21.161178588867188, -20.227603912353516, -19.294029235839844, -18.36045265197754, -17.426877975463867, -16.493303298950195, -15.559728622436523, -14.626153945922852, -13.692578315734863, -12.759003639221191, -11.82542896270752, -10.891853332519531, -9.95827865600586, -9.024703979492188, -8.091129302978516, -7.1575541496276855, -6.2239789962768555, -5.290404319763184, -4.356829643249512, -3.4232544898986816, -2.489680290222168, -1.556105375289917, -0.6225305795669556, 0.31104421615600586, 1.2446191310882568, 2.178194046020508, 3.1117687225341797, 4.04534387588501, 4.978918552398682, 5.9124932289123535, 6.846068382263184, 7.7796430587768555, 8.713217735290527, 9.646793365478516, 10.580368041992188, 11.51394271850586, 12.447517395019531]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 7.0, 14.0, 15.0, 20.0, 21.0, 21.0, 27.0, 39.0, 40.0, 32.0, 44.0, 72.0, 106.0, 769.0, 998326.0, 48319.0, 258.0, 84.0, 55.0, 41.0, 32.0, 44.0, 31.0, 24.0, 13.0, 24.0, 20.0, 11.0, 4.0, 6.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-123.875, -120.5078125, -117.140625, -113.7734375, -110.40625, -107.0390625, -103.671875, -100.3046875, -96.9375, -93.5703125, -90.203125, -86.8359375, -83.46875, -80.1015625, -76.734375, -73.3671875, -70.0, -66.6328125, -63.265625, -59.8984375, -56.53125, -53.1640625, -49.796875, -46.4296875, -43.0625, -39.6953125, -36.328125, -32.9609375, -29.59375, -26.2265625, -22.859375, -19.4921875, -16.125, -12.7578125, -9.390625, -6.0234375, -2.65625, 0.7109375, 4.078125, 7.4453125, 10.8125, 14.1796875, 17.546875, 20.9140625, 24.28125, 27.6484375, 31.015625, 34.3828125, 37.75, 41.1171875, 44.484375, 47.8515625, 51.21875, 54.5859375, 57.953125, 61.3203125, 64.6875, 68.0546875, 71.421875, 74.7890625, 78.15625, 81.5234375, 84.890625, 88.2578125, 91.625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 46.0, 136.0, 274.0, 288.0, 185.0, 64.0, 15.0, 0.0, 2.0, 1.0], "bins": [-10.28125, -10.101104736328125, -9.92095947265625, -9.740814208984375, -9.5606689453125, -9.380523681640625, -9.20037841796875, -9.020233154296875, -8.840087890625, -8.659942626953125, -8.47979736328125, -8.299652099609375, -8.1195068359375, -7.939361572265625, -7.75921630859375, -7.579071044921875, -7.39892578125, -7.218780517578125, -7.03863525390625, -6.858489990234375, -6.6783447265625, -6.498199462890625, -6.31805419921875, -6.137908935546875, -5.957763671875, -5.777618408203125, -5.59747314453125, -5.417327880859375, -5.2371826171875, -5.057037353515625, -4.87689208984375, -4.696746826171875, -4.5166015625, -4.336456298828125, -4.15631103515625, -3.976165771484375, -3.7960205078125, -3.615875244140625, -3.43572998046875, -3.255584716796875, -3.075439453125, -2.895294189453125, -2.71514892578125, -2.535003662109375, -2.3548583984375, -2.174713134765625, -1.99456787109375, -1.814422607421875, -1.63427734375, -1.454132080078125, -1.27398681640625, -1.093841552734375, -0.9136962890625, -0.733551025390625, -0.55340576171875, -0.373260498046875, -0.193115234375, -0.012969970703125, 0.16717529296875, 0.347320556640625, 0.5274658203125, 0.707611083984375, 0.88775634765625, 1.067901611328125, 1.248046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 11.0, 6.0, 10.0, 25.0, 20.0, 42.0, 49.0, 86.0, 158.0, 390.0, 1297.0, 6399.0, 67472.0, 806504.0, 152421.0, 10785.0, 1799.0, 518.0, 239.0, 103.0, 56.0, 38.0, 23.0, 25.0, 11.0, 9.0, 7.0, 7.0, 8.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -42.6357421875, -41.146484375, -39.6572265625, -38.16796875, -36.6787109375, -35.189453125, -33.7001953125, -32.2109375, -30.7216796875, -29.232421875, -27.7431640625, -26.25390625, -24.7646484375, -23.275390625, -21.7861328125, -20.296875, -18.8076171875, -17.318359375, -15.8291015625, -14.33984375, -12.8505859375, -11.361328125, -9.8720703125, -8.3828125, -6.8935546875, -5.404296875, -3.9150390625, -2.42578125, -0.9365234375, 0.552734375, 2.0419921875, 3.53125, 5.0205078125, 6.509765625, 7.9990234375, 9.48828125, 10.9775390625, 12.466796875, 13.9560546875, 15.4453125, 16.9345703125, 18.423828125, 19.9130859375, 21.40234375, 22.8916015625, 24.380859375, 25.8701171875, 27.359375, 28.8486328125, 30.337890625, 31.8271484375, 33.31640625, 34.8056640625, 36.294921875, 37.7841796875, 39.2734375, 40.7626953125, 42.251953125, 43.7412109375, 45.23046875, 46.7197265625, 48.208984375, 49.6982421875, 51.1875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 14.0, 8.0, 20.0, 21.0, 18.0, 23.0, 34.0, 41.0, 54.0, 54.0, 64.0, 45.0, 54.0, 63.0, 51.0, 74.0, 51.0, 59.0, 41.0, 37.0, 28.0, 26.0, 22.0, 18.0, 19.0, 14.0, 7.0, 8.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.09375, -9.7362060546875, -9.378662109375, -9.0211181640625, -8.66357421875, -8.3060302734375, -7.948486328125, -7.5909423828125, -7.2333984375, -6.8758544921875, -6.518310546875, -6.1607666015625, -5.80322265625, -5.4456787109375, -5.088134765625, -4.7305908203125, -4.373046875, -4.0155029296875, -3.657958984375, -3.3004150390625, -2.94287109375, -2.5853271484375, -2.227783203125, -1.8702392578125, -1.5126953125, -1.1551513671875, -0.797607421875, -0.4400634765625, -0.08251953125, 0.2750244140625, 0.632568359375, 0.9901123046875, 1.34765625, 1.7052001953125, 2.062744140625, 2.4202880859375, 2.77783203125, 3.1353759765625, 3.492919921875, 3.8504638671875, 4.2080078125, 4.5655517578125, 4.923095703125, 5.2806396484375, 5.63818359375, 5.9957275390625, 6.353271484375, 6.7108154296875, 7.068359375, 7.4259033203125, 7.783447265625, 8.1409912109375, 8.49853515625, 8.8560791015625, 9.213623046875, 9.5711669921875, 9.9287109375, 10.2862548828125, 10.643798828125, 11.0013427734375, 11.35888671875, 11.7164306640625, 12.073974609375, 12.4315185546875, 12.7890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 6.0, 11.0, 17.0, 23.0, 19.0, 41.0, 48.0, 81.0, 131.0, 220.0, 447.0, 887.0, 2450.0, 8720.0, 48346.0, 588432.0, 356840.0, 31702.0, 6469.0, 1969.0, 769.0, 357.0, 170.0, 107.0, 80.0, 53.0, 39.0, 24.0, 20.0, 16.0, 7.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.921875, -22.179931640625, -21.43798828125, -20.696044921875, -19.9541015625, -19.212158203125, -18.47021484375, -17.728271484375, -16.986328125, -16.244384765625, -15.50244140625, -14.760498046875, -14.0185546875, -13.276611328125, -12.53466796875, -11.792724609375, -11.05078125, -10.308837890625, -9.56689453125, -8.824951171875, -8.0830078125, -7.341064453125, -6.59912109375, -5.857177734375, -5.115234375, -4.373291015625, -3.63134765625, -2.889404296875, -2.1474609375, -1.405517578125, -0.66357421875, 0.078369140625, 0.8203125, 1.562255859375, 2.30419921875, 3.046142578125, 3.7880859375, 4.530029296875, 5.27197265625, 6.013916015625, 6.755859375, 7.497802734375, 8.23974609375, 8.981689453125, 9.7236328125, 10.465576171875, 11.20751953125, 11.949462890625, 12.69140625, 13.433349609375, 14.17529296875, 14.917236328125, 15.6591796875, 16.401123046875, 17.14306640625, 17.885009765625, 18.626953125, 19.368896484375, 20.11083984375, 20.852783203125, 21.5947265625, 22.336669921875, 23.07861328125, 23.820556640625, 24.5625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 20.0, 18.0, 27.0, 38.0, 59.0, 87.0, 102.0, 100.0, 118.0, 112.0, 80.0, 72.0, 55.0, 32.0, 27.0, 11.0, 11.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001613616943359375, -0.001554638147354126, -0.001495659351348877, -0.001436680555343628, -0.001377701759338379, -0.0013187229633331299, -0.0012597441673278809, -0.0012007653713226318, -0.0011417865753173828, -0.0010828077793121338, -0.0010238289833068848, -0.0009648501873016357, -0.0009058713912963867, -0.0008468925952911377, -0.0007879137992858887, -0.0007289350032806396, -0.0006699562072753906, -0.0006109774112701416, -0.0005519986152648926, -0.0004930198192596436, -0.00043404102325439453, -0.0003750622272491455, -0.0003160834312438965, -0.00025710463523864746, -0.00019812583923339844, -0.00013914704322814941, -8.016824722290039e-05, -2.1189451217651367e-05, 3.7789344787597656e-05, 9.676814079284668e-05, 0.0001557469367980957, 0.00021472573280334473, 0.00027370452880859375, 0.0003326833248138428, 0.0003916621208190918, 0.0004506409168243408, 0.0005096197128295898, 0.0005685985088348389, 0.0006275773048400879, 0.0006865561008453369, 0.0007455348968505859, 0.000804513692855835, 0.000863492488861084, 0.000922471284866333, 0.000981450080871582, 0.001040428876876831, 0.00109940767288208, 0.001158386468887329, 0.0012173652648925781, 0.0012763440608978271, 0.0013353228569030762, 0.0013943016529083252, 0.0014532804489135742, 0.0015122592449188232, 0.0015712380409240723, 0.0016302168369293213, 0.0016891956329345703, 0.0017481744289398193, 0.0018071532249450684, 0.0018661320209503174, 0.0019251108169555664, 0.0019840896129608154, 0.0020430684089660645, 0.0021020472049713135, 0.0021610260009765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 4.0, 15.0, 17.0, 10.0, 25.0, 42.0, 79.0, 118.0, 228.0, 595.0, 2077.0, 11662.0, 169183.0, 809551.0, 47818.0, 5112.0, 1149.0, 419.0, 187.0, 91.0, 57.0, 18.0, 25.0, 11.0, 12.0, 14.0, 3.0, 9.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.52392578125, -23.6572265625, -22.79052734375, -21.923828125, -21.05712890625, -20.1904296875, -19.32373046875, -18.45703125, -17.59033203125, -16.7236328125, -15.85693359375, -14.990234375, -14.12353515625, -13.2568359375, -12.39013671875, -11.5234375, -10.65673828125, -9.7900390625, -8.92333984375, -8.056640625, -7.18994140625, -6.3232421875, -5.45654296875, -4.58984375, -3.72314453125, -2.8564453125, -1.98974609375, -1.123046875, -0.25634765625, 0.6103515625, 1.47705078125, 2.34375, 3.21044921875, 4.0771484375, 4.94384765625, 5.810546875, 6.67724609375, 7.5439453125, 8.41064453125, 9.27734375, 10.14404296875, 11.0107421875, 11.87744140625, 12.744140625, 13.61083984375, 14.4775390625, 15.34423828125, 16.2109375, 17.07763671875, 17.9443359375, 18.81103515625, 19.677734375, 20.54443359375, 21.4111328125, 22.27783203125, 23.14453125, 24.01123046875, 24.8779296875, 25.74462890625, 26.611328125, 27.47802734375, 28.3447265625, 29.21142578125, 30.078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 5.0, 13.0, 12.0, 13.0, 18.0, 17.0, 32.0, 42.0, 56.0, 75.0, 80.0, 96.0, 131.0, 84.0, 73.0, 53.0, 39.0, 41.0, 18.0, 17.0, 17.0, 13.0, 8.0, 5.0, 7.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4765625, -8.2275390625, -7.978515625, -7.7294921875, -7.48046875, -7.2314453125, -6.982421875, -6.7333984375, -6.484375, -6.2353515625, -5.986328125, -5.7373046875, -5.48828125, -5.2392578125, -4.990234375, -4.7412109375, -4.4921875, -4.2431640625, -3.994140625, -3.7451171875, -3.49609375, -3.2470703125, -2.998046875, -2.7490234375, -2.5, -2.2509765625, -2.001953125, -1.7529296875, -1.50390625, -1.2548828125, -1.005859375, -0.7568359375, -0.5078125, -0.2587890625, -0.009765625, 0.2392578125, 0.48828125, 0.7373046875, 0.986328125, 1.2353515625, 1.484375, 1.7333984375, 1.982421875, 2.2314453125, 2.48046875, 2.7294921875, 2.978515625, 3.2275390625, 3.4765625, 3.7255859375, 3.974609375, 4.2236328125, 4.47265625, 4.7216796875, 4.970703125, 5.2197265625, 5.46875, 5.7177734375, 5.966796875, 6.2158203125, 6.46484375, 6.7138671875, 6.962890625, 7.2119140625, 7.4609375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 19.0, 85.0, 397.0, 345.0, 99.0, 24.0, 10.0, 5.0, 2.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.99536895751953, -52.71883773803711, -41.44230651855469, -30.16577911376953, -18.88924789428711, -7.6127166748046875, 3.6638107299804688, 14.940345764160156, 26.216873168945312, 37.493404388427734, 48.769935607910156, 60.04646301269531, 71.322998046875, 82.59952545166016, 93.87605285644531, 105.152587890625, 116.42911529541016, 127.70564270019531, 138.982177734375, 150.25869750976562, 161.5352325439453, 172.811767578125, 184.08828735351562, 195.36483764648438, 206.641357421875, 217.9178924560547, 229.1944122314453, 240.470947265625, 251.7474822998047, 263.0240173339844, 274.300537109375, 285.57708740234375, 296.8536071777344, 308.130126953125, 319.40667724609375, 330.6831970214844, 341.959716796875, 353.23626708984375, 364.5127868652344, 375.789306640625, 387.06585693359375, 398.3423767089844, 409.6189270019531, 420.89544677734375, 432.1719665527344, 443.4485168457031, 454.72503662109375, 466.0015869140625, 477.278076171875, 488.5545959472656, 499.8311462402344, 511.107666015625, 522.3842163085938, 533.6607055664062, 544.937255859375, 556.2138061523438, 567.4903564453125, 578.7669067382812, 590.0433959960938, 601.3199462890625, 612.5964965820312, 623.8729858398438, 635.1495361328125, 646.4260864257812, 657.7025756835938]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 12.0, 8.0, 19.0, 23.0, 31.0, 52.0, 53.0, 72.0, 86.0, 85.0, 97.0, 83.0, 83.0, 63.0, 67.0, 52.0, 41.0, 21.0, 24.0, 14.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.49164581298828, -123.83369445800781, -120.17574310302734, -116.51779174804688, -112.85983276367188, -109.20188903808594, -105.54393005371094, -101.88597869873047, -98.22802734375, -94.57007598876953, -90.91212463378906, -87.2541732788086, -83.59622192382812, -79.93826293945312, -76.28031158447266, -72.62236022949219, -68.96440887451172, -65.30645751953125, -61.64850616455078, -57.99055099487305, -54.33259963989258, -50.67464828491211, -47.016693115234375, -43.358741760253906, -39.70079040527344, -36.04283905029297, -32.3848876953125, -28.726932525634766, -25.068981170654297, -21.411029815673828, -17.753076553344727, -14.095123291015625, -10.437179565429688, -6.779227256774902, -3.121274948120117, 0.536677360534668, 4.194629669189453, 7.852581024169922, 11.510534286499023, 15.168487548828125, 18.826438903808594, 22.484390258789062, 26.142343521118164, 29.800296783447266, 33.458248138427734, 37.1161994934082, 40.77415466308594, 44.432106018066406, 48.090057373046875, 51.748008728027344, 55.40596008300781, 59.06391525268555, 62.721866607666016, 66.37982177734375, 70.03777313232422, 73.69572448730469, 77.35367584228516, 81.01162719726562, 84.6695785522461, 88.32752990722656, 91.98548889160156, 95.6434326171875, 99.3013916015625, 102.95934295654297, 106.61729431152344]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 12.0, 20.0, 43.0, 99.0, 196.0, 616.0, 5633.0, 4184979.0, 2129.0, 316.0, 107.0, 56.0, 35.0, 19.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0], "bins": [-382.75, -375.3056640625, -367.861328125, -360.4169921875, -352.97265625, -345.5283203125, -338.083984375, -330.6396484375, -323.1953125, -315.7509765625, -308.306640625, -300.8623046875, -293.41796875, -285.9736328125, -278.529296875, -271.0849609375, -263.640625, -256.1962890625, -248.751953125, -241.3076171875, -233.86328125, -226.4189453125, -218.974609375, -211.5302734375, -204.0859375, -196.6416015625, -189.197265625, -181.7529296875, -174.30859375, -166.8642578125, -159.419921875, -151.9755859375, -144.53125, -137.0869140625, -129.642578125, -122.1982421875, -114.75390625, -107.3095703125, -99.865234375, -92.4208984375, -84.9765625, -77.5322265625, -70.087890625, -62.6435546875, -55.19921875, -47.7548828125, -40.310546875, -32.8662109375, -25.421875, -17.9775390625, -10.533203125, -3.0888671875, 4.35546875, 11.7998046875, 19.244140625, 26.6884765625, 34.1328125, 41.5771484375, 49.021484375, 56.4658203125, 63.91015625, 71.3544921875, 78.798828125, 86.2431640625, 93.6875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 41.0, 86.0, 177.0, 248.0, 221.0, 143.0, 60.0, 16.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -11.07891845703125, -10.8687744140625, -10.65863037109375, -10.448486328125, -10.23834228515625, -10.0281982421875, -9.81805419921875, -9.60791015625, -9.39776611328125, -9.1876220703125, -8.97747802734375, -8.767333984375, -8.55718994140625, -8.3470458984375, -8.13690185546875, -7.9267578125, -7.71661376953125, -7.5064697265625, -7.29632568359375, -7.086181640625, -6.87603759765625, -6.6658935546875, -6.45574951171875, -6.24560546875, -6.03546142578125, -5.8253173828125, -5.61517333984375, -5.405029296875, -5.19488525390625, -4.9847412109375, -4.77459716796875, -4.564453125, -4.35430908203125, -4.1441650390625, -3.93402099609375, -3.723876953125, -3.51373291015625, -3.3035888671875, -3.09344482421875, -2.88330078125, -2.67315673828125, -2.4630126953125, -2.25286865234375, -2.042724609375, -1.83258056640625, -1.6224365234375, -1.41229248046875, -1.2021484375, -0.99200439453125, -0.7818603515625, -0.57171630859375, -0.361572265625, -0.15142822265625, 0.0587158203125, 0.26885986328125, 0.47900390625, 0.68914794921875, 0.8992919921875, 1.10943603515625, 1.319580078125, 1.52972412109375, 1.7398681640625, 1.95001220703125, 2.16015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 14.0, 28.0, 38.0, 100.0, 167.0, 235.0, 401.0, 4184104.0, 8673.0, 237.0, 144.0, 79.0, 41.0, 25.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1247.0, -1221.4765625, -1195.953125, -1170.4296875, -1144.90625, -1119.3828125, -1093.859375, -1068.3359375, -1042.8125, -1017.2890625, -991.765625, -966.2421875, -940.71875, -915.1953125, -889.671875, -864.1484375, -838.625, -813.1015625, -787.578125, -762.0546875, -736.53125, -711.0078125, -685.484375, -659.9609375, -634.4375, -608.9140625, -583.390625, -557.8671875, -532.34375, -506.8203125, -481.296875, -455.7734375, -430.25, -404.7265625, -379.203125, -353.6796875, -328.15625, -302.6328125, -277.109375, -251.5859375, -226.0625, -200.5390625, -175.015625, -149.4921875, -123.96875, -98.4453125, -72.921875, -47.3984375, -21.875, 3.6484375, 29.171875, 54.6953125, 80.21875, 105.7421875, 131.265625, 156.7890625, 182.3125, 207.8359375, 233.359375, 258.8828125, 284.40625, 309.9296875, 335.453125, 360.9765625, 386.5]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 50.0, 637.0, 3359.0, 35.0, 8.0], "bins": [-112.875, -111.02838134765625, -109.1817626953125, -107.33514404296875, -105.488525390625, -103.64190673828125, -101.7952880859375, -99.94866943359375, -98.10205078125, -96.25543212890625, -94.4088134765625, -92.56219482421875, -90.715576171875, -88.86895751953125, -87.0223388671875, -85.17572021484375, -83.3291015625, -81.48248291015625, -79.6358642578125, -77.78924560546875, -75.942626953125, -74.09600830078125, -72.2493896484375, -70.40277099609375, -68.55615234375, -66.70953369140625, -64.8629150390625, -63.01629638671875, -61.169677734375, -59.32305908203125, -57.4764404296875, -55.62982177734375, -53.783203125, -51.93658447265625, -50.0899658203125, -48.24334716796875, -46.396728515625, -44.55010986328125, -42.7034912109375, -40.85687255859375, -39.01025390625, -37.16363525390625, -35.3170166015625, -33.47039794921875, -31.623779296875, -29.77716064453125, -27.9305419921875, -26.08392333984375, -24.2373046875, -22.39068603515625, -20.5440673828125, -18.69744873046875, -16.850830078125, -15.00421142578125, -13.1575927734375, -11.31097412109375, -9.46435546875, -7.61773681640625, -5.7711181640625, -3.92449951171875, -2.077880859375, -0.23126220703125, 1.6153564453125, 3.46197509765625, 5.30859375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 17.0, 247.0, 696.0, 36.0, 6.0, 2.0, 4.0, 1.0], "bins": [-1444.3778076171875, -1419.55126953125, -1394.724853515625, -1369.8983154296875, -1345.07177734375, -1320.245361328125, -1295.4188232421875, -1270.5924072265625, -1245.765869140625, -1220.9393310546875, -1196.1129150390625, -1171.286376953125, -1146.4599609375, -1121.6334228515625, -1096.806884765625, -1071.98046875, -1047.1539306640625, -1022.3274536132812, -997.5009765625, -972.6744384765625, -947.8479614257812, -923.021484375, -898.1949462890625, -873.3684692382812, -848.5419921875, -823.7155151367188, -798.8890380859375, -774.0625, -749.2360229492188, -724.4095458984375, -699.5830078125, -674.7565307617188, -649.9300537109375, -625.1035766601562, -600.277099609375, -575.4505615234375, -550.6240844726562, -525.797607421875, -500.9710998535156, -476.14459228515625, -451.318115234375, -426.49163818359375, -401.6651306152344, -376.838623046875, -352.01214599609375, -327.1856689453125, -302.3591613769531, -277.53265380859375, -252.70616149902344, -227.87966918945312, -203.0531768798828, -178.2266845703125, -153.4001922607422, -128.57369995117188, -103.74720764160156, -78.92071533203125, -54.09422302246094, -29.267730712890625, -4.4412384033203125, 20.38525390625, 45.21174621582031, 70.03823852539062, 94.86473083496094, 119.69122314453125, 144.51771545410156]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 18.0, 24.0, 56.0, 112.0, 146.0, 186.0, 153.0, 130.0, 74.0, 63.0, 18.0, 10.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.02392578125, -299.43194580078125, -287.8399658203125, -276.24798583984375, -264.656005859375, -253.06402587890625, -241.47203063964844, -229.8800506591797, -218.28807067871094, -206.6960906982422, -195.10411071777344, -183.51211547851562, -171.92013549804688, -160.32815551757812, -148.73617553710938, -137.14419555664062, -125.55221557617188, -113.96023559570312, -102.36825561523438, -90.7762680053711, -79.18428802490234, -67.5923080444336, -56.00032043457031, -44.40834045410156, -32.81636047363281, -21.22437858581543, -9.632396697998047, 1.9595870971679688, 13.551567077636719, 25.14354705810547, 36.73553466796875, 48.3275146484375, 59.91949462890625, 71.511474609375, 83.10345458984375, 94.69544219970703, 106.28742218017578, 117.87940216064453, 129.4713897705078, 141.06336975097656, 152.6553497314453, 164.24732971191406, 175.8393096923828, 187.43130493164062, 199.02328491210938, 210.61526489257812, 222.20724487304688, 233.79922485351562, 245.39120483398438, 256.9831848144531, 268.5751647949219, 280.1671447753906, 291.7591247558594, 303.3511047363281, 314.943115234375, 326.53509521484375, 338.1270751953125, 349.71905517578125, 361.31103515625, 372.90301513671875, 384.4949951171875, 396.08697509765625, 407.678955078125, 419.27093505859375, 430.8629150390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 16.0, 20.0, 30.0, 33.0, 46.0, 86.0, 125.0, 281.0, 684.0, 2401.0, 20412.0, 838701.0, 176341.0, 7004.0, 1356.0, 479.0, 195.0, 120.0, 52.0, 43.0, 23.0, 28.0, 16.0, 14.0, 14.0, 10.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.375, -136.783203125, -132.19140625, -127.599609375, -123.0078125, -118.416015625, -113.82421875, -109.232421875, -104.640625, -100.048828125, -95.45703125, -90.865234375, -86.2734375, -81.681640625, -77.08984375, -72.498046875, -67.90625, -63.314453125, -58.72265625, -54.130859375, -49.5390625, -44.947265625, -40.35546875, -35.763671875, -31.171875, -26.580078125, -21.98828125, -17.396484375, -12.8046875, -8.212890625, -3.62109375, 0.970703125, 5.5625, 10.154296875, 14.74609375, 19.337890625, 23.9296875, 28.521484375, 33.11328125, 37.705078125, 42.296875, 46.888671875, 51.48046875, 56.072265625, 60.6640625, 65.255859375, 69.84765625, 74.439453125, 79.03125, 83.623046875, 88.21484375, 92.806640625, 97.3984375, 101.990234375, 106.58203125, 111.173828125, 115.765625, 120.357421875, 124.94921875, 129.541015625, 134.1328125, 138.724609375, 143.31640625, 147.908203125, 152.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 12.0, 29.0, 46.0, 67.0, 106.0, 125.0, 145.0, 153.0, 101.0, 88.0, 57.0, 31.0, 19.0, 13.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.312255859375, -18.85888671875, -18.405517578125, -17.9521484375, -17.498779296875, -17.04541015625, -16.592041015625, -16.138671875, -15.685302734375, -15.23193359375, -14.778564453125, -14.3251953125, -13.871826171875, -13.41845703125, -12.965087890625, -12.51171875, -12.058349609375, -11.60498046875, -11.151611328125, -10.6982421875, -10.244873046875, -9.79150390625, -9.338134765625, -8.884765625, -8.431396484375, -7.97802734375, -7.524658203125, -7.0712890625, -6.617919921875, -6.16455078125, -5.711181640625, -5.2578125, -4.804443359375, -4.35107421875, -3.897705078125, -3.4443359375, -2.990966796875, -2.53759765625, -2.084228515625, -1.630859375, -1.177490234375, -0.72412109375, -0.270751953125, 0.1826171875, 0.635986328125, 1.08935546875, 1.542724609375, 1.99609375, 2.449462890625, 2.90283203125, 3.356201171875, 3.8095703125, 4.262939453125, 4.71630859375, 5.169677734375, 5.623046875, 6.076416015625, 6.52978515625, 6.983154296875, 7.4365234375, 7.889892578125, 8.34326171875, 8.796630859375, 9.25]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 11.0, 15.0, 14.0, 13.0, 23.0, 23.0, 46.0, 71.0, 111.0, 293.0, 1010.0, 7723.0, 358053.0, 666998.0, 12134.0, 1309.0, 332.0, 133.0, 61.0, 47.0, 32.0, 27.0, 22.0, 8.0, 9.0, 7.0, 6.0, 5.0, 6.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.0, -112.693359375, -109.38671875, -106.080078125, -102.7734375, -99.466796875, -96.16015625, -92.853515625, -89.546875, -86.240234375, -82.93359375, -79.626953125, -76.3203125, -73.013671875, -69.70703125, -66.400390625, -63.09375, -59.787109375, -56.48046875, -53.173828125, -49.8671875, -46.560546875, -43.25390625, -39.947265625, -36.640625, -33.333984375, -30.02734375, -26.720703125, -23.4140625, -20.107421875, -16.80078125, -13.494140625, -10.1875, -6.880859375, -3.57421875, -0.267578125, 3.0390625, 6.345703125, 9.65234375, 12.958984375, 16.265625, 19.572265625, 22.87890625, 26.185546875, 29.4921875, 32.798828125, 36.10546875, 39.412109375, 42.71875, 46.025390625, 49.33203125, 52.638671875, 55.9453125, 59.251953125, 62.55859375, 65.865234375, 69.171875, 72.478515625, 75.78515625, 79.091796875, 82.3984375, 85.705078125, 89.01171875, 92.318359375, 95.625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 4.0, 11.0, 13.0, 12.0, 16.0, 26.0, 21.0, 36.0, 42.0, 49.0, 54.0, 73.0, 77.0, 60.0, 60.0, 64.0, 59.0, 43.0, 48.0, 31.0, 38.0, 39.0, 27.0, 21.0, 13.0, 10.0, 14.0, 5.0, 2.0, 4.0, 8.0, 3.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.375, -35.37109375, -34.3671875, -33.36328125, -32.359375, -31.35546875, -30.3515625, -29.34765625, -28.34375, -27.33984375, -26.3359375, -25.33203125, -24.328125, -23.32421875, -22.3203125, -21.31640625, -20.3125, -19.30859375, -18.3046875, -17.30078125, -16.296875, -15.29296875, -14.2890625, -13.28515625, -12.28125, -11.27734375, -10.2734375, -9.26953125, -8.265625, -7.26171875, -6.2578125, -5.25390625, -4.25, -3.24609375, -2.2421875, -1.23828125, -0.234375, 0.76953125, 1.7734375, 2.77734375, 3.78125, 4.78515625, 5.7890625, 6.79296875, 7.796875, 8.80078125, 9.8046875, 10.80859375, 11.8125, 12.81640625, 13.8203125, 14.82421875, 15.828125, 16.83203125, 17.8359375, 18.83984375, 19.84375, 20.84765625, 21.8515625, 22.85546875, 23.859375, 24.86328125, 25.8671875, 26.87109375, 27.875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 12.0, 11.0, 13.0, 16.0, 18.0, 31.0, 56.0, 75.0, 101.0, 192.0, 448.0, 1209.0, 4260.0, 38600.0, 956396.0, 40468.0, 4511.0, 1159.0, 438.0, 196.0, 106.0, 79.0, 41.0, 16.0, 18.0, 11.0, 14.0, 7.0, 4.0, 4.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.03125, -56.88525390625, -54.7392578125, -52.59326171875, -50.447265625, -48.30126953125, -46.1552734375, -44.00927734375, -41.86328125, -39.71728515625, -37.5712890625, -35.42529296875, -33.279296875, -31.13330078125, -28.9873046875, -26.84130859375, -24.6953125, -22.54931640625, -20.4033203125, -18.25732421875, -16.111328125, -13.96533203125, -11.8193359375, -9.67333984375, -7.52734375, -5.38134765625, -3.2353515625, -1.08935546875, 1.056640625, 3.20263671875, 5.3486328125, 7.49462890625, 9.640625, 11.78662109375, 13.9326171875, 16.07861328125, 18.224609375, 20.37060546875, 22.5166015625, 24.66259765625, 26.80859375, 28.95458984375, 31.1005859375, 33.24658203125, 35.392578125, 37.53857421875, 39.6845703125, 41.83056640625, 43.9765625, 46.12255859375, 48.2685546875, 50.41455078125, 52.560546875, 54.70654296875, 56.8525390625, 58.99853515625, 61.14453125, 63.29052734375, 65.4365234375, 67.58251953125, 69.728515625, 71.87451171875, 74.0205078125, 76.16650390625, 78.3125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 11.0, 12.0, 35.0, 50.0, 66.0, 109.0, 150.0, 175.0, 140.0, 101.0, 56.0, 27.0, 16.0, 16.0, 12.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00446319580078125, -0.0043437182903289795, -0.004224240779876709, -0.0041047632694244385, -0.003985285758972168, -0.0038658082485198975, -0.003746330738067627, -0.0036268532276153564, -0.003507375717163086, -0.0033878982067108154, -0.003268420696258545, -0.0031489431858062744, -0.003029465675354004, -0.0029099881649017334, -0.002790510654449463, -0.0026710331439971924, -0.002551555633544922, -0.0024320781230926514, -0.002312600612640381, -0.0021931231021881104, -0.00207364559173584, -0.0019541680812835693, -0.0018346905708312988, -0.0017152130603790283, -0.0015957355499267578, -0.0014762580394744873, -0.0013567805290222168, -0.0012373030185699463, -0.0011178255081176758, -0.0009983479976654053, -0.0008788704872131348, -0.0007593929767608643, -0.0006399154663085938, -0.0005204379558563232, -0.00040096044540405273, -0.0002814829349517822, -0.00016200542449951172, -4.252791404724121e-05, 7.69495964050293e-05, 0.0001964271068572998, 0.0003159046173095703, 0.0004353821277618408, 0.0005548596382141113, 0.0006743371486663818, 0.0007938146591186523, 0.0009132921695709229, 0.0010327696800231934, 0.0011522471904754639, 0.0012717247009277344, 0.0013912022113800049, 0.0015106797218322754, 0.001630157232284546, 0.0017496347427368164, 0.001869112253189087, 0.0019885897636413574, 0.002108067274093628, 0.0022275447845458984, 0.002347022294998169, 0.0024664998054504395, 0.00258597731590271, 0.0027054548263549805, 0.002824932336807251, 0.0029444098472595215, 0.003063887357711792, 0.0031833648681640625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 9.0, 1.0, 8.0, 8.0, 8.0, 13.0, 35.0, 38.0, 64.0, 98.0, 189.0, 444.0, 1396.0, 6770.0, 191537.0, 829537.0, 15049.0, 2232.0, 599.0, 194.0, 123.0, 64.0, 44.0, 21.0, 20.0, 4.0, 13.0, 6.0, 6.0, 8.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-68.0, -66.1708984375, -64.341796875, -62.5126953125, -60.68359375, -58.8544921875, -57.025390625, -55.1962890625, -53.3671875, -51.5380859375, -49.708984375, -47.8798828125, -46.05078125, -44.2216796875, -42.392578125, -40.5634765625, -38.734375, -36.9052734375, -35.076171875, -33.2470703125, -31.41796875, -29.5888671875, -27.759765625, -25.9306640625, -24.1015625, -22.2724609375, -20.443359375, -18.6142578125, -16.78515625, -14.9560546875, -13.126953125, -11.2978515625, -9.46875, -7.6396484375, -5.810546875, -3.9814453125, -2.15234375, -0.3232421875, 1.505859375, 3.3349609375, 5.1640625, 6.9931640625, 8.822265625, 10.6513671875, 12.48046875, 14.3095703125, 16.138671875, 17.9677734375, 19.796875, 21.6259765625, 23.455078125, 25.2841796875, 27.11328125, 28.9423828125, 30.771484375, 32.6005859375, 34.4296875, 36.2587890625, 38.087890625, 39.9169921875, 41.74609375, 43.5751953125, 45.404296875, 47.2333984375, 49.0625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 15.0, 24.0, 34.0, 46.0, 75.0, 99.0, 122.0, 127.0, 119.0, 119.0, 69.0, 39.0, 27.0, 17.0, 13.0, 6.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.6788330078125, -23.107666015625, -22.5364990234375, -21.96533203125, -21.3941650390625, -20.822998046875, -20.2518310546875, -19.6806640625, -19.1094970703125, -18.538330078125, -17.9671630859375, -17.39599609375, -16.8248291015625, -16.253662109375, -15.6824951171875, -15.111328125, -14.5401611328125, -13.968994140625, -13.3978271484375, -12.82666015625, -12.2554931640625, -11.684326171875, -11.1131591796875, -10.5419921875, -9.9708251953125, -9.399658203125, -8.8284912109375, -8.25732421875, -7.6861572265625, -7.114990234375, -6.5438232421875, -5.97265625, -5.4014892578125, -4.830322265625, -4.2591552734375, -3.68798828125, -3.1168212890625, -2.545654296875, -1.9744873046875, -1.4033203125, -0.8321533203125, -0.260986328125, 0.3101806640625, 0.88134765625, 1.4525146484375, 2.023681640625, 2.5948486328125, 3.166015625, 3.7371826171875, 4.308349609375, 4.8795166015625, 5.45068359375, 6.0218505859375, 6.593017578125, 7.1641845703125, 7.7353515625, 8.3065185546875, 8.877685546875, 9.4488525390625, 10.02001953125, 10.5911865234375, 11.162353515625, 11.7335205078125, 12.3046875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 8.0, 8.0, 29.0, 106.0, 354.0, 358.0, 100.0, 24.0, 10.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.0758285522461, -94.62273406982422, -78.16964721679688, -61.716552734375, -45.263458251953125, -28.81036376953125, -12.357276916503906, 4.095817565917969, 20.548912048339844, 37.00200653076172, 53.45509719848633, 69.90818786621094, 86.36128234863281, 102.81437683105469, 119.26746368408203, 135.72055053710938, 152.17364501953125, 168.62673950195312, 185.079833984375, 201.53292846679688, 217.98602294921875, 234.43911743164062, 250.89219665527344, 267.34527587890625, 283.79840087890625, 300.2514953613281, 316.70458984375, 333.1576843261719, 349.61077880859375, 366.0638732910156, 382.5169677734375, 398.97003173828125, 415.423095703125, 431.8761901855469, 448.32928466796875, 464.7823791503906, 481.2354736328125, 497.6885681152344, 514.1416625976562, 530.5947265625, 547.0478515625, 563.5009155273438, 579.9540405273438, 596.4071044921875, 612.8602294921875, 629.3132934570312, 645.7664184570312, 662.219482421875, 678.672607421875, 695.1256713867188, 711.5787963867188, 728.0318603515625, 744.4849853515625, 760.9380493164062, 777.3911743164062, 793.84423828125, 810.2973022460938, 826.7503662109375, 843.2034912109375, 859.6565551757812, 876.1096801757812, 892.562744140625, 909.015869140625, 925.4689331054688, 941.9220581054688]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 12.0, 20.0, 28.0, 29.0, 35.0, 43.0, 49.0, 49.0, 56.0, 58.0, 63.0, 67.0, 67.0, 50.0, 52.0, 58.0, 42.0, 33.0, 36.0, 31.0, 20.0, 19.0, 17.0, 6.0, 10.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-221.92776489257812, -215.7952117919922, -209.6626739501953, -203.53012084960938, -197.39756774902344, -191.2650146484375, -185.13247680664062, -178.9999237060547, -172.86737060546875, -166.7348175048828, -160.60227966308594, -154.4697265625, -148.33717346191406, -142.20462036132812, -136.07208251953125, -129.9395294189453, -123.80699157714844, -117.67444610595703, -111.5418930053711, -105.40934753417969, -99.27679443359375, -93.14424896240234, -87.01170349121094, -80.879150390625, -74.7466049194336, -68.61405944824219, -62.48150634765625, -56.348960876464844, -50.21641159057617, -44.0838623046875, -37.951316833496094, -31.818767547607422, -25.68621826171875, -19.553668975830078, -13.421121597290039, -7.28857421875, -1.1560249328613281, 4.976524353027344, 11.10906982421875, 17.241619110107422, 23.374168395996094, 29.506717681884766, 35.63926696777344, 41.771812438964844, 47.904361724853516, 54.03691101074219, 60.169456481933594, 66.302001953125, 72.43455505371094, 78.56710052490234, 84.69965362548828, 90.83219909667969, 96.96475219726562, 103.09729766845703, 109.22984313964844, 115.36239624023438, 121.49494171142578, 127.62748718261719, 133.76004028320312, 139.892578125, 146.02513122558594, 152.15768432617188, 158.29022216796875, 164.4227752685547, 170.55532836914062]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 13.0, 19.0, 37.0, 77.0, 187.0, 381.0, 1661.0, 48013.0, 4137049.0, 6214.0, 388.0, 118.0, 63.0, 35.0, 14.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-346.5, -339.611328125, -332.72265625, -325.833984375, -318.9453125, -312.056640625, -305.16796875, -298.279296875, -291.390625, -284.501953125, -277.61328125, -270.724609375, -263.8359375, -256.947265625, -250.05859375, -243.169921875, -236.28125, -229.392578125, -222.50390625, -215.615234375, -208.7265625, -201.837890625, -194.94921875, -188.060546875, -181.171875, -174.283203125, -167.39453125, -160.505859375, -153.6171875, -146.728515625, -139.83984375, -132.951171875, -126.0625, -119.173828125, -112.28515625, -105.396484375, -98.5078125, -91.619140625, -84.73046875, -77.841796875, -70.953125, -64.064453125, -57.17578125, -50.287109375, -43.3984375, -36.509765625, -29.62109375, -22.732421875, -15.84375, -8.955078125, -2.06640625, 4.822265625, 11.7109375, 18.599609375, 25.48828125, 32.376953125, 39.265625, 46.154296875, 53.04296875, 59.931640625, 66.8203125, 73.708984375, 80.59765625, 87.486328125, 94.375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 22.0, 46.0, 67.0, 84.0, 117.0, 123.0, 132.0, 117.0, 92.0, 62.0, 42.0, 28.0, 22.0, 15.0, 3.0, 4.0, 0.0, 2.0, 0.0, 3.0], "bins": [-19.6875, -19.29345703125, -18.8994140625, -18.50537109375, -18.111328125, -17.71728515625, -17.3232421875, -16.92919921875, -16.53515625, -16.14111328125, -15.7470703125, -15.35302734375, -14.958984375, -14.56494140625, -14.1708984375, -13.77685546875, -13.3828125, -12.98876953125, -12.5947265625, -12.20068359375, -11.806640625, -11.41259765625, -11.0185546875, -10.62451171875, -10.23046875, -9.83642578125, -9.4423828125, -9.04833984375, -8.654296875, -8.26025390625, -7.8662109375, -7.47216796875, -7.078125, -6.68408203125, -6.2900390625, -5.89599609375, -5.501953125, -5.10791015625, -4.7138671875, -4.31982421875, -3.92578125, -3.53173828125, -3.1376953125, -2.74365234375, -2.349609375, -1.95556640625, -1.5615234375, -1.16748046875, -0.7734375, -0.37939453125, 0.0146484375, 0.40869140625, 0.802734375, 1.19677734375, 1.5908203125, 1.98486328125, 2.37890625, 2.77294921875, 3.1669921875, 3.56103515625, 3.955078125, 4.34912109375, 4.7431640625, 5.13720703125, 5.53125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 11.0, 34.0, 113.0, 276.0, 3520.0, 4189600.0, 603.0, 82.0, 38.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1323.0, -1298.18359375, -1273.3671875, -1248.55078125, -1223.734375, -1198.91796875, -1174.1015625, -1149.28515625, -1124.46875, -1099.65234375, -1074.8359375, -1050.01953125, -1025.203125, -1000.38671875, -975.5703125, -950.75390625, -925.9375, -901.12109375, -876.3046875, -851.48828125, -826.671875, -801.85546875, -777.0390625, -752.22265625, -727.40625, -702.58984375, -677.7734375, -652.95703125, -628.140625, -603.32421875, -578.5078125, -553.69140625, -528.875, -504.05859375, -479.2421875, -454.42578125, -429.609375, -404.79296875, -379.9765625, -355.16015625, -330.34375, -305.52734375, -280.7109375, -255.89453125, -231.078125, -206.26171875, -181.4453125, -156.62890625, -131.8125, -106.99609375, -82.1796875, -57.36328125, -32.546875, -7.73046875, 17.0859375, 41.90234375, 66.71875, 91.53515625, 116.3515625, 141.16796875, 165.984375, 190.80078125, 215.6171875, 240.43359375, 265.25]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 20.0, 52.0, 460.0, 3394.0, 131.0, 21.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.875, -101.997802734375, -100.12060546875, -98.243408203125, -96.3662109375, -94.489013671875, -92.61181640625, -90.734619140625, -88.857421875, -86.980224609375, -85.10302734375, -83.225830078125, -81.3486328125, -79.471435546875, -77.59423828125, -75.717041015625, -73.83984375, -71.962646484375, -70.08544921875, -68.208251953125, -66.3310546875, -64.453857421875, -62.57666015625, -60.699462890625, -58.822265625, -56.945068359375, -55.06787109375, -53.190673828125, -51.3134765625, -49.436279296875, -47.55908203125, -45.681884765625, -43.8046875, -41.927490234375, -40.05029296875, -38.173095703125, -36.2958984375, -34.418701171875, -32.54150390625, -30.664306640625, -28.787109375, -26.909912109375, -25.03271484375, -23.155517578125, -21.2783203125, -19.401123046875, -17.52392578125, -15.646728515625, -13.76953125, -11.892333984375, -10.01513671875, -8.137939453125, -6.2607421875, -4.383544921875, -2.50634765625, -0.629150390625, 1.248046875, 3.125244140625, 5.00244140625, 6.879638671875, 8.7568359375, 10.634033203125, 12.51123046875, 14.388427734375, 16.265625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 13.0, 37.0, 229.0, 568.0, 111.0, 22.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-576.6055297851562, -566.0121459960938, -555.4188232421875, -544.825439453125, -534.2320556640625, -523.6387329101562, -513.0453491210938, -502.4519958496094, -491.858642578125, -481.2652893066406, -470.6719055175781, -460.07855224609375, -449.4851989746094, -438.891845703125, -428.2984619140625, -417.7051086425781, -407.11175537109375, -396.5184020996094, -385.9250183105469, -375.3316650390625, -364.7383117675781, -354.14495849609375, -343.55157470703125, -332.9582214355469, -322.3648376464844, -311.771484375, -301.1781005859375, -290.5847473144531, -279.99139404296875, -269.3980407714844, -258.8046569824219, -248.2113037109375, -237.61798095703125, -227.0246124267578, -216.43125915527344, -205.837890625, -195.24453735351562, -184.6511688232422, -174.05780029296875, -163.46444702148438, -152.87107849121094, -142.2777099609375, -131.68435668945312, -121.09098815917969, -110.49763488769531, -99.90426635742188, -89.31090545654297, -78.71754455566406, -68.12418365478516, -57.53082275390625, -46.937461853027344, -36.34409713745117, -25.750736236572266, -15.15737533569336, -4.5640106201171875, 6.029350280761719, 16.622711181640625, 27.21607208251953, 37.80943298339844, 48.40279769897461, 58.996158599853516, 69.58952331542969, 80.1828842163086, 90.7762451171875, 101.3696060180664]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 10.0, 18.0, 31.0, 36.0, 51.0, 101.0, 81.0, 111.0, 114.0, 103.0, 88.0, 82.0, 73.0, 32.0, 27.0, 23.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-202.74334716796875, -197.2250213623047, -191.7067108154297, -186.18838500976562, -180.67007446289062, -175.15174865722656, -169.6334228515625, -164.1151123046875, -158.59678649902344, -153.07846069335938, -147.56015014648438, -142.0418243408203, -136.52349853515625, -131.00518798828125, -125.48686218261719, -119.96854400634766, -114.45022583007812, -108.9319076538086, -103.41358947753906, -97.895263671875, -92.37694549560547, -86.85862731933594, -81.34030151367188, -75.82198333740234, -70.30366516113281, -64.78534698486328, -59.267024993896484, -53.74870300292969, -48.230384826660156, -42.712066650390625, -37.19374465942383, -31.67542266845703, -26.1571044921875, -20.638784408569336, -15.120464324951172, -9.602144241333008, -4.083824157714844, 1.4344959259033203, 6.952816009521484, 12.471138000488281, 17.989456176757812, 23.507776260375977, 29.02609634399414, 34.54441833496094, 40.06273651123047, 45.5810546875, 51.0993766784668, 56.617698669433594, 62.136016845703125, 67.65433502197266, 73.17265319824219, 78.69097900390625, 84.20929718017578, 89.72761535644531, 95.24594116210938, 100.7642593383789, 106.28257751464844, 111.80089569091797, 117.3192138671875, 122.83753967285156, 128.35586547851562, 133.87417602539062, 139.3925018310547, 144.91082763671875, 150.42913818359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 2.0, 8.0, 11.0, 6.0, 13.0, 26.0, 23.0, 30.0, 40.0, 44.0, 77.0, 91.0, 112.0, 192.0, 296.0, 526.0, 1115.0, 2766.0, 10190.0, 54886.0, 410692.0, 482966.0, 66544.0, 11989.0, 3092.0, 1185.0, 556.0, 335.0, 176.0, 155.0, 105.0, 67.0, 45.0, 35.0, 35.0, 19.0, 16.0, 23.0, 9.0, 12.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-59.625, -57.7646484375, -55.904296875, -54.0439453125, -52.18359375, -50.3232421875, -48.462890625, -46.6025390625, -44.7421875, -42.8818359375, -41.021484375, -39.1611328125, -37.30078125, -35.4404296875, -33.580078125, -31.7197265625, -29.859375, -27.9990234375, -26.138671875, -24.2783203125, -22.41796875, -20.5576171875, -18.697265625, -16.8369140625, -14.9765625, -13.1162109375, -11.255859375, -9.3955078125, -7.53515625, -5.6748046875, -3.814453125, -1.9541015625, -0.09375, 1.7666015625, 3.626953125, 5.4873046875, 7.34765625, 9.2080078125, 11.068359375, 12.9287109375, 14.7890625, 16.6494140625, 18.509765625, 20.3701171875, 22.23046875, 24.0908203125, 25.951171875, 27.8115234375, 29.671875, 31.5322265625, 33.392578125, 35.2529296875, 37.11328125, 38.9736328125, 40.833984375, 42.6943359375, 44.5546875, 46.4150390625, 48.275390625, 50.1357421875, 51.99609375, 53.8564453125, 55.716796875, 57.5771484375, 59.4375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 18.0, 21.0, 24.0, 35.0, 62.0, 78.0, 87.0, 87.0, 106.0, 108.0, 92.0, 81.0, 63.0, 57.0, 24.0, 22.0, 15.0, 7.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.46875, -19.021728515625, -18.57470703125, -18.127685546875, -17.6806640625, -17.233642578125, -16.78662109375, -16.339599609375, -15.892578125, -15.445556640625, -14.99853515625, -14.551513671875, -14.1044921875, -13.657470703125, -13.21044921875, -12.763427734375, -12.31640625, -11.869384765625, -11.42236328125, -10.975341796875, -10.5283203125, -10.081298828125, -9.63427734375, -9.187255859375, -8.740234375, -8.293212890625, -7.84619140625, -7.399169921875, -6.9521484375, -6.505126953125, -6.05810546875, -5.611083984375, -5.1640625, -4.717041015625, -4.27001953125, -3.822998046875, -3.3759765625, -2.928955078125, -2.48193359375, -2.034912109375, -1.587890625, -1.140869140625, -0.69384765625, -0.246826171875, 0.2001953125, 0.647216796875, 1.09423828125, 1.541259765625, 1.98828125, 2.435302734375, 2.88232421875, 3.329345703125, 3.7763671875, 4.223388671875, 4.67041015625, 5.117431640625, 5.564453125, 6.011474609375, 6.45849609375, 6.905517578125, 7.3525390625, 7.799560546875, 8.24658203125, 8.693603515625, 9.140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 8.0, 12.0, 12.0, 19.0, 26.0, 32.0, 46.0, 70.0, 139.0, 306.0, 754.0, 2205.0, 9178.0, 72958.0, 715493.0, 222181.0, 19258.0, 3794.0, 1074.0, 433.0, 220.0, 97.0, 65.0, 39.0, 29.0, 25.0, 17.0, 13.0, 8.0, 1.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.28125, -58.31787109375, -56.3544921875, -54.39111328125, -52.427734375, -50.46435546875, -48.5009765625, -46.53759765625, -44.57421875, -42.61083984375, -40.6474609375, -38.68408203125, -36.720703125, -34.75732421875, -32.7939453125, -30.83056640625, -28.8671875, -26.90380859375, -24.9404296875, -22.97705078125, -21.013671875, -19.05029296875, -17.0869140625, -15.12353515625, -13.16015625, -11.19677734375, -9.2333984375, -7.27001953125, -5.306640625, -3.34326171875, -1.3798828125, 0.58349609375, 2.546875, 4.51025390625, 6.4736328125, 8.43701171875, 10.400390625, 12.36376953125, 14.3271484375, 16.29052734375, 18.25390625, 20.21728515625, 22.1806640625, 24.14404296875, 26.107421875, 28.07080078125, 30.0341796875, 31.99755859375, 33.9609375, 35.92431640625, 37.8876953125, 39.85107421875, 41.814453125, 43.77783203125, 45.7412109375, 47.70458984375, 49.66796875, 51.63134765625, 53.5947265625, 55.55810546875, 57.521484375, 59.48486328125, 61.4482421875, 63.41162109375, 65.375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 8.0, 8.0, 8.0, 16.0, 23.0, 17.0, 16.0, 31.0, 28.0, 42.0, 46.0, 53.0, 49.0, 51.0, 67.0, 52.0, 64.0, 62.0, 69.0, 26.0, 54.0, 34.0, 31.0, 29.0, 19.0, 19.0, 17.0, 9.0, 15.0, 3.0, 5.0, 4.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.90625, -33.7880859375, -32.669921875, -31.5517578125, -30.43359375, -29.3154296875, -28.197265625, -27.0791015625, -25.9609375, -24.8427734375, -23.724609375, -22.6064453125, -21.48828125, -20.3701171875, -19.251953125, -18.1337890625, -17.015625, -15.8974609375, -14.779296875, -13.6611328125, -12.54296875, -11.4248046875, -10.306640625, -9.1884765625, -8.0703125, -6.9521484375, -5.833984375, -4.7158203125, -3.59765625, -2.4794921875, -1.361328125, -0.2431640625, 0.875, 1.9931640625, 3.111328125, 4.2294921875, 5.34765625, 6.4658203125, 7.583984375, 8.7021484375, 9.8203125, 10.9384765625, 12.056640625, 13.1748046875, 14.29296875, 15.4111328125, 16.529296875, 17.6474609375, 18.765625, 19.8837890625, 21.001953125, 22.1201171875, 23.23828125, 24.3564453125, 25.474609375, 26.5927734375, 27.7109375, 28.8291015625, 29.947265625, 31.0654296875, 32.18359375, 33.3017578125, 34.419921875, 35.5380859375, 36.65625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 17.0, 13.0, 25.0, 32.0, 59.0, 83.0, 194.0, 308.0, 718.0, 1928.0, 6971.0, 40431.0, 577852.0, 383024.0, 28517.0, 5411.0, 1636.0, 634.0, 305.0, 167.0, 89.0, 36.0, 43.0, 15.0, 15.0, 9.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.3125, -33.452880859375, -32.59326171875, -31.733642578125, -30.8740234375, -30.014404296875, -29.15478515625, -28.295166015625, -27.435546875, -26.575927734375, -25.71630859375, -24.856689453125, -23.9970703125, -23.137451171875, -22.27783203125, -21.418212890625, -20.55859375, -19.698974609375, -18.83935546875, -17.979736328125, -17.1201171875, -16.260498046875, -15.40087890625, -14.541259765625, -13.681640625, -12.822021484375, -11.96240234375, -11.102783203125, -10.2431640625, -9.383544921875, -8.52392578125, -7.664306640625, -6.8046875, -5.945068359375, -5.08544921875, -4.225830078125, -3.3662109375, -2.506591796875, -1.64697265625, -0.787353515625, 0.072265625, 0.931884765625, 1.79150390625, 2.651123046875, 3.5107421875, 4.370361328125, 5.22998046875, 6.089599609375, 6.94921875, 7.808837890625, 8.66845703125, 9.528076171875, 10.3876953125, 11.247314453125, 12.10693359375, 12.966552734375, 13.826171875, 14.685791015625, 15.54541015625, 16.405029296875, 17.2646484375, 18.124267578125, 18.98388671875, 19.843505859375, 20.703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 5.0, 1.0, 13.0, 7.0, 6.0, 11.0, 13.0, 21.0, 21.0, 36.0, 29.0, 43.0, 55.0, 50.0, 98.0, 77.0, 86.0, 66.0, 58.0, 67.0, 51.0, 48.0, 30.0, 19.0, 16.0, 16.0, 13.0, 8.0, 8.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002124786376953125, -0.0020676404237747192, -0.0020104944705963135, -0.0019533485174179077, -0.001896202564239502, -0.0018390566110610962, -0.0017819106578826904, -0.0017247647047042847, -0.001667618751525879, -0.0016104727983474731, -0.0015533268451690674, -0.0014961808919906616, -0.0014390349388122559, -0.00138188898563385, -0.0013247430324554443, -0.0012675970792770386, -0.0012104511260986328, -0.001153305172920227, -0.0010961592197418213, -0.0010390132665634155, -0.0009818673133850098, -0.000924721360206604, -0.0008675754070281982, -0.0008104294538497925, -0.0007532835006713867, -0.000696137547492981, -0.0006389915943145752, -0.0005818456411361694, -0.0005246996879577637, -0.0004675537347793579, -0.00041040778160095215, -0.0003532618284225464, -0.0002961158752441406, -0.00023896992206573486, -0.0001818239688873291, -0.00012467801570892334, -6.753206253051758e-05, -1.0386109352111816e-05, 4.6759843826293945e-05, 0.00010390579700469971, 0.00016105175018310547, 0.00021819770336151123, 0.000275343656539917, 0.00033248960971832275, 0.0003896355628967285, 0.0004467815160751343, 0.00050392746925354, 0.0005610734224319458, 0.0006182193756103516, 0.0006753653287887573, 0.0007325112819671631, 0.0007896572351455688, 0.0008468031883239746, 0.0009039491415023804, 0.0009610950946807861, 0.001018241047859192, 0.0010753870010375977, 0.0011325329542160034, 0.0011896789073944092, 0.001246824860572815, 0.0013039708137512207, 0.0013611167669296265, 0.0014182627201080322, 0.001475408673286438, 0.0015325546264648438]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 14.0, 15.0, 18.0, 26.0, 36.0, 59.0, 103.0, 182.0, 364.0, 866.0, 2337.0, 9393.0, 65379.0, 810505.0, 139064.0, 14861.0, 3233.0, 1024.0, 467.0, 231.0, 113.0, 88.0, 41.0, 28.0, 23.0, 18.0, 14.0, 7.0, 3.0, 8.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.370361328125, -32.45947265625, -31.548583984375, -30.6376953125, -29.726806640625, -28.81591796875, -27.905029296875, -26.994140625, -26.083251953125, -25.17236328125, -24.261474609375, -23.3505859375, -22.439697265625, -21.52880859375, -20.617919921875, -19.70703125, -18.796142578125, -17.88525390625, -16.974365234375, -16.0634765625, -15.152587890625, -14.24169921875, -13.330810546875, -12.419921875, -11.509033203125, -10.59814453125, -9.687255859375, -8.7763671875, -7.865478515625, -6.95458984375, -6.043701171875, -5.1328125, -4.221923828125, -3.31103515625, -2.400146484375, -1.4892578125, -0.578369140625, 0.33251953125, 1.243408203125, 2.154296875, 3.065185546875, 3.97607421875, 4.886962890625, 5.7978515625, 6.708740234375, 7.61962890625, 8.530517578125, 9.44140625, 10.352294921875, 11.26318359375, 12.174072265625, 13.0849609375, 13.995849609375, 14.90673828125, 15.817626953125, 16.728515625, 17.639404296875, 18.55029296875, 19.461181640625, 20.3720703125, 21.282958984375, 22.19384765625, 23.104736328125, 24.015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 23.0, 12.0, 24.0, 26.0, 50.0, 62.0, 112.0, 132.0, 170.0, 109.0, 53.0, 47.0, 34.0, 18.0, 19.0, 10.0, 9.0, 8.0, 6.0, 6.0, 3.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-17.1875, -16.7354736328125, -16.283447265625, -15.8314208984375, -15.37939453125, -14.9273681640625, -14.475341796875, -14.0233154296875, -13.5712890625, -13.1192626953125, -12.667236328125, -12.2152099609375, -11.76318359375, -11.3111572265625, -10.859130859375, -10.4071044921875, -9.955078125, -9.5030517578125, -9.051025390625, -8.5989990234375, -8.14697265625, -7.6949462890625, -7.242919921875, -6.7908935546875, -6.3388671875, -5.8868408203125, -5.434814453125, -4.9827880859375, -4.53076171875, -4.0787353515625, -3.626708984375, -3.1746826171875, -2.72265625, -2.2706298828125, -1.818603515625, -1.3665771484375, -0.91455078125, -0.4625244140625, -0.010498046875, 0.4415283203125, 0.8935546875, 1.3455810546875, 1.797607421875, 2.2496337890625, 2.70166015625, 3.1536865234375, 3.605712890625, 4.0577392578125, 4.509765625, 4.9617919921875, 5.413818359375, 5.8658447265625, 6.31787109375, 6.7698974609375, 7.221923828125, 7.6739501953125, 8.1259765625, 8.5780029296875, 9.030029296875, 9.4820556640625, 9.93408203125, 10.3861083984375, 10.838134765625, 11.2901611328125, 11.7421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 17.0, 23.0, 57.0, 103.0, 186.0, 237.0, 169.0, 93.0, 50.0, 28.0, 8.0, 8.0, 7.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-252.16075134277344, -243.18038940429688, -234.2000274658203, -225.21966552734375, -216.23928833007812, -207.25894165039062, -198.278564453125, -189.29820251464844, -180.31784057617188, -171.3374786376953, -162.35711669921875, -153.3767547607422, -144.39639282226562, -135.416015625, -126.43565368652344, -117.45529174804688, -108.47492980957031, -99.49456787109375, -90.51420593261719, -81.5338363647461, -72.55347442626953, -63.57311248779297, -54.59274673461914, -45.61238098144531, -36.63201904296875, -27.651655197143555, -18.67129135131836, -9.690927505493164, -0.7105636596679688, 8.269798278808594, 17.250164031982422, 26.23052978515625, 35.210906982421875, 44.19126892089844, 53.171634674072266, 62.152000427246094, 71.13236236572266, 80.11272430419922, 89.09309387207031, 98.07345581054688, 107.05381774902344, 116.0341796875, 125.01454162597656, 133.99490356445312, 142.97528076171875, 151.95562744140625, 160.93600463867188, 169.91636657714844, 178.896728515625, 187.87709045410156, 196.85745239257812, 205.8378143310547, 214.81817626953125, 223.79855346679688, 232.77891540527344, 241.75927734375, 250.73963928222656, 259.7200012207031, 268.70037841796875, 277.68072509765625, 286.6611022949219, 295.6414489746094, 304.621826171875, 313.6021728515625, 322.5825500488281]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 9.0, 11.0, 14.0, 16.0, 19.0, 25.0, 25.0, 32.0, 40.0, 37.0, 31.0, 60.0, 43.0, 47.0, 46.0, 47.0, 53.0, 51.0, 36.0, 53.0, 48.0, 38.0, 49.0, 25.0, 23.0, 20.0, 18.0, 14.0, 12.0, 7.0, 9.0, 5.0, 3.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.3721466064453, -154.73846435546875, -149.10476684570312, -143.4710693359375, -137.83738708496094, -132.20370483398438, -126.57000732421875, -120.93631744384766, -115.30262756347656, -109.66893768310547, -104.03524780273438, -98.40155792236328, -92.76786804199219, -87.1341781616211, -81.50048828125, -75.8667984008789, -70.23310852050781, -64.59941864013672, -58.965728759765625, -53.33203887939453, -47.69834899902344, -42.064659118652344, -36.43096923828125, -30.797279357910156, -25.163589477539062, -19.52989959716797, -13.896209716796875, -8.262519836425781, -2.6288299560546875, 3.0048599243164062, 8.6385498046875, 14.272239685058594, 19.905914306640625, 25.53960418701172, 31.173294067382812, 36.806983947753906, 42.440673828125, 48.074363708496094, 53.70805358886719, 59.34174346923828, 64.97543334960938, 70.60912322998047, 76.24281311035156, 81.87650299072266, 87.51019287109375, 93.14388275146484, 98.77757263183594, 104.41126251220703, 110.04495239257812, 115.67864227294922, 121.31233215332031, 126.9460220336914, 132.5797119140625, 138.21340942382812, 143.8470916748047, 149.48077392578125, 155.11447143554688, 160.7481689453125, 166.38185119628906, 172.01553344726562, 177.64923095703125, 183.28292846679688, 188.91661071777344, 194.55029296875, 200.18399047851562]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 10.0, 8.0, 9.0, 17.0, 25.0, 24.0, 49.0, 67.0, 115.0, 155.0, 348.0, 661.0, 1810.0, 6911.0, 68777.0, 4020236.0, 85158.0, 7161.0, 1674.0, 560.0, 233.0, 110.0, 56.0, 39.0, 19.0, 19.0, 4.0, 12.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-119.75, -116.794921875, -113.83984375, -110.884765625, -107.9296875, -104.974609375, -102.01953125, -99.064453125, -96.109375, -93.154296875, -90.19921875, -87.244140625, -84.2890625, -81.333984375, -78.37890625, -75.423828125, -72.46875, -69.513671875, -66.55859375, -63.603515625, -60.6484375, -57.693359375, -54.73828125, -51.783203125, -48.828125, -45.873046875, -42.91796875, -39.962890625, -37.0078125, -34.052734375, -31.09765625, -28.142578125, -25.1875, -22.232421875, -19.27734375, -16.322265625, -13.3671875, -10.412109375, -7.45703125, -4.501953125, -1.546875, 1.408203125, 4.36328125, 7.318359375, 10.2734375, 13.228515625, 16.18359375, 19.138671875, 22.09375, 25.048828125, 28.00390625, 30.958984375, 33.9140625, 36.869140625, 39.82421875, 42.779296875, 45.734375, 48.689453125, 51.64453125, 54.599609375, 57.5546875, 60.509765625, 63.46484375, 66.419921875, 69.375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 17.0, 30.0, 44.0, 57.0, 71.0, 82.0, 105.0, 103.0, 86.0, 91.0, 84.0, 73.0, 49.0, 27.0, 21.0, 24.0, 8.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.265625, -18.814208984375, -18.36279296875, -17.911376953125, -17.4599609375, -17.008544921875, -16.55712890625, -16.105712890625, -15.654296875, -15.202880859375, -14.75146484375, -14.300048828125, -13.8486328125, -13.397216796875, -12.94580078125, -12.494384765625, -12.04296875, -11.591552734375, -11.14013671875, -10.688720703125, -10.2373046875, -9.785888671875, -9.33447265625, -8.883056640625, -8.431640625, -7.980224609375, -7.52880859375, -7.077392578125, -6.6259765625, -6.174560546875, -5.72314453125, -5.271728515625, -4.8203125, -4.368896484375, -3.91748046875, -3.466064453125, -3.0146484375, -2.563232421875, -2.11181640625, -1.660400390625, -1.208984375, -0.757568359375, -0.30615234375, 0.145263671875, 0.5966796875, 1.048095703125, 1.49951171875, 1.950927734375, 2.40234375, 2.853759765625, 3.30517578125, 3.756591796875, 4.2080078125, 4.659423828125, 5.11083984375, 5.562255859375, 6.013671875, 6.465087890625, 6.91650390625, 7.367919921875, 7.8193359375, 8.270751953125, 8.72216796875, 9.173583984375, 9.625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 7.0, 33.0, 59.0, 128.0, 419.0, 4134422.0, 58559.0, 329.0, 136.0, 91.0, 44.0, 27.0, 15.0, 10.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-383.25, -361.86328125, -340.4765625, -319.08984375, -297.703125, -276.31640625, -254.9296875, -233.54296875, -212.15625, -190.76953125, -169.3828125, -147.99609375, -126.609375, -105.22265625, -83.8359375, -62.44921875, -41.0625, -19.67578125, 1.7109375, 23.09765625, 44.484375, 65.87109375, 87.2578125, 108.64453125, 130.03125, 151.41796875, 172.8046875, 194.19140625, 215.578125, 236.96484375, 258.3515625, 279.73828125, 301.125, 322.51171875, 343.8984375, 365.28515625, 386.671875, 408.05859375, 429.4453125, 450.83203125, 472.21875, 493.60546875, 514.9921875, 536.37890625, 557.765625, 579.15234375, 600.5390625, 621.92578125, 643.3125, 664.69921875, 686.0859375, 707.47265625, 728.859375, 750.24609375, 771.6328125, 793.01953125, 814.40625, 835.79296875, 857.1796875, 878.56640625, 899.953125, 921.33984375, 942.7265625, 964.11328125, 985.5]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 53.0, 3471.0, 526.0, 28.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0625, -51.9677734375, -48.873046875, -45.7783203125, -42.68359375, -39.5888671875, -36.494140625, -33.3994140625, -30.3046875, -27.2099609375, -24.115234375, -21.0205078125, -17.92578125, -14.8310546875, -11.736328125, -8.6416015625, -5.546875, -2.4521484375, 0.642578125, 3.7373046875, 6.83203125, 9.9267578125, 13.021484375, 16.1162109375, 19.2109375, 22.3056640625, 25.400390625, 28.4951171875, 31.58984375, 34.6845703125, 37.779296875, 40.8740234375, 43.96875, 47.0634765625, 50.158203125, 53.2529296875, 56.34765625, 59.4423828125, 62.537109375, 65.6318359375, 68.7265625, 71.8212890625, 74.916015625, 78.0107421875, 81.10546875, 84.2001953125, 87.294921875, 90.3896484375, 93.484375, 96.5791015625, 99.673828125, 102.7685546875, 105.86328125, 108.9580078125, 112.052734375, 115.1474609375, 118.2421875, 121.3369140625, 124.431640625, 127.5263671875, 130.62109375, 133.7158203125, 136.810546875, 139.9052734375, 143.0]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 15.0, 138.0, 728.0, 109.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.47955322265625, -250.212890625, -234.94622802734375, -219.6795654296875, -204.41290283203125, -189.146240234375, -173.87957763671875, -158.6129150390625, -143.34625244140625, -128.07958984375, -112.81292724609375, -97.5462646484375, -82.27960205078125, -67.012939453125, -51.74627685546875, -36.4796142578125, -21.21295166015625, -5.9462890625, 9.32037353515625, 24.5870361328125, 39.85369873046875, 55.120361328125, 70.38702392578125, 85.6536865234375, 100.92034912109375, 116.18701171875, 131.45367431640625, 146.7203369140625, 161.98699951171875, 177.253662109375, 192.52032470703125, 207.7869873046875, 223.05364990234375, 238.3203125, 253.58697509765625, 268.8536376953125, 284.12030029296875, 299.386962890625, 314.65362548828125, 329.9202880859375, 345.18695068359375, 360.45361328125, 375.72027587890625, 390.9869384765625, 406.25360107421875, 421.520263671875, 436.78692626953125, 452.0535888671875, 467.32025146484375, 482.5869140625, 497.85357666015625, 513.1202392578125, 528.3869018554688, 543.653564453125, 558.9202270507812, 574.1868896484375, 589.4535522460938, 604.72021484375, 619.9868774414062, 635.2535400390625, 650.5202026367188, 665.786865234375, 681.0535278320312, 696.3201904296875, 711.5868530273438]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 13.0, 44.0, 60.0, 98.0, 155.0, 189.0, 160.0, 118.0, 80.0, 40.0, 26.0, 14.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.9304962158203, -209.77468872070312, -203.61888122558594, -197.46307373046875, -191.3072509765625, -185.1514434814453, -178.99563598632812, -172.83982849121094, -166.68402099609375, -160.52821350097656, -154.37240600585938, -148.2165985107422, -142.060791015625, -135.90496826171875, -129.74916076660156, -123.59335327148438, -117.43754577636719, -111.28173828125, -105.12593078613281, -98.9701156616211, -92.8143081665039, -86.65850067138672, -80.502685546875, -74.34687805175781, -68.19107055664062, -62.03526306152344, -55.879451751708984, -49.72364044189453, -43.567832946777344, -37.412025451660156, -31.256214141845703, -25.10040283203125, -18.944580078125, -12.78877067565918, -6.632961273193359, -0.47715187072753906, 5.678657531738281, 11.834466934204102, 17.990276336669922, 24.146087646484375, 30.301895141601562, 36.45770263671875, 42.6135139465332, 48.769325256347656, 54.925132751464844, 61.08094024658203, 67.23675537109375, 73.39256286621094, 79.54837036132812, 85.70417785644531, 91.8599853515625, 98.01580047607422, 104.1716079711914, 110.3274154663086, 116.48323059082031, 122.6390380859375, 128.7948455810547, 134.95065307617188, 141.10646057128906, 147.26226806640625, 153.4180908203125, 159.5738983154297, 165.72970581054688, 171.88551330566406, 178.04132080078125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 7.0, 12.0, 23.0, 18.0, 34.0, 47.0, 66.0, 92.0, 159.0, 324.0, 652.0, 2076.0, 8780.0, 64073.0, 569433.0, 358303.0, 36051.0, 5675.0, 1498.0, 553.0, 236.0, 123.0, 81.0, 72.0, 35.0, 33.0, 21.0, 15.0, 8.0, 10.0, 7.0, 4.0, 3.0, 2.0, 10.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-55.625, -53.62890625, -51.6328125, -49.63671875, -47.640625, -45.64453125, -43.6484375, -41.65234375, -39.65625, -37.66015625, -35.6640625, -33.66796875, -31.671875, -29.67578125, -27.6796875, -25.68359375, -23.6875, -21.69140625, -19.6953125, -17.69921875, -15.703125, -13.70703125, -11.7109375, -9.71484375, -7.71875, -5.72265625, -3.7265625, -1.73046875, 0.265625, 2.26171875, 4.2578125, 6.25390625, 8.25, 10.24609375, 12.2421875, 14.23828125, 16.234375, 18.23046875, 20.2265625, 22.22265625, 24.21875, 26.21484375, 28.2109375, 30.20703125, 32.203125, 34.19921875, 36.1953125, 38.19140625, 40.1875, 42.18359375, 44.1796875, 46.17578125, 48.171875, 50.16796875, 52.1640625, 54.16015625, 56.15625, 58.15234375, 60.1484375, 62.14453125, 64.140625, 66.13671875, 68.1328125, 70.12890625, 72.125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 8.0, 21.0, 24.0, 26.0, 41.0, 47.0, 54.0, 76.0, 74.0, 80.0, 93.0, 67.0, 67.0, 67.0, 69.0, 46.0, 33.0, 33.0, 21.0, 18.0, 13.0, 9.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.1796875, -13.84527587890625, -13.5108642578125, -13.17645263671875, -12.842041015625, -12.50762939453125, -12.1732177734375, -11.83880615234375, -11.50439453125, -11.16998291015625, -10.8355712890625, -10.50115966796875, -10.166748046875, -9.83233642578125, -9.4979248046875, -9.16351318359375, -8.8291015625, -8.49468994140625, -8.1602783203125, -7.82586669921875, -7.491455078125, -7.15704345703125, -6.8226318359375, -6.48822021484375, -6.15380859375, -5.81939697265625, -5.4849853515625, -5.15057373046875, -4.816162109375, -4.48175048828125, -4.1473388671875, -3.81292724609375, -3.478515625, -3.14410400390625, -2.8096923828125, -2.47528076171875, -2.140869140625, -1.80645751953125, -1.4720458984375, -1.13763427734375, -0.80322265625, -0.46881103515625, -0.1343994140625, 0.20001220703125, 0.534423828125, 0.86883544921875, 1.2032470703125, 1.53765869140625, 1.8720703125, 2.20648193359375, 2.5408935546875, 2.87530517578125, 3.209716796875, 3.54412841796875, 3.8785400390625, 4.21295166015625, 4.54736328125, 4.88177490234375, 5.2161865234375, 5.55059814453125, 5.885009765625, 6.21942138671875, 6.5538330078125, 6.88824462890625, 7.22265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 8.0, 13.0, 11.0, 16.0, 23.0, 36.0, 52.0, 81.0, 147.0, 286.0, 595.0, 1469.0, 4847.0, 27617.0, 340015.0, 607341.0, 54792.0, 7572.0, 2061.0, 748.0, 355.0, 172.0, 101.0, 55.0, 45.0, 30.0, 13.0, 13.0, 6.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.125, -69.1015625, -67.078125, -65.0546875, -63.03125, -61.0078125, -58.984375, -56.9609375, -54.9375, -52.9140625, -50.890625, -48.8671875, -46.84375, -44.8203125, -42.796875, -40.7734375, -38.75, -36.7265625, -34.703125, -32.6796875, -30.65625, -28.6328125, -26.609375, -24.5859375, -22.5625, -20.5390625, -18.515625, -16.4921875, -14.46875, -12.4453125, -10.421875, -8.3984375, -6.375, -4.3515625, -2.328125, -0.3046875, 1.71875, 3.7421875, 5.765625, 7.7890625, 9.8125, 11.8359375, 13.859375, 15.8828125, 17.90625, 19.9296875, 21.953125, 23.9765625, 26.0, 28.0234375, 30.046875, 32.0703125, 34.09375, 36.1171875, 38.140625, 40.1640625, 42.1875, 44.2109375, 46.234375, 48.2578125, 50.28125, 52.3046875, 54.328125, 56.3515625, 58.375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 15.0, 7.0, 8.0, 8.0, 12.0, 26.0, 30.0, 25.0, 32.0, 43.0, 52.0, 60.0, 54.0, 37.0, 60.0, 73.0, 56.0, 58.0, 58.0, 56.0, 42.0, 43.0, 24.0, 28.0, 23.0, 16.0, 13.0, 9.0, 4.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.4375, -43.201171875, -41.96484375, -40.728515625, -39.4921875, -38.255859375, -37.01953125, -35.783203125, -34.546875, -33.310546875, -32.07421875, -30.837890625, -29.6015625, -28.365234375, -27.12890625, -25.892578125, -24.65625, -23.419921875, -22.18359375, -20.947265625, -19.7109375, -18.474609375, -17.23828125, -16.001953125, -14.765625, -13.529296875, -12.29296875, -11.056640625, -9.8203125, -8.583984375, -7.34765625, -6.111328125, -4.875, -3.638671875, -2.40234375, -1.166015625, 0.0703125, 1.306640625, 2.54296875, 3.779296875, 5.015625, 6.251953125, 7.48828125, 8.724609375, 9.9609375, 11.197265625, 12.43359375, 13.669921875, 14.90625, 16.142578125, 17.37890625, 18.615234375, 19.8515625, 21.087890625, 22.32421875, 23.560546875, 24.796875, 26.033203125, 27.26953125, 28.505859375, 29.7421875, 30.978515625, 32.21484375, 33.451171875, 34.6875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 8.0, 10.0, 11.0, 27.0, 76.0, 143.0, 325.0, 1038.0, 4930.0, 78617.0, 924982.0, 33880.0, 3143.0, 839.0, 282.0, 120.0, 49.0, 26.0, 13.0, 8.0, 6.0, 10.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.40625, -41.0107421875, -39.615234375, -38.2197265625, -36.82421875, -35.4287109375, -34.033203125, -32.6376953125, -31.2421875, -29.8466796875, -28.451171875, -27.0556640625, -25.66015625, -24.2646484375, -22.869140625, -21.4736328125, -20.078125, -18.6826171875, -17.287109375, -15.8916015625, -14.49609375, -13.1005859375, -11.705078125, -10.3095703125, -8.9140625, -7.5185546875, -6.123046875, -4.7275390625, -3.33203125, -1.9365234375, -0.541015625, 0.8544921875, 2.25, 3.6455078125, 5.041015625, 6.4365234375, 7.83203125, 9.2275390625, 10.623046875, 12.0185546875, 13.4140625, 14.8095703125, 16.205078125, 17.6005859375, 18.99609375, 20.3916015625, 21.787109375, 23.1826171875, 24.578125, 25.9736328125, 27.369140625, 28.7646484375, 30.16015625, 31.5556640625, 32.951171875, 34.3466796875, 35.7421875, 37.1376953125, 38.533203125, 39.9287109375, 41.32421875, 42.7197265625, 44.115234375, 45.5107421875, 46.90625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 6.0, 6.0, 11.0, 12.0, 6.0, 16.0, 15.0, 33.0, 47.0, 58.0, 82.0, 94.0, 96.0, 113.0, 129.0, 75.0, 69.0, 40.0, 29.0, 19.0, 19.0, 12.0, 4.0, 4.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0024318695068359375, -0.00234830379486084, -0.002264738082885742, -0.0021811723709106445, -0.002097606658935547, -0.0020140409469604492, -0.0019304752349853516, -0.001846909523010254, -0.0017633438110351562, -0.0016797780990600586, -0.001596212387084961, -0.0015126466751098633, -0.0014290809631347656, -0.001345515251159668, -0.0012619495391845703, -0.0011783838272094727, -0.001094818115234375, -0.0010112524032592773, -0.0009276866912841797, -0.000844120979309082, -0.0007605552673339844, -0.0006769895553588867, -0.0005934238433837891, -0.0005098581314086914, -0.00042629241943359375, -0.0003427267074584961, -0.00025916099548339844, -0.00017559528350830078, -9.202957153320312e-05, -8.463859558105469e-06, 7.510185241699219e-05, 0.00015866756439208984, 0.0002422332763671875, 0.00032579898834228516, 0.0004093647003173828, 0.0004929304122924805, 0.0005764961242675781, 0.0006600618362426758, 0.0007436275482177734, 0.0008271932601928711, 0.0009107589721679688, 0.0009943246841430664, 0.001077890396118164, 0.0011614561080932617, 0.0012450218200683594, 0.001328587532043457, 0.0014121532440185547, 0.0014957189559936523, 0.00157928466796875, 0.0016628503799438477, 0.0017464160919189453, 0.001829981803894043, 0.0019135475158691406, 0.0019971132278442383, 0.002080678939819336, 0.0021642446517944336, 0.0022478103637695312, 0.002331376075744629, 0.0024149417877197266, 0.0024985074996948242, 0.002582073211669922, 0.0026656389236450195, 0.002749204635620117, 0.002832770347595215, 0.0029163360595703125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 8.0, 11.0, 21.0, 32.0, 52.0, 75.0, 132.0, 262.0, 563.0, 1363.0, 4291.0, 23156.0, 330831.0, 636208.0, 41901.0, 6439.0, 1838.0, 648.0, 314.0, 149.0, 100.0, 47.0, 41.0, 18.0, 14.0, 11.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.796875, -16.07080078125, -15.3447265625, -14.61865234375, -13.892578125, -13.16650390625, -12.4404296875, -11.71435546875, -10.98828125, -10.26220703125, -9.5361328125, -8.81005859375, -8.083984375, -7.35791015625, -6.6318359375, -5.90576171875, -5.1796875, -4.45361328125, -3.7275390625, -3.00146484375, -2.275390625, -1.54931640625, -0.8232421875, -0.09716796875, 0.62890625, 1.35498046875, 2.0810546875, 2.80712890625, 3.533203125, 4.25927734375, 4.9853515625, 5.71142578125, 6.4375, 7.16357421875, 7.8896484375, 8.61572265625, 9.341796875, 10.06787109375, 10.7939453125, 11.52001953125, 12.24609375, 12.97216796875, 13.6982421875, 14.42431640625, 15.150390625, 15.87646484375, 16.6025390625, 17.32861328125, 18.0546875, 18.78076171875, 19.5068359375, 20.23291015625, 20.958984375, 21.68505859375, 22.4111328125, 23.13720703125, 23.86328125, 24.58935546875, 25.3154296875, 26.04150390625, 26.767578125, 27.49365234375, 28.2197265625, 28.94580078125, 29.671875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 4.0, 3.0, 13.0, 18.0, 16.0, 25.0, 33.0, 41.0, 50.0, 64.0, 93.0, 117.0, 112.0, 106.0, 79.0, 59.0, 34.0, 37.0, 22.0, 21.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.008056640625, -11.59423828125, -11.180419921875, -10.7666015625, -10.352783203125, -9.93896484375, -9.525146484375, -9.111328125, -8.697509765625, -8.28369140625, -7.869873046875, -7.4560546875, -7.042236328125, -6.62841796875, -6.214599609375, -5.80078125, -5.386962890625, -4.97314453125, -4.559326171875, -4.1455078125, -3.731689453125, -3.31787109375, -2.904052734375, -2.490234375, -2.076416015625, -1.66259765625, -1.248779296875, -0.8349609375, -0.421142578125, -0.00732421875, 0.406494140625, 0.8203125, 1.234130859375, 1.64794921875, 2.061767578125, 2.4755859375, 2.889404296875, 3.30322265625, 3.717041015625, 4.130859375, 4.544677734375, 4.95849609375, 5.372314453125, 5.7861328125, 6.199951171875, 6.61376953125, 7.027587890625, 7.44140625, 7.855224609375, 8.26904296875, 8.682861328125, 9.0966796875, 9.510498046875, 9.92431640625, 10.338134765625, 10.751953125, 11.165771484375, 11.57958984375, 11.993408203125, 12.4072265625, 12.821044921875, 13.23486328125, 13.648681640625, 14.0625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 18.0, 41.0, 64.0, 131.0, 203.0, 222.0, 165.0, 60.0, 44.0, 23.0, 17.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.44464111328125, -415.1192626953125, -404.7939147949219, -394.46856689453125, -384.1431884765625, -373.81781005859375, -363.4924621582031, -353.1671142578125, -342.84173583984375, -332.516357421875, -322.1910095214844, -311.86566162109375, -301.540283203125, -291.21490478515625, -280.8895568847656, -270.564208984375, -260.23883056640625, -249.91346740722656, -239.58810424804688, -229.2627410888672, -218.9373779296875, -208.6120147705078, -198.28665161132812, -187.96128845214844, -177.63592529296875, -167.31056213378906, -156.98519897460938, -146.6598358154297, -136.33447265625, -126.00910949707031, -115.68374633789062, -105.35838317871094, -95.03298950195312, -84.70762634277344, -74.38226318359375, -64.05690002441406, -53.731536865234375, -43.40617370605469, -33.080810546875, -22.755447387695312, -12.430084228515625, -2.1047210693359375, 8.22064208984375, 18.546005249023438, 28.871368408203125, 39.19673156738281, 49.5220947265625, 59.84745788574219, 70.17282104492188, 80.49818420410156, 90.82354736328125, 101.14891052246094, 111.47427368164062, 121.79963684082031, 132.125, 142.4503631591797, 152.77572631835938, 163.10108947753906, 173.42645263671875, 183.75181579589844, 194.07717895507812, 204.4025421142578, 214.7279052734375, 225.0532684326172, 235.37863159179688]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 5.0, 2.0, 6.0, 4.0, 4.0, 9.0, 10.0, 13.0, 12.0, 15.0, 30.0, 21.0, 27.0, 28.0, 23.0, 25.0, 27.0, 43.0, 49.0, 38.0, 50.0, 57.0, 38.0, 62.0, 36.0, 57.0, 49.0, 44.0, 34.0, 21.0, 24.0, 25.0, 32.0, 13.0, 17.0, 8.0, 12.0, 9.0, 10.0, 10.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.65798950195312, -137.15762329101562, -131.65724182128906, -126.15687561035156, -120.65650177001953, -115.1561279296875, -109.65576171875, -104.15538787841797, -98.65501403808594, -93.1546401977539, -87.6542739868164, -82.15390014648438, -76.65352630615234, -71.15315246582031, -65.65278625488281, -60.15241241455078, -54.65204620361328, -49.151676177978516, -43.651302337646484, -38.15093231201172, -32.65055847167969, -27.150188446044922, -21.649818420410156, -16.149444580078125, -10.64907455444336, -5.148703098297119, 0.3516683578491211, 5.852039337158203, 11.352411270141602, 16.852783203125, 22.353153228759766, 27.853527069091797, 33.35389709472656, 38.85426712036133, 44.35464096069336, 49.855010986328125, 55.355384826660156, 60.85575485229492, 66.35612487792969, 71.85649871826172, 77.35687255859375, 82.85724639892578, 88.35761260986328, 93.85798645019531, 99.35836029052734, 104.85873413085938, 110.35910034179688, 115.8594741821289, 121.3598403930664, 126.86021423339844, 132.36058044433594, 137.8609619140625, 143.361328125, 148.8616943359375, 154.362060546875, 159.86244201660156, 165.36280822753906, 170.86317443847656, 176.36355590820312, 181.86392211914062, 187.36428833007812, 192.8646697998047, 198.3650360107422, 203.86541748046875, 209.36578369140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 4.0, 15.0, 10.0, 18.0, 23.0, 33.0, 64.0, 116.0, 197.0, 378.0, 788.0, 2078.0, 7279.0, 54288.0, 3872977.0, 236690.0, 14692.0, 2997.0, 902.0, 384.0, 171.0, 77.0, 43.0, 16.0, 15.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-139.125, -136.01318359375, -132.9013671875, -129.78955078125, -126.677734375, -123.56591796875, -120.4541015625, -117.34228515625, -114.23046875, -111.11865234375, -108.0068359375, -104.89501953125, -101.783203125, -98.67138671875, -95.5595703125, -92.44775390625, -89.3359375, -86.22412109375, -83.1123046875, -80.00048828125, -76.888671875, -73.77685546875, -70.6650390625, -67.55322265625, -64.44140625, -61.32958984375, -58.2177734375, -55.10595703125, -51.994140625, -48.88232421875, -45.7705078125, -42.65869140625, -39.546875, -36.43505859375, -33.3232421875, -30.21142578125, -27.099609375, -23.98779296875, -20.8759765625, -17.76416015625, -14.65234375, -11.54052734375, -8.4287109375, -5.31689453125, -2.205078125, 0.90673828125, 4.0185546875, 7.13037109375, 10.2421875, 13.35400390625, 16.4658203125, 19.57763671875, 22.689453125, 25.80126953125, 28.9130859375, 32.02490234375, 35.13671875, 38.24853515625, 41.3603515625, 44.47216796875, 47.583984375, 50.69580078125, 53.8076171875, 56.91943359375, 60.03125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 11.0, 22.0, 36.0, 36.0, 44.0, 50.0, 59.0, 71.0, 81.0, 92.0, 99.0, 77.0, 71.0, 53.0, 40.0, 46.0, 32.0, 28.0, 19.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0078125, -13.6541748046875, -13.300537109375, -12.9468994140625, -12.59326171875, -12.2396240234375, -11.885986328125, -11.5323486328125, -11.1787109375, -10.8250732421875, -10.471435546875, -10.1177978515625, -9.76416015625, -9.4105224609375, -9.056884765625, -8.7032470703125, -8.349609375, -7.9959716796875, -7.642333984375, -7.2886962890625, -6.93505859375, -6.5814208984375, -6.227783203125, -5.8741455078125, -5.5205078125, -5.1668701171875, -4.813232421875, -4.4595947265625, -4.10595703125, -3.7523193359375, -3.398681640625, -3.0450439453125, -2.69140625, -2.3377685546875, -1.984130859375, -1.6304931640625, -1.27685546875, -0.9232177734375, -0.569580078125, -0.2159423828125, 0.1376953125, 0.4913330078125, 0.844970703125, 1.1986083984375, 1.55224609375, 1.9058837890625, 2.259521484375, 2.6131591796875, 2.966796875, 3.3204345703125, 3.674072265625, 4.0277099609375, 4.38134765625, 4.7349853515625, 5.088623046875, 5.4422607421875, 5.7958984375, 6.1495361328125, 6.503173828125, 6.8568115234375, 7.21044921875, 7.5640869140625, 7.917724609375, 8.2713623046875, 8.625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 14.0, 23.0, 40.0, 54.0, 100.0, 201.0, 445.0, 1573.0, 7505.0, 215397.0, 3945644.0, 18669.0, 3218.0, 810.0, 276.0, 114.0, 79.0, 38.0, 30.0, 15.0, 7.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-181.25, -176.7412109375, -172.232421875, -167.7236328125, -163.21484375, -158.7060546875, -154.197265625, -149.6884765625, -145.1796875, -140.6708984375, -136.162109375, -131.6533203125, -127.14453125, -122.6357421875, -118.126953125, -113.6181640625, -109.109375, -104.6005859375, -100.091796875, -95.5830078125, -91.07421875, -86.5654296875, -82.056640625, -77.5478515625, -73.0390625, -68.5302734375, -64.021484375, -59.5126953125, -55.00390625, -50.4951171875, -45.986328125, -41.4775390625, -36.96875, -32.4599609375, -27.951171875, -23.4423828125, -18.93359375, -14.4248046875, -9.916015625, -5.4072265625, -0.8984375, 3.6103515625, 8.119140625, 12.6279296875, 17.13671875, 21.6455078125, 26.154296875, 30.6630859375, 35.171875, 39.6806640625, 44.189453125, 48.6982421875, 53.20703125, 57.7158203125, 62.224609375, 66.7333984375, 71.2421875, 75.7509765625, 80.259765625, 84.7685546875, 89.27734375, 93.7861328125, 98.294921875, 102.8037109375, 107.3125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 0.0, 3.0, 4.0, 10.0, 17.0, 18.0, 53.0, 92.0, 253.0, 738.0, 1965.0, 541.0, 194.0, 65.0, 41.0, 25.0, 10.0, 6.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-33.03125, -32.124267578125, -31.21728515625, -30.310302734375, -29.4033203125, -28.496337890625, -27.58935546875, -26.682373046875, -25.775390625, -24.868408203125, -23.96142578125, -23.054443359375, -22.1474609375, -21.240478515625, -20.33349609375, -19.426513671875, -18.51953125, -17.612548828125, -16.70556640625, -15.798583984375, -14.8916015625, -13.984619140625, -13.07763671875, -12.170654296875, -11.263671875, -10.356689453125, -9.44970703125, -8.542724609375, -7.6357421875, -6.728759765625, -5.82177734375, -4.914794921875, -4.0078125, -3.100830078125, -2.19384765625, -1.286865234375, -0.3798828125, 0.527099609375, 1.43408203125, 2.341064453125, 3.248046875, 4.155029296875, 5.06201171875, 5.968994140625, 6.8759765625, 7.782958984375, 8.68994140625, 9.596923828125, 10.50390625, 11.410888671875, 12.31787109375, 13.224853515625, 14.1318359375, 15.038818359375, 15.94580078125, 16.852783203125, 17.759765625, 18.666748046875, 19.57373046875, 20.480712890625, 21.3876953125, 22.294677734375, 23.20166015625, 24.108642578125, 25.015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 14.0, 50.0, 235.0, 436.0, 193.0, 54.0, 12.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-453.08721923828125, -441.3263244628906, -429.5654296875, -417.8045349121094, -406.04364013671875, -394.2827453613281, -382.5218505859375, -370.760986328125, -359.00006103515625, -347.2391662597656, -335.478271484375, -323.7173767089844, -311.95648193359375, -300.1955871582031, -288.4346923828125, -276.673828125, -264.9129333496094, -253.15203857421875, -241.39114379882812, -229.6302490234375, -217.86935424804688, -206.10845947265625, -194.3475799560547, -182.58668518066406, -170.82579040527344, -159.0648956298828, -147.3040008544922, -135.54312133789062, -123.78221893310547, -112.02132415771484, -100.26043701171875, -88.49954223632812, -76.7386474609375, -64.97775268554688, -53.216861724853516, -41.455970764160156, -29.69507598876953, -17.934181213378906, -6.1732940673828125, 5.5876007080078125, 17.348495483398438, 29.10938835144043, 40.87028121948242, 52.63117218017578, 64.3920669555664, 76.15296173095703, 87.91384887695312, 99.67474365234375, 111.43563842773438, 123.196533203125, 134.95742797851562, 146.71832275390625, 158.47921752929688, 170.2401123046875, 182.00099182128906, 193.7618865966797, 205.5227813720703, 217.28367614746094, 229.04457092285156, 240.80545043945312, 252.56634521484375, 264.3272399902344, 276.088134765625, 287.8490295410156, 299.60992431640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 9.0, 7.0, 10.0, 14.0, 26.0, 35.0, 40.0, 53.0, 72.0, 72.0, 72.0, 88.0, 96.0, 91.0, 88.0, 58.0, 47.0, 43.0, 21.0, 21.0, 23.0, 14.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-144.97024536132812, -141.11656188964844, -137.26287841796875, -133.40919494628906, -129.55551147460938, -125.70182800292969, -121.84814453125, -117.99446105957031, -114.14077758789062, -110.28709411621094, -106.43341064453125, -102.57972717285156, -98.72604370117188, -94.87236022949219, -91.0186767578125, -87.16499328613281, -83.3113021850586, -79.4576187133789, -75.60393524169922, -71.75025177001953, -67.89656829833984, -64.04288482666016, -60.1891975402832, -56.335514068603516, -52.48183059692383, -48.62814712524414, -44.77446365356445, -40.9207763671875, -37.06709289550781, -33.213409423828125, -29.359725952148438, -25.50604248046875, -21.652359008789062, -17.798675537109375, -13.944991111755371, -10.091306686401367, -6.23762321472168, -2.383939743041992, 1.4697456359863281, 5.323429107666016, 9.177112579345703, 13.03079605102539, 16.884479522705078, 20.7381649017334, 24.591848373413086, 28.445531845092773, 32.299217224121094, 36.15290069580078, 40.00658416748047, 43.860267639160156, 47.713951110839844, 51.56763458251953, 55.42131805419922, 59.275001525878906, 63.12868881225586, 66.98237609863281, 70.8360595703125, 74.68974304199219, 78.54342651367188, 82.39710998535156, 86.25079345703125, 90.10447692871094, 93.95816040039062, 97.81184387207031, 101.66552734375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 5.0, 5.0, 10.0, 12.0, 7.0, 14.0, 12.0, 14.0, 22.0, 26.0, 24.0, 39.0, 65.0, 98.0, 109.0, 180.0, 292.0, 550.0, 1114.0, 2807.0, 8787.0, 33193.0, 158443.0, 545447.0, 232772.0, 46148.0, 11570.0, 3596.0, 1472.0, 660.0, 376.0, 198.0, 128.0, 91.0, 63.0, 45.0, 37.0, 30.0, 20.0, 21.0, 11.0, 12.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0], "bins": [-53.28125, -51.86474609375, -50.4482421875, -49.03173828125, -47.615234375, -46.19873046875, -44.7822265625, -43.36572265625, -41.94921875, -40.53271484375, -39.1162109375, -37.69970703125, -36.283203125, -34.86669921875, -33.4501953125, -32.03369140625, -30.6171875, -29.20068359375, -27.7841796875, -26.36767578125, -24.951171875, -23.53466796875, -22.1181640625, -20.70166015625, -19.28515625, -17.86865234375, -16.4521484375, -15.03564453125, -13.619140625, -12.20263671875, -10.7861328125, -9.36962890625, -7.953125, -6.53662109375, -5.1201171875, -3.70361328125, -2.287109375, -0.87060546875, 0.5458984375, 1.96240234375, 3.37890625, 4.79541015625, 6.2119140625, 7.62841796875, 9.044921875, 10.46142578125, 11.8779296875, 13.29443359375, 14.7109375, 16.12744140625, 17.5439453125, 18.96044921875, 20.376953125, 21.79345703125, 23.2099609375, 24.62646484375, 26.04296875, 27.45947265625, 28.8759765625, 30.29248046875, 31.708984375, 33.12548828125, 34.5419921875, 35.95849609375, 37.375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 17.0, 29.0, 33.0, 51.0, 49.0, 68.0, 69.0, 76.0, 100.0, 107.0, 91.0, 58.0, 59.0, 41.0, 38.0, 40.0, 16.0, 19.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.71875, -14.36566162109375, -14.0125732421875, -13.65948486328125, -13.306396484375, -12.95330810546875, -12.6002197265625, -12.24713134765625, -11.89404296875, -11.54095458984375, -11.1878662109375, -10.83477783203125, -10.481689453125, -10.12860107421875, -9.7755126953125, -9.42242431640625, -9.0693359375, -8.71624755859375, -8.3631591796875, -8.01007080078125, -7.656982421875, -7.30389404296875, -6.9508056640625, -6.59771728515625, -6.24462890625, -5.89154052734375, -5.5384521484375, -5.18536376953125, -4.832275390625, -4.47918701171875, -4.1260986328125, -3.77301025390625, -3.419921875, -3.06683349609375, -2.7137451171875, -2.36065673828125, -2.007568359375, -1.65447998046875, -1.3013916015625, -0.94830322265625, -0.59521484375, -0.24212646484375, 0.1109619140625, 0.46405029296875, 0.817138671875, 1.17022705078125, 1.5233154296875, 1.87640380859375, 2.2294921875, 2.58258056640625, 2.9356689453125, 3.28875732421875, 3.641845703125, 3.99493408203125, 4.3480224609375, 4.70111083984375, 5.05419921875, 5.40728759765625, 5.7603759765625, 6.11346435546875, 6.466552734375, 6.81964111328125, 7.1727294921875, 7.52581787109375, 7.87890625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 7.0, 12.0, 20.0, 25.0, 39.0, 42.0, 60.0, 87.0, 125.0, 176.0, 275.0, 468.0, 686.0, 1313.0, 2428.0, 5305.0, 12590.0, 35009.0, 105338.0, 292615.0, 361879.0, 149992.0, 48950.0, 17252.0, 6832.0, 3085.0, 1495.0, 901.0, 486.0, 349.0, 172.0, 153.0, 93.0, 77.0, 53.0, 42.0, 30.0, 15.0, 22.0, 9.0, 10.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.046875, -24.21630859375, -23.3857421875, -22.55517578125, -21.724609375, -20.89404296875, -20.0634765625, -19.23291015625, -18.40234375, -17.57177734375, -16.7412109375, -15.91064453125, -15.080078125, -14.24951171875, -13.4189453125, -12.58837890625, -11.7578125, -10.92724609375, -10.0966796875, -9.26611328125, -8.435546875, -7.60498046875, -6.7744140625, -5.94384765625, -5.11328125, -4.28271484375, -3.4521484375, -2.62158203125, -1.791015625, -0.96044921875, -0.1298828125, 0.70068359375, 1.53125, 2.36181640625, 3.1923828125, 4.02294921875, 4.853515625, 5.68408203125, 6.5146484375, 7.34521484375, 8.17578125, 9.00634765625, 9.8369140625, 10.66748046875, 11.498046875, 12.32861328125, 13.1591796875, 13.98974609375, 14.8203125, 15.65087890625, 16.4814453125, 17.31201171875, 18.142578125, 18.97314453125, 19.8037109375, 20.63427734375, 21.46484375, 22.29541015625, 23.1259765625, 23.95654296875, 24.787109375, 25.61767578125, 26.4482421875, 27.27880859375, 28.109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 5.0, 7.0, 7.0, 13.0, 21.0, 26.0, 21.0, 20.0, 19.0, 41.0, 40.0, 55.0, 49.0, 58.0, 46.0, 42.0, 43.0, 69.0, 50.0, 47.0, 51.0, 38.0, 36.0, 38.0, 36.0, 22.0, 18.0, 16.0, 18.0, 10.0, 8.0, 7.0, 2.0, 9.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-38.875, -37.891357421875, -36.90771484375, -35.924072265625, -34.9404296875, -33.956787109375, -32.97314453125, -31.989501953125, -31.005859375, -30.022216796875, -29.03857421875, -28.054931640625, -27.0712890625, -26.087646484375, -25.10400390625, -24.120361328125, -23.13671875, -22.153076171875, -21.16943359375, -20.185791015625, -19.2021484375, -18.218505859375, -17.23486328125, -16.251220703125, -15.267578125, -14.283935546875, -13.30029296875, -12.316650390625, -11.3330078125, -10.349365234375, -9.36572265625, -8.382080078125, -7.3984375, -6.414794921875, -5.43115234375, -4.447509765625, -3.4638671875, -2.480224609375, -1.49658203125, -0.512939453125, 0.470703125, 1.454345703125, 2.43798828125, 3.421630859375, 4.4052734375, 5.388916015625, 6.37255859375, 7.356201171875, 8.33984375, 9.323486328125, 10.30712890625, 11.290771484375, 12.2744140625, 13.258056640625, 14.24169921875, 15.225341796875, 16.208984375, 17.192626953125, 18.17626953125, 19.159912109375, 20.1435546875, 21.127197265625, 22.11083984375, 23.094482421875, 24.078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 8.0, 14.0, 21.0, 28.0, 35.0, 57.0, 76.0, 159.0, 330.0, 803.0, 2072.0, 6084.0, 29105.0, 750595.0, 238146.0, 14418.0, 3980.0, 1438.0, 569.0, 252.0, 142.0, 68.0, 55.0, 19.0, 16.0, 20.0, 8.0, 7.0, 3.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.15087890625, -29.8955078125, -28.64013671875, -27.384765625, -26.12939453125, -24.8740234375, -23.61865234375, -22.36328125, -21.10791015625, -19.8525390625, -18.59716796875, -17.341796875, -16.08642578125, -14.8310546875, -13.57568359375, -12.3203125, -11.06494140625, -9.8095703125, -8.55419921875, -7.298828125, -6.04345703125, -4.7880859375, -3.53271484375, -2.27734375, -1.02197265625, 0.2333984375, 1.48876953125, 2.744140625, 3.99951171875, 5.2548828125, 6.51025390625, 7.765625, 9.02099609375, 10.2763671875, 11.53173828125, 12.787109375, 14.04248046875, 15.2978515625, 16.55322265625, 17.80859375, 19.06396484375, 20.3193359375, 21.57470703125, 22.830078125, 24.08544921875, 25.3408203125, 26.59619140625, 27.8515625, 29.10693359375, 30.3623046875, 31.61767578125, 32.873046875, 34.12841796875, 35.3837890625, 36.63916015625, 37.89453125, 39.14990234375, 40.4052734375, 41.66064453125, 42.916015625, 44.17138671875, 45.4267578125, 46.68212890625, 47.9375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 7.0, 10.0, 8.0, 14.0, 20.0, 22.0, 32.0, 31.0, 45.0, 67.0, 61.0, 77.0, 86.0, 73.0, 84.0, 78.0, 60.0, 36.0, 38.0, 30.0, 24.0, 22.0, 17.0, 9.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0020503997802734375, -0.00198933482170105, -0.0019282698631286621, -0.0018672049045562744, -0.0018061399459838867, -0.001745074987411499, -0.0016840100288391113, -0.0016229450702667236, -0.001561880111694336, -0.0015008151531219482, -0.0014397501945495605, -0.0013786852359771729, -0.0013176202774047852, -0.0012565553188323975, -0.0011954903602600098, -0.001134425401687622, -0.0010733604431152344, -0.0010122954845428467, -0.000951230525970459, -0.0008901655673980713, -0.0008291006088256836, -0.0007680356502532959, -0.0007069706916809082, -0.0006459057331085205, -0.0005848407745361328, -0.0005237758159637451, -0.0004627108573913574, -0.0004016458988189697, -0.00034058094024658203, -0.00027951598167419434, -0.00021845102310180664, -0.00015738606452941895, -9.632110595703125e-05, -3.5256147384643555e-05, 2.580881118774414e-05, 8.687376976013184e-05, 0.00014793872833251953, 0.00020900368690490723, 0.0002700686454772949, 0.0003311336040496826, 0.0003921985626220703, 0.000453263521194458, 0.0005143284797668457, 0.0005753934383392334, 0.0006364583969116211, 0.0006975233554840088, 0.0007585883140563965, 0.0008196532726287842, 0.0008807182312011719, 0.0009417831897735596, 0.0010028481483459473, 0.001063913106918335, 0.0011249780654907227, 0.0011860430240631104, 0.001247107982635498, 0.0013081729412078857, 0.0013692378997802734, 0.0014303028583526611, 0.0014913678169250488, 0.0015524327754974365, 0.0016134977340698242, 0.001674562692642212, 0.0017356276512145996, 0.0017966926097869873, 0.001857757568359375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 14.0, 9.0, 10.0, 22.0, 26.0, 53.0, 57.0, 101.0, 173.0, 242.0, 405.0, 746.0, 1433.0, 3079.0, 9245.0, 72147.0, 830242.0, 112212.0, 11166.0, 3448.0, 1566.0, 857.0, 429.0, 318.0, 181.0, 113.0, 73.0, 62.0, 35.0, 22.0, 14.0, 20.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.96875, -26.98974609375, -26.0107421875, -25.03173828125, -24.052734375, -23.07373046875, -22.0947265625, -21.11572265625, -20.13671875, -19.15771484375, -18.1787109375, -17.19970703125, -16.220703125, -15.24169921875, -14.2626953125, -13.28369140625, -12.3046875, -11.32568359375, -10.3466796875, -9.36767578125, -8.388671875, -7.40966796875, -6.4306640625, -5.45166015625, -4.47265625, -3.49365234375, -2.5146484375, -1.53564453125, -0.556640625, 0.42236328125, 1.4013671875, 2.38037109375, 3.359375, 4.33837890625, 5.3173828125, 6.29638671875, 7.275390625, 8.25439453125, 9.2333984375, 10.21240234375, 11.19140625, 12.17041015625, 13.1494140625, 14.12841796875, 15.107421875, 16.08642578125, 17.0654296875, 18.04443359375, 19.0234375, 20.00244140625, 20.9814453125, 21.96044921875, 22.939453125, 23.91845703125, 24.8974609375, 25.87646484375, 26.85546875, 27.83447265625, 28.8134765625, 29.79248046875, 30.771484375, 31.75048828125, 32.7294921875, 33.70849609375, 34.6875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 13.0, 14.0, 28.0, 64.0, 80.0, 170.0, 204.0, 178.0, 112.0, 55.0, 27.0, 13.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.8125, -26.983154296875, -26.15380859375, -25.324462890625, -24.4951171875, -23.665771484375, -22.83642578125, -22.007080078125, -21.177734375, -20.348388671875, -19.51904296875, -18.689697265625, -17.8603515625, -17.031005859375, -16.20166015625, -15.372314453125, -14.54296875, -13.713623046875, -12.88427734375, -12.054931640625, -11.2255859375, -10.396240234375, -9.56689453125, -8.737548828125, -7.908203125, -7.078857421875, -6.24951171875, -5.420166015625, -4.5908203125, -3.761474609375, -2.93212890625, -2.102783203125, -1.2734375, -0.444091796875, 0.38525390625, 1.214599609375, 2.0439453125, 2.873291015625, 3.70263671875, 4.531982421875, 5.361328125, 6.190673828125, 7.02001953125, 7.849365234375, 8.6787109375, 9.508056640625, 10.33740234375, 11.166748046875, 11.99609375, 12.825439453125, 13.65478515625, 14.484130859375, 15.3134765625, 16.142822265625, 16.97216796875, 17.801513671875, 18.630859375, 19.460205078125, 20.28955078125, 21.118896484375, 21.9482421875, 22.777587890625, 23.60693359375, 24.436279296875, 25.265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 12.0, 30.0, 92.0, 246.0, 368.0, 192.0, 48.0, 14.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-740.3248291015625, -721.56005859375, -702.7952880859375, -684.030517578125, -665.2657470703125, -646.5009765625, -627.7362060546875, -608.971435546875, -590.2066650390625, -571.44189453125, -552.6771240234375, -533.912353515625, -515.1475830078125, -496.3828125, -477.6180725097656, -458.8533020019531, -440.08856201171875, -421.32379150390625, -402.55902099609375, -383.79425048828125, -365.02947998046875, -346.26470947265625, -327.4999694824219, -308.7351989746094, -289.9704284667969, -271.2056579589844, -252.44088745117188, -233.67613220214844, -214.91136169433594, -196.14659118652344, -177.3818359375, -158.6170654296875, -139.852294921875, -121.0875244140625, -102.32276153564453, -83.55799865722656, -64.79322814941406, -46.02845764160156, -27.263694763183594, -8.498931884765625, 10.265838623046875, 29.03060531616211, 47.795372009277344, 66.56013488769531, 85.32490539550781, 104.08967590332031, 122.85443878173828, 141.61920166015625, 160.38397216796875, 179.14874267578125, 197.91351318359375, 216.6782684326172, 235.4430389404297, 254.2078094482422, 272.9725646972656, 291.7373352050781, 310.5021057128906, 329.2668762207031, 348.0316467285156, 366.7964172363281, 385.5611572265625, 404.325927734375, 423.0906982421875, 441.85546875, 460.6202392578125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 13.0, 13.0, 13.0, 16.0, 19.0, 20.0, 27.0, 18.0, 36.0, 30.0, 44.0, 46.0, 49.0, 39.0, 48.0, 60.0, 43.0, 48.0, 48.0, 34.0, 38.0, 50.0, 28.0, 26.0, 33.0, 22.0, 25.0, 17.0, 17.0, 13.0, 15.0, 14.0, 4.0, 4.0, 4.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-200.6685791015625, -195.3905792236328, -190.1125946044922, -184.8345947265625, -179.55661010742188, -174.2786102294922, -169.0006103515625, -163.72262573242188, -158.4446258544922, -153.1666259765625, -147.88864135742188, -142.6106414794922, -137.3326416015625, -132.05465698242188, -126.77665710449219, -121.49866485595703, -116.22067260742188, -110.94268035888672, -105.66468811035156, -100.38668823242188, -95.10869598388672, -89.83070373535156, -84.55270385742188, -79.27471160888672, -73.99671936035156, -68.7187271118164, -63.440731048583984, -58.16273498535156, -52.884742736816406, -47.60675048828125, -42.32875442504883, -37.050758361816406, -31.77276611328125, -26.49477195739746, -21.216777801513672, -15.938783645629883, -10.660789489746094, -5.382795333862305, -0.10480117797851562, 5.173194885253906, 10.451187133789062, 15.729181289672852, 21.00717544555664, 26.28516960144043, 31.56316375732422, 36.841156005859375, 42.1191520690918, 47.39714813232422, 52.675140380859375, 57.95313262939453, 63.23112869262695, 68.50912475585938, 73.78711700439453, 79.06510925292969, 84.34310913085938, 89.62110137939453, 94.89909362792969, 100.17708587646484, 105.455078125, 110.73307800292969, 116.01107025146484, 121.2890625, 126.56706237792969, 131.84506225585938, 137.123046875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 12.0, 18.0, 17.0, 18.0, 46.0, 50.0, 102.0, 122.0, 221.0, 479.0, 1175.0, 3054.0, 11172.0, 73948.0, 3680515.0, 385897.0, 28588.0, 5800.0, 1796.0, 664.0, 250.0, 125.0, 67.0, 53.0, 24.0, 22.0, 16.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.3125, -47.7099609375, -46.107421875, -44.5048828125, -42.90234375, -41.2998046875, -39.697265625, -38.0947265625, -36.4921875, -34.8896484375, -33.287109375, -31.6845703125, -30.08203125, -28.4794921875, -26.876953125, -25.2744140625, -23.671875, -22.0693359375, -20.466796875, -18.8642578125, -17.26171875, -15.6591796875, -14.056640625, -12.4541015625, -10.8515625, -9.2490234375, -7.646484375, -6.0439453125, -4.44140625, -2.8388671875, -1.236328125, 0.3662109375, 1.96875, 3.5712890625, 5.173828125, 6.7763671875, 8.37890625, 9.9814453125, 11.583984375, 13.1865234375, 14.7890625, 16.3916015625, 17.994140625, 19.5966796875, 21.19921875, 22.8017578125, 24.404296875, 26.0068359375, 27.609375, 29.2119140625, 30.814453125, 32.4169921875, 34.01953125, 35.6220703125, 37.224609375, 38.8271484375, 40.4296875, 42.0322265625, 43.634765625, 45.2373046875, 46.83984375, 48.4423828125, 50.044921875, 51.6474609375, 53.25]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 8.0, 15.0, 32.0, 36.0, 40.0, 47.0, 64.0, 69.0, 80.0, 77.0, 74.0, 84.0, 66.0, 53.0, 64.0, 50.0, 46.0, 34.0, 12.0, 10.0, 6.0, 7.0, 1.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.6953125, -14.35406494140625, -14.0128173828125, -13.67156982421875, -13.330322265625, -12.98907470703125, -12.6478271484375, -12.30657958984375, -11.96533203125, -11.62408447265625, -11.2828369140625, -10.94158935546875, -10.600341796875, -10.25909423828125, -9.9178466796875, -9.57659912109375, -9.2353515625, -8.89410400390625, -8.5528564453125, -8.21160888671875, -7.870361328125, -7.52911376953125, -7.1878662109375, -6.84661865234375, -6.50537109375, -6.16412353515625, -5.8228759765625, -5.48162841796875, -5.140380859375, -4.79913330078125, -4.4578857421875, -4.11663818359375, -3.775390625, -3.43414306640625, -3.0928955078125, -2.75164794921875, -2.410400390625, -2.06915283203125, -1.7279052734375, -1.38665771484375, -1.04541015625, -0.70416259765625, -0.3629150390625, -0.02166748046875, 0.319580078125, 0.66082763671875, 1.0020751953125, 1.34332275390625, 1.6845703125, 2.02581787109375, 2.3670654296875, 2.70831298828125, 3.049560546875, 3.39080810546875, 3.7320556640625, 4.07330322265625, 4.41455078125, 4.75579833984375, 5.0970458984375, 5.43829345703125, 5.779541015625, 6.12078857421875, 6.4620361328125, 6.80328369140625, 7.14453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 16.0, 15.0, 20.0, 26.0, 26.0, 54.0, 63.0, 121.0, 232.0, 536.0, 1550.0, 7645.0, 78883.0, 3839942.0, 245898.0, 14964.0, 2726.0, 804.0, 315.0, 149.0, 72.0, 55.0, 39.0, 31.0, 23.0, 15.0, 22.0, 6.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-73.375, -71.52490234375, -69.6748046875, -67.82470703125, -65.974609375, -64.12451171875, -62.2744140625, -60.42431640625, -58.57421875, -56.72412109375, -54.8740234375, -53.02392578125, -51.173828125, -49.32373046875, -47.4736328125, -45.62353515625, -43.7734375, -41.92333984375, -40.0732421875, -38.22314453125, -36.373046875, -34.52294921875, -32.6728515625, -30.82275390625, -28.97265625, -27.12255859375, -25.2724609375, -23.42236328125, -21.572265625, -19.72216796875, -17.8720703125, -16.02197265625, -14.171875, -12.32177734375, -10.4716796875, -8.62158203125, -6.771484375, -4.92138671875, -3.0712890625, -1.22119140625, 0.62890625, 2.47900390625, 4.3291015625, 6.17919921875, 8.029296875, 9.87939453125, 11.7294921875, 13.57958984375, 15.4296875, 17.27978515625, 19.1298828125, 20.97998046875, 22.830078125, 24.68017578125, 26.5302734375, 28.38037109375, 30.23046875, 32.08056640625, 33.9306640625, 35.78076171875, 37.630859375, 39.48095703125, 41.3310546875, 43.18115234375, 45.03125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 17.0, 14.0, 16.0, 36.0, 85.0, 138.0, 285.0, 937.0, 1725.0, 408.0, 169.0, 90.0, 63.0, 22.0, 18.0, 10.0, 12.0, 12.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.5322265625, -16.017578125, -15.5029296875, -14.98828125, -14.4736328125, -13.958984375, -13.4443359375, -12.9296875, -12.4150390625, -11.900390625, -11.3857421875, -10.87109375, -10.3564453125, -9.841796875, -9.3271484375, -8.8125, -8.2978515625, -7.783203125, -7.2685546875, -6.75390625, -6.2392578125, -5.724609375, -5.2099609375, -4.6953125, -4.1806640625, -3.666015625, -3.1513671875, -2.63671875, -2.1220703125, -1.607421875, -1.0927734375, -0.578125, -0.0634765625, 0.451171875, 0.9658203125, 1.48046875, 1.9951171875, 2.509765625, 3.0244140625, 3.5390625, 4.0537109375, 4.568359375, 5.0830078125, 5.59765625, 6.1123046875, 6.626953125, 7.1416015625, 7.65625, 8.1708984375, 8.685546875, 9.2001953125, 9.71484375, 10.2294921875, 10.744140625, 11.2587890625, 11.7734375, 12.2880859375, 12.802734375, 13.3173828125, 13.83203125, 14.3466796875, 14.861328125, 15.3759765625, 15.890625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 13.0, 19.0, 38.0, 90.0, 150.0, 239.0, 191.0, 132.0, 68.0, 25.0, 18.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-72.64815521240234, -68.71588134765625, -64.78360748291016, -60.8513298034668, -56.9190559387207, -52.98678207397461, -49.05450439453125, -45.122230529785156, -41.18995666503906, -37.25768280029297, -33.325408935546875, -29.393131256103516, -25.460857391357422, -21.528583526611328, -17.5963077545166, -13.664031982421875, -9.731758117675781, -5.799483299255371, -1.867208480834961, 2.065066337585449, 5.997341156005859, 9.929615020751953, 13.86189079284668, 17.794166564941406, 21.7264404296875, 25.658714294433594, 29.59099006652832, 33.52326583862305, 37.45553970336914, 41.387813568115234, 45.320091247558594, 49.25236511230469, 53.18463134765625, 57.116905212402344, 61.04917907714844, 64.98145294189453, 68.91372680664062, 72.84600830078125, 76.77828216552734, 80.71055603027344, 84.64282989501953, 88.57510375976562, 92.50737762451172, 96.43965148925781, 100.37193298339844, 104.30419921875, 108.23648071289062, 112.16875457763672, 116.10102844238281, 120.0333023071289, 123.965576171875, 127.8978500366211, 131.8301239013672, 135.7624053955078, 139.69467163085938, 143.626953125, 147.55923461914062, 151.49151611328125, 155.4237823486328, 159.35606384277344, 163.288330078125, 167.22061157226562, 171.1528778076172, 175.0851593017578, 179.01742553710938]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 8.0, 8.0, 12.0, 16.0, 15.0, 20.0, 22.0, 24.0, 25.0, 42.0, 36.0, 44.0, 44.0, 49.0, 49.0, 48.0, 52.0, 62.0, 44.0, 47.0, 52.0, 37.0, 36.0, 33.0, 30.0, 20.0, 20.0, 23.0, 22.0, 19.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.73074722290039, -45.22427749633789, -43.71780776977539, -42.21133804321289, -40.70486831665039, -39.19839859008789, -37.691925048828125, -36.185455322265625, -34.678985595703125, -33.172515869140625, -31.666046142578125, -30.159576416015625, -28.653106689453125, -27.146636962890625, -25.640165328979492, -24.133695602416992, -22.627227783203125, -21.120758056640625, -19.614288330078125, -18.107818603515625, -16.601348876953125, -15.094878196716309, -13.588407516479492, -12.081937789916992, -10.575468063354492, -9.068998336791992, -7.562528133392334, -6.056057929992676, -4.549588203430176, -3.043118476867676, -1.5366477966308594, -0.030178070068359375, 1.4762954711914062, 2.9827654361724854, 4.4892354011535645, 5.995705604553223, 7.502175331115723, 9.008645057678223, 10.515115737915039, 12.021585464477539, 13.528055191040039, 15.034524917602539, 16.54099464416504, 18.047466278076172, 19.553936004638672, 21.060405731201172, 22.566875457763672, 24.073345184326172, 25.579814910888672, 27.086284637451172, 28.592754364013672, 30.099224090576172, 31.605693817138672, 33.11216354370117, 34.61863708496094, 36.12510681152344, 37.63157653808594, 39.13804626464844, 40.64451599121094, 42.15098571777344, 43.65745544433594, 45.16392517089844, 46.67039489746094, 48.17686462402344, 49.68333435058594]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 6.0, 10.0, 10.0, 10.0, 19.0, 39.0, 42.0, 45.0, 88.0, 129.0, 203.0, 305.0, 608.0, 1152.0, 2469.0, 6565.0, 19050.0, 66443.0, 241573.0, 444618.0, 189206.0, 51058.0, 14976.0, 5348.0, 2186.0, 1004.0, 522.0, 293.0, 184.0, 112.0, 77.0, 43.0, 43.0, 34.0, 19.0, 16.0, 9.0, 10.0, 2.0, 8.0, 2.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-42.15625, -40.89404296875, -39.6318359375, -38.36962890625, -37.107421875, -35.84521484375, -34.5830078125, -33.32080078125, -32.05859375, -30.79638671875, -29.5341796875, -28.27197265625, -27.009765625, -25.74755859375, -24.4853515625, -23.22314453125, -21.9609375, -20.69873046875, -19.4365234375, -18.17431640625, -16.912109375, -15.64990234375, -14.3876953125, -13.12548828125, -11.86328125, -10.60107421875, -9.3388671875, -8.07666015625, -6.814453125, -5.55224609375, -4.2900390625, -3.02783203125, -1.765625, -0.50341796875, 0.7587890625, 2.02099609375, 3.283203125, 4.54541015625, 5.8076171875, 7.06982421875, 8.33203125, 9.59423828125, 10.8564453125, 12.11865234375, 13.380859375, 14.64306640625, 15.9052734375, 17.16748046875, 18.4296875, 19.69189453125, 20.9541015625, 22.21630859375, 23.478515625, 24.74072265625, 26.0029296875, 27.26513671875, 28.52734375, 29.78955078125, 31.0517578125, 32.31396484375, 33.576171875, 34.83837890625, 36.1005859375, 37.36279296875, 38.625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 15.0, 27.0, 47.0, 40.0, 57.0, 67.0, 84.0, 71.0, 90.0, 81.0, 90.0, 63.0, 66.0, 49.0, 41.0, 26.0, 30.0, 19.0, 6.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.61798095703125, -14.2672119140625, -13.91644287109375, -13.565673828125, -13.21490478515625, -12.8641357421875, -12.51336669921875, -12.16259765625, -11.81182861328125, -11.4610595703125, -11.11029052734375, -10.759521484375, -10.40875244140625, -10.0579833984375, -9.70721435546875, -9.3564453125, -9.00567626953125, -8.6549072265625, -8.30413818359375, -7.953369140625, -7.60260009765625, -7.2518310546875, -6.90106201171875, -6.55029296875, -6.19952392578125, -5.8487548828125, -5.49798583984375, -5.147216796875, -4.79644775390625, -4.4456787109375, -4.09490966796875, -3.744140625, -3.39337158203125, -3.0426025390625, -2.69183349609375, -2.341064453125, -1.99029541015625, -1.6395263671875, -1.28875732421875, -0.93798828125, -0.58721923828125, -0.2364501953125, 0.11431884765625, 0.465087890625, 0.81585693359375, 1.1666259765625, 1.51739501953125, 1.8681640625, 2.21893310546875, 2.5697021484375, 2.92047119140625, 3.271240234375, 3.62200927734375, 3.9727783203125, 4.32354736328125, 4.67431640625, 5.02508544921875, 5.3758544921875, 5.72662353515625, 6.077392578125, 6.42816162109375, 6.7789306640625, 7.12969970703125, 7.48046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 4.0, 15.0, 17.0, 20.0, 22.0, 35.0, 42.0, 54.0, 89.0, 127.0, 189.0, 274.0, 411.0, 527.0, 907.0, 1737.0, 3739.0, 8768.0, 24258.0, 75194.0, 242174.0, 413747.0, 186105.0, 57250.0, 18786.0, 7127.0, 2980.0, 1462.0, 844.0, 522.0, 321.0, 226.0, 149.0, 117.0, 90.0, 57.0, 42.0, 27.0, 31.0, 22.0, 10.0, 8.0, 4.0, 5.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.875, -28.952392578125, -28.02978515625, -27.107177734375, -26.1845703125, -25.261962890625, -24.33935546875, -23.416748046875, -22.494140625, -21.571533203125, -20.64892578125, -19.726318359375, -18.8037109375, -17.881103515625, -16.95849609375, -16.035888671875, -15.11328125, -14.190673828125, -13.26806640625, -12.345458984375, -11.4228515625, -10.500244140625, -9.57763671875, -8.655029296875, -7.732421875, -6.809814453125, -5.88720703125, -4.964599609375, -4.0419921875, -3.119384765625, -2.19677734375, -1.274169921875, -0.3515625, 0.571044921875, 1.49365234375, 2.416259765625, 3.3388671875, 4.261474609375, 5.18408203125, 6.106689453125, 7.029296875, 7.951904296875, 8.87451171875, 9.797119140625, 10.7197265625, 11.642333984375, 12.56494140625, 13.487548828125, 14.41015625, 15.332763671875, 16.25537109375, 17.177978515625, 18.1005859375, 19.023193359375, 19.94580078125, 20.868408203125, 21.791015625, 22.713623046875, 23.63623046875, 24.558837890625, 25.4814453125, 26.404052734375, 27.32666015625, 28.249267578125, 29.171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 13.0, 10.0, 12.0, 12.0, 14.0, 15.0, 17.0, 18.0, 26.0, 32.0, 28.0, 37.0, 42.0, 41.0, 49.0, 35.0, 56.0, 44.0, 46.0, 43.0, 49.0, 39.0, 38.0, 40.0, 34.0, 32.0, 34.0, 28.0, 13.0, 18.0, 21.0, 10.0, 10.0, 8.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-32.5625, -31.65966796875, -30.7568359375, -29.85400390625, -28.951171875, -28.04833984375, -27.1455078125, -26.24267578125, -25.33984375, -24.43701171875, -23.5341796875, -22.63134765625, -21.728515625, -20.82568359375, -19.9228515625, -19.02001953125, -18.1171875, -17.21435546875, -16.3115234375, -15.40869140625, -14.505859375, -13.60302734375, -12.7001953125, -11.79736328125, -10.89453125, -9.99169921875, -9.0888671875, -8.18603515625, -7.283203125, -6.38037109375, -5.4775390625, -4.57470703125, -3.671875, -2.76904296875, -1.8662109375, -0.96337890625, -0.060546875, 0.84228515625, 1.7451171875, 2.64794921875, 3.55078125, 4.45361328125, 5.3564453125, 6.25927734375, 7.162109375, 8.06494140625, 8.9677734375, 9.87060546875, 10.7734375, 11.67626953125, 12.5791015625, 13.48193359375, 14.384765625, 15.28759765625, 16.1904296875, 17.09326171875, 17.99609375, 18.89892578125, 19.8017578125, 20.70458984375, 21.607421875, 22.51025390625, 23.4130859375, 24.31591796875, 25.21875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 4.0, 13.0, 13.0, 27.0, 53.0, 89.0, 171.0, 341.0, 732.0, 1836.0, 5458.0, 23691.0, 227371.0, 686410.0, 83903.0, 12567.0, 3464.0, 1230.0, 547.0, 282.0, 128.0, 72.0, 38.0, 30.0, 15.0, 9.0, 17.0, 3.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-27.453125, -26.675537109375, -25.89794921875, -25.120361328125, -24.3427734375, -23.565185546875, -22.78759765625, -22.010009765625, -21.232421875, -20.454833984375, -19.67724609375, -18.899658203125, -18.1220703125, -17.344482421875, -16.56689453125, -15.789306640625, -15.01171875, -14.234130859375, -13.45654296875, -12.678955078125, -11.9013671875, -11.123779296875, -10.34619140625, -9.568603515625, -8.791015625, -8.013427734375, -7.23583984375, -6.458251953125, -5.6806640625, -4.903076171875, -4.12548828125, -3.347900390625, -2.5703125, -1.792724609375, -1.01513671875, -0.237548828125, 0.5400390625, 1.317626953125, 2.09521484375, 2.872802734375, 3.650390625, 4.427978515625, 5.20556640625, 5.983154296875, 6.7607421875, 7.538330078125, 8.31591796875, 9.093505859375, 9.87109375, 10.648681640625, 11.42626953125, 12.203857421875, 12.9814453125, 13.759033203125, 14.53662109375, 15.314208984375, 16.091796875, 16.869384765625, 17.64697265625, 18.424560546875, 19.2021484375, 19.979736328125, 20.75732421875, 21.534912109375, 22.3125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 12.0, 10.0, 10.0, 26.0, 34.0, 64.0, 91.0, 101.0, 144.0, 166.0, 118.0, 67.0, 57.0, 38.0, 21.0, 10.0, 12.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003177642822265625, -0.0030638575553894043, -0.0029500722885131836, -0.002836287021636963, -0.002722501754760742, -0.0026087164878845215, -0.0024949312210083008, -0.00238114595413208, -0.0022673606872558594, -0.0021535754203796387, -0.002039790153503418, -0.0019260048866271973, -0.0018122196197509766, -0.0016984343528747559, -0.0015846490859985352, -0.0014708638191223145, -0.0013570785522460938, -0.001243293285369873, -0.0011295080184936523, -0.0010157227516174316, -0.0009019374847412109, -0.0007881522178649902, -0.0006743669509887695, -0.0005605816841125488, -0.0004467964172363281, -0.0003330111503601074, -0.00021922588348388672, -0.00010544061660766602, 8.344650268554688e-06, 0.0001221299171447754, 0.0002359151840209961, 0.0003497004508972168, 0.0004634857177734375, 0.0005772709846496582, 0.0006910562515258789, 0.0008048415184020996, 0.0009186267852783203, 0.001032412052154541, 0.0011461973190307617, 0.0012599825859069824, 0.0013737678527832031, 0.0014875531196594238, 0.0016013383865356445, 0.0017151236534118652, 0.001828908920288086, 0.0019426941871643066, 0.0020564794540405273, 0.002170264720916748, 0.0022840499877929688, 0.0023978352546691895, 0.00251162052154541, 0.002625405788421631, 0.0027391910552978516, 0.0028529763221740723, 0.002966761589050293, 0.0030805468559265137, 0.0031943321228027344, 0.003308117389678955, 0.0034219026565551758, 0.0035356879234313965, 0.003649473190307617, 0.003763258457183838, 0.0038770437240600586, 0.003990828990936279, 0.0041046142578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 7.0, 11.0, 12.0, 21.0, 30.0, 36.0, 33.0, 67.0, 121.0, 203.0, 287.0, 546.0, 1209.0, 2831.0, 8605.0, 42477.0, 388439.0, 526558.0, 59789.0, 10932.0, 3426.0, 1368.0, 644.0, 344.0, 182.0, 127.0, 80.0, 67.0, 32.0, 26.0, 17.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-24.796875, -24.1624755859375, -23.528076171875, -22.8936767578125, -22.25927734375, -21.6248779296875, -20.990478515625, -20.3560791015625, -19.7216796875, -19.0872802734375, -18.452880859375, -17.8184814453125, -17.18408203125, -16.5496826171875, -15.915283203125, -15.2808837890625, -14.646484375, -14.0120849609375, -13.377685546875, -12.7432861328125, -12.10888671875, -11.4744873046875, -10.840087890625, -10.2056884765625, -9.5712890625, -8.9368896484375, -8.302490234375, -7.6680908203125, -7.03369140625, -6.3992919921875, -5.764892578125, -5.1304931640625, -4.49609375, -3.8616943359375, -3.227294921875, -2.5928955078125, -1.95849609375, -1.3240966796875, -0.689697265625, -0.0552978515625, 0.5791015625, 1.2135009765625, 1.847900390625, 2.4822998046875, 3.11669921875, 3.7510986328125, 4.385498046875, 5.0198974609375, 5.654296875, 6.2886962890625, 6.923095703125, 7.5574951171875, 8.19189453125, 8.8262939453125, 9.460693359375, 10.0950927734375, 10.7294921875, 11.3638916015625, 11.998291015625, 12.6326904296875, 13.26708984375, 13.9014892578125, 14.535888671875, 15.1702880859375, 15.8046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 6.0, 12.0, 20.0, 32.0, 27.0, 46.0, 77.0, 111.0, 105.0, 120.0, 131.0, 84.0, 76.0, 39.0, 29.0, 19.0, 10.0, 8.0, 9.0, 7.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.375, -19.8673095703125, -19.359619140625, -18.8519287109375, -18.34423828125, -17.8365478515625, -17.328857421875, -16.8211669921875, -16.3134765625, -15.8057861328125, -15.298095703125, -14.7904052734375, -14.28271484375, -13.7750244140625, -13.267333984375, -12.7596435546875, -12.251953125, -11.7442626953125, -11.236572265625, -10.7288818359375, -10.22119140625, -9.7135009765625, -9.205810546875, -8.6981201171875, -8.1904296875, -7.6827392578125, -7.175048828125, -6.6673583984375, -6.15966796875, -5.6519775390625, -5.144287109375, -4.6365966796875, -4.12890625, -3.6212158203125, -3.113525390625, -2.6058349609375, -2.09814453125, -1.5904541015625, -1.082763671875, -0.5750732421875, -0.0673828125, 0.4403076171875, 0.947998046875, 1.4556884765625, 1.96337890625, 2.4710693359375, 2.978759765625, 3.4864501953125, 3.994140625, 4.5018310546875, 5.009521484375, 5.5172119140625, 6.02490234375, 6.5325927734375, 7.040283203125, 7.5479736328125, 8.0556640625, 8.5633544921875, 9.071044921875, 9.5787353515625, 10.08642578125, 10.5941162109375, 11.101806640625, 11.6094970703125, 12.1171875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 14.0, 40.0, 131.0, 352.0, 304.0, 111.0, 32.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-609.5525512695312, -589.2125244140625, -568.8724975585938, -548.532470703125, -528.1924438476562, -507.8524169921875, -487.5123596191406, -467.1723327636719, -446.8323059082031, -426.4922790527344, -406.1522521972656, -385.8122253417969, -365.47216796875, -345.13214111328125, -324.7921142578125, -304.45208740234375, -284.112060546875, -263.77203369140625, -243.4320068359375, -223.0919647216797, -202.75193786621094, -182.4119110107422, -162.07186889648438, -141.73184204101562, -121.39181518554688, -101.05178833007812, -80.71175384521484, -60.37172317504883, -40.03169250488281, -19.691665649414062, 0.6483688354492188, 20.9884033203125, 41.3284912109375, 61.668521881103516, 82.00855255126953, 102.34858703613281, 122.68861389160156, 143.0286407470703, 163.36868286132812, 183.70870971679688, 204.04873657226562, 224.38876342773438, 244.72879028320312, 265.0688171386719, 285.40887451171875, 305.7489013671875, 326.08892822265625, 346.428955078125, 366.76898193359375, 387.1090087890625, 407.44903564453125, 427.7890625, 448.12908935546875, 468.4691162109375, 488.8091735839844, 509.1492004394531, 529.4892578125, 549.8292846679688, 570.1693115234375, 590.5093383789062, 610.849365234375, 631.1893920898438, 651.5294189453125, 671.8695068359375, 692.20947265625]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 7.0, 6.0, 9.0, 17.0, 14.0, 16.0, 13.0, 21.0, 13.0, 29.0, 31.0, 29.0, 26.0, 22.0, 45.0, 19.0, 35.0, 31.0, 42.0, 33.0, 46.0, 39.0, 34.0, 38.0, 40.0, 40.0, 29.0, 33.0, 30.0, 29.0, 20.0, 16.0, 19.0, 19.0, 12.0, 9.0, 14.0, 15.0, 8.0, 8.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-159.02780151367188, -154.1536407470703, -149.2794647216797, -144.40530395507812, -139.53114318847656, -134.656982421875, -129.78280639648438, -124.90864562988281, -120.03447723388672, -115.16030883789062, -110.28614807128906, -105.41197967529297, -100.53781127929688, -95.66365051269531, -90.78948211669922, -85.91531372070312, -81.04115295410156, -76.16698455810547, -71.2928237915039, -66.41865539550781, -61.544490814208984, -56.670326232910156, -51.79615783691406, -46.921993255615234, -42.047828674316406, -37.17366409301758, -32.29949951171875, -27.425331115722656, -22.551166534423828, -17.677001953125, -12.802835464477539, -7.928668975830078, -3.05450439453125, 1.8196611404418945, 6.693826675415039, 11.567992210388184, 16.442157745361328, 21.316322326660156, 26.190488815307617, 31.064655303955078, 35.938819885253906, 40.812984466552734, 45.68714904785156, 50.561317443847656, 55.435482025146484, 60.30964660644531, 65.1838150024414, 70.0579833984375, 74.93214416503906, 79.80631256103516, 84.68047332763672, 89.55464172363281, 94.42880249023438, 99.30297088623047, 104.17713928222656, 109.05130004882812, 113.92546844482422, 118.79963684082031, 123.67379760742188, 128.54795837402344, 133.42213439941406, 138.29629516601562, 143.1704559326172, 148.0446319580078, 152.91879272460938]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 15.0, 7.0, 10.0, 22.0, 34.0, 53.0, 90.0, 138.0, 196.0, 384.0, 750.0, 1776.0, 4470.0, 13661.0, 57755.0, 780516.0, 3217689.0, 89041.0, 18263.0, 5508.0, 2150.0, 858.0, 395.0, 215.0, 111.0, 77.0, 28.0, 26.0, 13.0, 8.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.40625, -39.064453125, -37.72265625, -36.380859375, -35.0390625, -33.697265625, -32.35546875, -31.013671875, -29.671875, -28.330078125, -26.98828125, -25.646484375, -24.3046875, -22.962890625, -21.62109375, -20.279296875, -18.9375, -17.595703125, -16.25390625, -14.912109375, -13.5703125, -12.228515625, -10.88671875, -9.544921875, -8.203125, -6.861328125, -5.51953125, -4.177734375, -2.8359375, -1.494140625, -0.15234375, 1.189453125, 2.53125, 3.873046875, 5.21484375, 6.556640625, 7.8984375, 9.240234375, 10.58203125, 11.923828125, 13.265625, 14.607421875, 15.94921875, 17.291015625, 18.6328125, 19.974609375, 21.31640625, 22.658203125, 24.0, 25.341796875, 26.68359375, 28.025390625, 29.3671875, 30.708984375, 32.05078125, 33.392578125, 34.734375, 36.076171875, 37.41796875, 38.759765625, 40.1015625, 41.443359375, 42.78515625, 44.126953125, 45.46875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 11.0, 13.0, 8.0, 23.0, 26.0, 31.0, 40.0, 45.0, 48.0, 57.0, 44.0, 54.0, 55.0, 65.0, 72.0, 62.0, 62.0, 59.0, 47.0, 36.0, 33.0, 26.0, 32.0, 17.0, 7.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.390625, -13.05792236328125, -12.7252197265625, -12.39251708984375, -12.059814453125, -11.72711181640625, -11.3944091796875, -11.06170654296875, -10.72900390625, -10.39630126953125, -10.0635986328125, -9.73089599609375, -9.398193359375, -9.06549072265625, -8.7327880859375, -8.40008544921875, -8.0673828125, -7.73468017578125, -7.4019775390625, -7.06927490234375, -6.736572265625, -6.40386962890625, -6.0711669921875, -5.73846435546875, -5.40576171875, -5.07305908203125, -4.7403564453125, -4.40765380859375, -4.074951171875, -3.74224853515625, -3.4095458984375, -3.07684326171875, -2.744140625, -2.41143798828125, -2.0787353515625, -1.74603271484375, -1.413330078125, -1.08062744140625, -0.7479248046875, -0.41522216796875, -0.08251953125, 0.25018310546875, 0.5828857421875, 0.91558837890625, 1.248291015625, 1.58099365234375, 1.9136962890625, 2.24639892578125, 2.5791015625, 2.91180419921875, 3.2445068359375, 3.57720947265625, 3.909912109375, 4.24261474609375, 4.5753173828125, 4.90802001953125, 5.24072265625, 5.57342529296875, 5.9061279296875, 6.23883056640625, 6.571533203125, 6.90423583984375, 7.2369384765625, 7.56964111328125, 7.90234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 9.0, 10.0, 20.0, 28.0, 38.0, 78.0, 164.0, 317.0, 665.0, 1541.0, 4496.0, 16776.0, 107595.0, 3258193.0, 737494.0, 51447.0, 10138.0, 3091.0, 1132.0, 486.0, 259.0, 129.0, 78.0, 30.0, 23.0, 14.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.25, -44.921875, -43.59375, -42.265625, -40.9375, -39.609375, -38.28125, -36.953125, -35.625, -34.296875, -32.96875, -31.640625, -30.3125, -28.984375, -27.65625, -26.328125, -25.0, -23.671875, -22.34375, -21.015625, -19.6875, -18.359375, -17.03125, -15.703125, -14.375, -13.046875, -11.71875, -10.390625, -9.0625, -7.734375, -6.40625, -5.078125, -3.75, -2.421875, -1.09375, 0.234375, 1.5625, 2.890625, 4.21875, 5.546875, 6.875, 8.203125, 9.53125, 10.859375, 12.1875, 13.515625, 14.84375, 16.171875, 17.5, 18.828125, 20.15625, 21.484375, 22.8125, 24.140625, 25.46875, 26.796875, 28.125, 29.453125, 30.78125, 32.109375, 33.4375, 34.765625, 36.09375, 37.421875, 38.75]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 9.0, 5.0, 14.0, 19.0, 27.0, 36.0, 72.0, 106.0, 209.0, 499.0, 1491.0, 848.0, 333.0, 143.0, 91.0, 59.0, 30.0, 18.0, 17.0, 9.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.03125, -17.48046875, -16.9296875, -16.37890625, -15.828125, -15.27734375, -14.7265625, -14.17578125, -13.625, -13.07421875, -12.5234375, -11.97265625, -11.421875, -10.87109375, -10.3203125, -9.76953125, -9.21875, -8.66796875, -8.1171875, -7.56640625, -7.015625, -6.46484375, -5.9140625, -5.36328125, -4.8125, -4.26171875, -3.7109375, -3.16015625, -2.609375, -2.05859375, -1.5078125, -0.95703125, -0.40625, 0.14453125, 0.6953125, 1.24609375, 1.796875, 2.34765625, 2.8984375, 3.44921875, 4.0, 4.55078125, 5.1015625, 5.65234375, 6.203125, 6.75390625, 7.3046875, 7.85546875, 8.40625, 8.95703125, 9.5078125, 10.05859375, 10.609375, 11.16015625, 11.7109375, 12.26171875, 12.8125, 13.36328125, 13.9140625, 14.46484375, 15.015625, 15.56640625, 16.1171875, 16.66796875, 17.21875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 0.0, 7.0, 17.0, 36.0, 174.0, 265.0, 288.0, 143.0, 49.0, 10.0, 6.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.77386474609375, -194.27395629882812, -187.77406311035156, -181.27415466308594, -174.77426147460938, -168.27435302734375, -161.77444458007812, -155.2745361328125, -148.77464294433594, -142.2747344970703, -135.77484130859375, -129.27493286132812, -122.77503204345703, -116.27513122558594, -109.77522277832031, -103.27532196044922, -96.77542114257812, -90.27552032470703, -83.77561950683594, -77.27571105957031, -70.77581024169922, -64.27590942382812, -57.776004791259766, -51.276100158691406, -44.77619934082031, -38.27629852294922, -31.77639389038086, -25.276491165161133, -18.776588439941406, -12.276687622070312, -5.776782989501953, 0.7231216430664062, 7.2230224609375, 13.722925186157227, 20.222827911376953, 26.72273063659668, 33.222633361816406, 39.7225341796875, 46.22243881225586, 52.72234344482422, 59.22224426269531, 65.7221450805664, 72.2220458984375, 78.72195434570312, 85.22185516357422, 91.72175598144531, 98.22166442871094, 104.72156524658203, 111.22146606445312, 117.72136688232422, 124.22126770019531, 130.72117614746094, 137.2210693359375, 143.72097778320312, 150.22088623046875, 156.72079467773438, 163.22068786621094, 169.72059631347656, 176.22048950195312, 182.72039794921875, 189.22030639648438, 195.72019958496094, 202.22010803222656, 208.72000122070312, 215.21990966796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 11.0, 9.0, 7.0, 14.0, 17.0, 6.0, 12.0, 15.0, 29.0, 23.0, 27.0, 30.0, 31.0, 48.0, 32.0, 31.0, 47.0, 40.0, 35.0, 42.0, 46.0, 46.0, 37.0, 36.0, 41.0, 37.0, 21.0, 40.0, 30.0, 27.0, 25.0, 19.0, 11.0, 17.0, 12.0, 9.0, 7.0, 9.0, 10.0, 5.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-52.19124984741211, -50.71160888671875, -49.23196792602539, -47.75232696533203, -46.272682189941406, -44.79304122924805, -43.31340026855469, -41.83375930786133, -40.35411834716797, -38.87447738647461, -37.39483642578125, -35.91519546508789, -34.43555450439453, -32.955909729003906, -31.476268768310547, -29.996627807617188, -28.516986846923828, -27.03734588623047, -25.55770492553711, -24.078062057495117, -22.598421096801758, -21.1187801361084, -19.639137268066406, -18.159496307373047, -16.679855346679688, -15.200214385986328, -13.720572471618652, -12.240930557250977, -10.761289596557617, -9.281648635864258, -7.802006721496582, -6.322364807128906, -4.8427276611328125, -3.363086223602295, -1.8834447860717773, -0.40380334854125977, 1.0758380889892578, 2.5554795265197754, 4.035120964050293, 5.514762878417969, 6.994403839111328, 8.474044799804688, 9.953686714172363, 11.433328628540039, 12.912969589233398, 14.392610549926758, 15.872252464294434, 17.35189437866211, 18.83153533935547, 20.311176300048828, 21.790817260742188, 23.27046012878418, 24.75010108947754, 26.2297420501709, 27.70938491821289, 29.18902587890625, 30.66866683959961, 32.14830780029297, 33.62794876098633, 35.10758972167969, 36.58723449707031, 38.06687545776367, 39.54651641845703, 41.02615737915039, 42.50579833984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 7.0, 15.0, 14.0, 27.0, 39.0, 78.0, 103.0, 213.0, 356.0, 704.0, 1579.0, 3791.0, 9950.0, 31007.0, 112247.0, 458741.0, 317783.0, 76760.0, 22088.0, 7484.0, 2936.0, 1251.0, 578.0, 304.0, 157.0, 143.0, 77.0, 34.0, 22.0, 14.0, 9.0, 11.0, 11.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.65625, -34.27734375, -32.8984375, -31.51953125, -30.140625, -28.76171875, -27.3828125, -26.00390625, -24.625, -23.24609375, -21.8671875, -20.48828125, -19.109375, -17.73046875, -16.3515625, -14.97265625, -13.59375, -12.21484375, -10.8359375, -9.45703125, -8.078125, -6.69921875, -5.3203125, -3.94140625, -2.5625, -1.18359375, 0.1953125, 1.57421875, 2.953125, 4.33203125, 5.7109375, 7.08984375, 8.46875, 9.84765625, 11.2265625, 12.60546875, 13.984375, 15.36328125, 16.7421875, 18.12109375, 19.5, 20.87890625, 22.2578125, 23.63671875, 25.015625, 26.39453125, 27.7734375, 29.15234375, 30.53125, 31.91015625, 33.2890625, 34.66796875, 36.046875, 37.42578125, 38.8046875, 40.18359375, 41.5625, 42.94140625, 44.3203125, 45.69921875, 47.078125, 48.45703125, 49.8359375, 51.21484375, 52.59375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 12.0, 10.0, 15.0, 8.0, 21.0, 26.0, 43.0, 44.0, 40.0, 37.0, 52.0, 49.0, 59.0, 59.0, 64.0, 65.0, 72.0, 58.0, 43.0, 41.0, 39.0, 31.0, 24.0, 28.0, 18.0, 12.0, 7.0, 6.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.5078125, -12.18792724609375, -11.8680419921875, -11.54815673828125, -11.228271484375, -10.90838623046875, -10.5885009765625, -10.26861572265625, -9.94873046875, -9.62884521484375, -9.3089599609375, -8.98907470703125, -8.669189453125, -8.34930419921875, -8.0294189453125, -7.70953369140625, -7.3896484375, -7.06976318359375, -6.7498779296875, -6.42999267578125, -6.110107421875, -5.79022216796875, -5.4703369140625, -5.15045166015625, -4.83056640625, -4.51068115234375, -4.1907958984375, -3.87091064453125, -3.551025390625, -3.23114013671875, -2.9112548828125, -2.59136962890625, -2.271484375, -1.95159912109375, -1.6317138671875, -1.31182861328125, -0.991943359375, -0.67205810546875, -0.3521728515625, -0.03228759765625, 0.28759765625, 0.60748291015625, 0.9273681640625, 1.24725341796875, 1.567138671875, 1.88702392578125, 2.2069091796875, 2.52679443359375, 2.8466796875, 3.16656494140625, 3.4864501953125, 3.80633544921875, 4.126220703125, 4.44610595703125, 4.7659912109375, 5.08587646484375, 5.40576171875, 5.72564697265625, 6.0455322265625, 6.36541748046875, 6.685302734375, 7.00518798828125, 7.3250732421875, 7.64495849609375, 7.96484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 15.0, 8.0, 13.0, 22.0, 36.0, 38.0, 63.0, 84.0, 127.0, 162.0, 242.0, 394.0, 535.0, 971.0, 1979.0, 4353.0, 10939.0, 34280.0, 130905.0, 499272.0, 267692.0, 64663.0, 18736.0, 6649.0, 2784.0, 1329.0, 720.0, 429.0, 312.0, 198.0, 143.0, 107.0, 81.0, 77.0, 37.0, 40.0, 22.0, 17.0, 12.0, 8.0, 11.0, 3.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-40.125, -38.8994140625, -37.673828125, -36.4482421875, -35.22265625, -33.9970703125, -32.771484375, -31.5458984375, -30.3203125, -29.0947265625, -27.869140625, -26.6435546875, -25.41796875, -24.1923828125, -22.966796875, -21.7412109375, -20.515625, -19.2900390625, -18.064453125, -16.8388671875, -15.61328125, -14.3876953125, -13.162109375, -11.9365234375, -10.7109375, -9.4853515625, -8.259765625, -7.0341796875, -5.80859375, -4.5830078125, -3.357421875, -2.1318359375, -0.90625, 0.3193359375, 1.544921875, 2.7705078125, 3.99609375, 5.2216796875, 6.447265625, 7.6728515625, 8.8984375, 10.1240234375, 11.349609375, 12.5751953125, 13.80078125, 15.0263671875, 16.251953125, 17.4775390625, 18.703125, 19.9287109375, 21.154296875, 22.3798828125, 23.60546875, 24.8310546875, 26.056640625, 27.2822265625, 28.5078125, 29.7333984375, 30.958984375, 32.1845703125, 33.41015625, 34.6357421875, 35.861328125, 37.0869140625, 38.3125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 9.0, 10.0, 21.0, 22.0, 16.0, 28.0, 37.0, 35.0, 41.0, 54.0, 57.0, 56.0, 54.0, 51.0, 58.0, 54.0, 50.0, 50.0, 48.0, 36.0, 33.0, 34.0, 26.0, 23.0, 23.0, 21.0, 12.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.17138671875, -38.8427734375, -37.51416015625, -36.185546875, -34.85693359375, -33.5283203125, -32.19970703125, -30.87109375, -29.54248046875, -28.2138671875, -26.88525390625, -25.556640625, -24.22802734375, -22.8994140625, -21.57080078125, -20.2421875, -18.91357421875, -17.5849609375, -16.25634765625, -14.927734375, -13.59912109375, -12.2705078125, -10.94189453125, -9.61328125, -8.28466796875, -6.9560546875, -5.62744140625, -4.298828125, -2.97021484375, -1.6416015625, -0.31298828125, 1.015625, 2.34423828125, 3.6728515625, 5.00146484375, 6.330078125, 7.65869140625, 8.9873046875, 10.31591796875, 11.64453125, 12.97314453125, 14.3017578125, 15.63037109375, 16.958984375, 18.28759765625, 19.6162109375, 20.94482421875, 22.2734375, 23.60205078125, 24.9306640625, 26.25927734375, 27.587890625, 28.91650390625, 30.2451171875, 31.57373046875, 32.90234375, 34.23095703125, 35.5595703125, 36.88818359375, 38.216796875, 39.54541015625, 40.8740234375, 42.20263671875, 43.53125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 6.0, 21.0, 54.0, 98.0, 218.0, 806.0, 19939.0, 1020073.0, 6463.0, 539.0, 185.0, 80.0, 35.0, 13.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.375, -143.48828125, -138.6015625, -133.71484375, -128.828125, -123.94140625, -119.0546875, -114.16796875, -109.28125, -104.39453125, -99.5078125, -94.62109375, -89.734375, -84.84765625, -79.9609375, -75.07421875, -70.1875, -65.30078125, -60.4140625, -55.52734375, -50.640625, -45.75390625, -40.8671875, -35.98046875, -31.09375, -26.20703125, -21.3203125, -16.43359375, -11.546875, -6.66015625, -1.7734375, 3.11328125, 8.0, 12.88671875, 17.7734375, 22.66015625, 27.546875, 32.43359375, 37.3203125, 42.20703125, 47.09375, 51.98046875, 56.8671875, 61.75390625, 66.640625, 71.52734375, 76.4140625, 81.30078125, 86.1875, 91.07421875, 95.9609375, 100.84765625, 105.734375, 110.62109375, 115.5078125, 120.39453125, 125.28125, 130.16796875, 135.0546875, 139.94140625, 144.828125, 149.71484375, 154.6015625, 159.48828125, 164.375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 2.0, 3.0, 4.0, 4.0, 17.0, 24.0, 38.0, 51.0, 98.0, 178.0, 202.0, 155.0, 97.0, 37.0, 40.0, 25.0, 15.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00624847412109375, -0.006101042032241821, -0.005953609943389893, -0.005806177854537964, -0.005658745765686035, -0.0055113136768341064, -0.005363881587982178, -0.005216449499130249, -0.00506901741027832, -0.004921585321426392, -0.004774153232574463, -0.004626721143722534, -0.0044792890548706055, -0.004331856966018677, -0.004184424877166748, -0.004036992788314819, -0.0038895606994628906, -0.003742128610610962, -0.003594696521759033, -0.0034472644329071045, -0.0032998323440551758, -0.003152400255203247, -0.0030049681663513184, -0.0028575360774993896, -0.002710103988647461, -0.0025626718997955322, -0.0024152398109436035, -0.002267807722091675, -0.002120375633239746, -0.0019729435443878174, -0.0018255114555358887, -0.00167807936668396, -0.0015306472778320312, -0.0013832151889801025, -0.0012357831001281738, -0.0010883510112762451, -0.0009409189224243164, -0.0007934868335723877, -0.000646054744720459, -0.0004986226558685303, -0.00035119056701660156, -0.00020375847816467285, -5.632638931274414e-05, 9.110569953918457e-05, 0.00023853778839111328, 0.000385969877243042, 0.0005334019660949707, 0.0006808340549468994, 0.0008282661437988281, 0.0009756982326507568, 0.0011231303215026855, 0.0012705624103546143, 0.001417994499206543, 0.0015654265880584717, 0.0017128586769104004, 0.001860290765762329, 0.002007722854614258, 0.0021551549434661865, 0.0023025870323181152, 0.002450019121170044, 0.0025974512100219727, 0.0027448832988739014, 0.00289231538772583, 0.003039747476577759, 0.0031871795654296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 10.0, 23.0, 38.0, 68.0, 184.0, 434.0, 2758.0, 160152.0, 879035.0, 4833.0, 590.0, 197.0, 112.0, 52.0, 29.0, 17.0, 10.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.1875, -87.5556640625, -83.923828125, -80.2919921875, -76.66015625, -73.0283203125, -69.396484375, -65.7646484375, -62.1328125, -58.5009765625, -54.869140625, -51.2373046875, -47.60546875, -43.9736328125, -40.341796875, -36.7099609375, -33.078125, -29.4462890625, -25.814453125, -22.1826171875, -18.55078125, -14.9189453125, -11.287109375, -7.6552734375, -4.0234375, -0.3916015625, 3.240234375, 6.8720703125, 10.50390625, 14.1357421875, 17.767578125, 21.3994140625, 25.03125, 28.6630859375, 32.294921875, 35.9267578125, 39.55859375, 43.1904296875, 46.822265625, 50.4541015625, 54.0859375, 57.7177734375, 61.349609375, 64.9814453125, 68.61328125, 72.2451171875, 75.876953125, 79.5087890625, 83.140625, 86.7724609375, 90.404296875, 94.0361328125, 97.66796875, 101.2998046875, 104.931640625, 108.5634765625, 112.1953125, 115.8271484375, 119.458984375, 123.0908203125, 126.72265625, 130.3544921875, 133.986328125, 137.6181640625, 141.25]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 18.0, 65.0, 218.0, 442.0, 170.0, 53.0, 19.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.0, -68.2021484375, -65.404296875, -62.6064453125, -59.80859375, -57.0107421875, -54.212890625, -51.4150390625, -48.6171875, -45.8193359375, -43.021484375, -40.2236328125, -37.42578125, -34.6279296875, -31.830078125, -29.0322265625, -26.234375, -23.4365234375, -20.638671875, -17.8408203125, -15.04296875, -12.2451171875, -9.447265625, -6.6494140625, -3.8515625, -1.0537109375, 1.744140625, 4.5419921875, 7.33984375, 10.1376953125, 12.935546875, 15.7333984375, 18.53125, 21.3291015625, 24.126953125, 26.9248046875, 29.72265625, 32.5205078125, 35.318359375, 38.1162109375, 40.9140625, 43.7119140625, 46.509765625, 49.3076171875, 52.10546875, 54.9033203125, 57.701171875, 60.4990234375, 63.296875, 66.0947265625, 68.892578125, 71.6904296875, 74.48828125, 77.2861328125, 80.083984375, 82.8818359375, 85.6796875, 88.4775390625, 91.275390625, 94.0732421875, 96.87109375, 99.6689453125, 102.466796875, 105.2646484375, 108.0625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 8.0, 18.0, 45.0, 102.0, 193.0, 253.0, 186.0, 105.0, 41.0, 18.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-659.4761352539062, -643.8617553710938, -628.2474365234375, -612.633056640625, -597.0186767578125, -581.4043579101562, -565.7899780273438, -550.1756591796875, -534.561279296875, -518.9468994140625, -503.33258056640625, -487.71820068359375, -472.1038513183594, -456.489501953125, -440.8751220703125, -425.2607727050781, -409.64642333984375, -394.0320739746094, -378.417724609375, -362.8033447265625, -347.1889953613281, -331.57464599609375, -315.96026611328125, -300.3459167480469, -284.7315673828125, -269.1172180175781, -253.5028533935547, -237.88848876953125, -222.27413940429688, -206.6597900390625, -191.04542541503906, -175.43106079101562, -159.81668090820312, -144.20233154296875, -128.5879669189453, -112.9736099243164, -97.3592529296875, -81.7448959350586, -66.13053894042969, -50.51618194580078, -34.901824951171875, -19.28746795654297, -3.6731109619140625, 11.941246032714844, 27.55560302734375, 43.169960021972656, 58.78431701660156, 74.39867401123047, 90.01303100585938, 105.62738800048828, 121.24174499511719, 136.85610961914062, 152.470458984375, 168.08480834960938, 183.6991729736328, 199.31353759765625, 214.92788696289062, 230.542236328125, 246.15660095214844, 261.7709655761719, 277.38531494140625, 292.9996643066406, 308.614013671875, 324.2283935546875, 339.8427429199219]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 6.0, 8.0, 7.0, 16.0, 21.0, 21.0, 30.0, 25.0, 25.0, 16.0, 28.0, 32.0, 35.0, 38.0, 33.0, 37.0, 57.0, 31.0, 41.0, 42.0, 49.0, 38.0, 37.0, 31.0, 27.0, 44.0, 31.0, 23.0, 26.0, 13.0, 17.0, 12.0, 11.0, 11.0, 10.0, 8.0, 9.0, 6.0, 4.0, 7.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-187.11695861816406, -181.2986602783203, -175.48036193847656, -169.6620635986328, -163.84376525878906, -158.02545166015625, -152.2071533203125, -146.38885498046875, -140.570556640625, -134.75225830078125, -128.9339599609375, -123.11566162109375, -117.29735565185547, -111.47905731201172, -105.66075897216797, -99.84245300292969, -94.02416229248047, -88.20586395263672, -82.38756561279297, -76.56925964355469, -70.75096130371094, -64.93266296386719, -59.11436462402344, -53.29606246948242, -47.47776412963867, -41.65946578979492, -35.841163635253906, -30.022865295410156, -24.204565048217773, -18.38626480102539, -12.56796646118164, -6.749664306640625, -0.931365966796875, 4.88693380355835, 10.705233573913574, 16.52353286743164, 22.341833114624023, 28.160133361816406, 33.978431701660156, 39.79673385620117, 45.61503219604492, 51.43333053588867, 57.25163269042969, 63.06993103027344, 68.88822937011719, 74.70652770996094, 80.52482604980469, 86.34313201904297, 92.16143035888672, 97.97972869873047, 103.79802703857422, 109.6163330078125, 115.43463134765625, 121.2529296875, 127.07122802734375, 132.8895263671875, 138.70782470703125, 144.526123046875, 150.34442138671875, 156.1627197265625, 161.98101806640625, 167.79931640625, 173.61761474609375, 179.43592834472656, 185.2542266845703]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 11.0, 9.0, 31.0, 23.0, 33.0, 65.0, 85.0, 116.0, 182.0, 341.0, 590.0, 981.0, 1877.0, 4013.0, 9958.0, 30160.0, 135695.0, 3551966.0, 374220.0, 55607.0, 15965.0, 6255.0, 2768.0, 1377.0, 765.0, 420.0, 255.0, 175.0, 108.0, 78.0, 44.0, 30.0, 17.0, 16.0, 14.0, 9.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.625, -44.3828125, -43.140625, -41.8984375, -40.65625, -39.4140625, -38.171875, -36.9296875, -35.6875, -34.4453125, -33.203125, -31.9609375, -30.71875, -29.4765625, -28.234375, -26.9921875, -25.75, -24.5078125, -23.265625, -22.0234375, -20.78125, -19.5390625, -18.296875, -17.0546875, -15.8125, -14.5703125, -13.328125, -12.0859375, -10.84375, -9.6015625, -8.359375, -7.1171875, -5.875, -4.6328125, -3.390625, -2.1484375, -0.90625, 0.3359375, 1.578125, 2.8203125, 4.0625, 5.3046875, 6.546875, 7.7890625, 9.03125, 10.2734375, 11.515625, 12.7578125, 14.0, 15.2421875, 16.484375, 17.7265625, 18.96875, 20.2109375, 21.453125, 22.6953125, 23.9375, 25.1796875, 26.421875, 27.6640625, 28.90625, 30.1484375, 31.390625, 32.6328125, 33.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 11.0, 12.0, 25.0, 32.0, 31.0, 32.0, 51.0, 46.0, 55.0, 67.0, 69.0, 49.0, 62.0, 55.0, 63.0, 62.0, 37.0, 38.0, 38.0, 37.0, 19.0, 19.0, 21.0, 14.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-14.21875, -13.8536376953125, -13.488525390625, -13.1234130859375, -12.75830078125, -12.3931884765625, -12.028076171875, -11.6629638671875, -11.2978515625, -10.9327392578125, -10.567626953125, -10.2025146484375, -9.83740234375, -9.4722900390625, -9.107177734375, -8.7420654296875, -8.376953125, -8.0118408203125, -7.646728515625, -7.2816162109375, -6.91650390625, -6.5513916015625, -6.186279296875, -5.8211669921875, -5.4560546875, -5.0909423828125, -4.725830078125, -4.3607177734375, -3.99560546875, -3.6304931640625, -3.265380859375, -2.9002685546875, -2.53515625, -2.1700439453125, -1.804931640625, -1.4398193359375, -1.07470703125, -0.7095947265625, -0.344482421875, 0.0206298828125, 0.3857421875, 0.7508544921875, 1.115966796875, 1.4810791015625, 1.84619140625, 2.2113037109375, 2.576416015625, 2.9415283203125, 3.306640625, 3.6717529296875, 4.036865234375, 4.4019775390625, 4.76708984375, 5.1322021484375, 5.497314453125, 5.8624267578125, 6.2275390625, 6.5926513671875, 6.957763671875, 7.3228759765625, 7.68798828125, 8.0531005859375, 8.418212890625, 8.7833251953125, 9.1484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 11.0, 7.0, 9.0, 14.0, 28.0, 22.0, 35.0, 64.0, 62.0, 138.0, 202.0, 347.0, 614.0, 1097.0, 1946.0, 4372.0, 9326.0, 24470.0, 84703.0, 739471.0, 3137531.0, 134055.0, 32963.0, 11955.0, 5282.0, 2443.0, 1250.0, 698.0, 424.0, 238.0, 156.0, 123.0, 65.0, 44.0, 31.0, 26.0, 17.0, 11.0, 9.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-35.28125, -34.18359375, -33.0859375, -31.98828125, -30.890625, -29.79296875, -28.6953125, -27.59765625, -26.5, -25.40234375, -24.3046875, -23.20703125, -22.109375, -21.01171875, -19.9140625, -18.81640625, -17.71875, -16.62109375, -15.5234375, -14.42578125, -13.328125, -12.23046875, -11.1328125, -10.03515625, -8.9375, -7.83984375, -6.7421875, -5.64453125, -4.546875, -3.44921875, -2.3515625, -1.25390625, -0.15625, 0.94140625, 2.0390625, 3.13671875, 4.234375, 5.33203125, 6.4296875, 7.52734375, 8.625, 9.72265625, 10.8203125, 11.91796875, 13.015625, 14.11328125, 15.2109375, 16.30859375, 17.40625, 18.50390625, 19.6015625, 20.69921875, 21.796875, 22.89453125, 23.9921875, 25.08984375, 26.1875, 27.28515625, 28.3828125, 29.48046875, 30.578125, 31.67578125, 32.7734375, 33.87109375, 34.96875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 5.0, 2.0, 10.0, 8.0, 7.0, 17.0, 31.0, 28.0, 45.0, 77.0, 104.0, 210.0, 532.0, 2063.0, 440.0, 204.0, 109.0, 39.0, 43.0, 22.0, 21.0, 14.0, 8.0, 11.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.250244140625, -11.70361328125, -11.156982421875, -10.6103515625, -10.063720703125, -9.51708984375, -8.970458984375, -8.423828125, -7.877197265625, -7.33056640625, -6.783935546875, -6.2373046875, -5.690673828125, -5.14404296875, -4.597412109375, -4.05078125, -3.504150390625, -2.95751953125, -2.410888671875, -1.8642578125, -1.317626953125, -0.77099609375, -0.224365234375, 0.322265625, 0.868896484375, 1.41552734375, 1.962158203125, 2.5087890625, 3.055419921875, 3.60205078125, 4.148681640625, 4.6953125, 5.241943359375, 5.78857421875, 6.335205078125, 6.8818359375, 7.428466796875, 7.97509765625, 8.521728515625, 9.068359375, 9.614990234375, 10.16162109375, 10.708251953125, 11.2548828125, 11.801513671875, 12.34814453125, 12.894775390625, 13.44140625, 13.988037109375, 14.53466796875, 15.081298828125, 15.6279296875, 16.174560546875, 16.72119140625, 17.267822265625, 17.814453125, 18.361083984375, 18.90771484375, 19.454345703125, 20.0009765625, 20.547607421875, 21.09423828125, 21.640869140625, 22.1875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 14.0, 21.0, 49.0, 121.0, 210.0, 242.0, 184.0, 99.0, 31.0, 20.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.40354919433594, -69.8218765258789, -64.24019622802734, -58.65852355957031, -53.076847076416016, -47.49517059326172, -41.91349792480469, -36.33182144165039, -30.750144958496094, -25.168468475341797, -19.586793899536133, -14.005119323730469, -8.423442840576172, -2.841766357421875, 2.7399063110351562, 8.321582794189453, 13.90325927734375, 19.484935760498047, 25.06661033630371, 30.648284912109375, 36.22996139526367, 41.81163787841797, 47.393310546875, 52.9749870300293, 58.556663513183594, 64.13833618164062, 69.72001647949219, 75.30168914794922, 80.88336181640625, 86.46504211425781, 92.04671478271484, 97.62838745117188, 103.2100830078125, 108.79175567626953, 114.3734359741211, 119.95510864257812, 125.53678894042969, 131.11846923828125, 136.70013427734375, 142.2818145751953, 147.86349487304688, 153.44517517089844, 159.02684020996094, 164.6085205078125, 170.19020080566406, 175.77188110351562, 181.35354614257812, 186.9352264404297, 192.5168914794922, 198.09857177734375, 203.68023681640625, 209.2619171142578, 214.84359741210938, 220.42526245117188, 226.00694274902344, 231.588623046875, 237.1702880859375, 242.75196838378906, 248.33363342285156, 253.91531372070312, 259.4969787597656, 265.07867431640625, 270.66033935546875, 276.24200439453125, 281.8236999511719]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 9.0, 6.0, 17.0, 10.0, 26.0, 23.0, 29.0, 27.0, 35.0, 27.0, 54.0, 60.0, 46.0, 59.0, 66.0, 69.0, 55.0, 53.0, 61.0, 52.0, 35.0, 32.0, 33.0, 22.0, 28.0, 15.0, 8.0, 14.0, 8.0, 9.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.08144760131836, -59.02811050415039, -56.97477340698242, -54.92143630981445, -52.86809539794922, -50.81475830078125, -48.76142120361328, -46.70808410644531, -44.654747009277344, -42.601409912109375, -40.548072814941406, -38.49473571777344, -36.44139862060547, -34.3880615234375, -32.334720611572266, -30.281383514404297, -28.228046417236328, -26.17470932006836, -24.12137222290039, -22.06803321838379, -20.01469612121582, -17.96135902404785, -15.908020973205566, -13.854682922363281, -11.801345825195312, -9.748008728027344, -7.694670677185059, -5.641333103179932, -3.5879955291748047, -1.534658432006836, 0.5186796188354492, 2.5720176696777344, 4.6253509521484375, 6.6786885261535645, 8.732026100158691, 10.785364151000977, 12.838701248168945, 14.892038345336914, 16.945377349853516, 18.998714447021484, 21.052051544189453, 23.105388641357422, 25.15872573852539, 27.212064743041992, 29.26540184020996, 31.31873893737793, 33.37207794189453, 35.4254150390625, 37.47875213623047, 39.53208923339844, 41.585426330566406, 43.638763427734375, 45.692100524902344, 47.74543762207031, 49.79877853393555, 51.852115631103516, 53.905452728271484, 55.95878982543945, 58.01212692260742, 60.06546401977539, 62.118804931640625, 64.1721420288086, 66.22547912597656, 68.27881622314453, 70.3321533203125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 10.0, 6.0, 19.0, 12.0, 30.0, 51.0, 83.0, 134.0, 221.0, 502.0, 1291.0, 3735.0, 13431.0, 60152.0, 322403.0, 515341.0, 101281.0, 21154.0, 5516.0, 1782.0, 653.0, 311.0, 151.0, 86.0, 54.0, 44.0, 30.0, 21.0, 8.0, 6.0, 10.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.3125, -53.64453125, -51.9765625, -50.30859375, -48.640625, -46.97265625, -45.3046875, -43.63671875, -41.96875, -40.30078125, -38.6328125, -36.96484375, -35.296875, -33.62890625, -31.9609375, -30.29296875, -28.625, -26.95703125, -25.2890625, -23.62109375, -21.953125, -20.28515625, -18.6171875, -16.94921875, -15.28125, -13.61328125, -11.9453125, -10.27734375, -8.609375, -6.94140625, -5.2734375, -3.60546875, -1.9375, -0.26953125, 1.3984375, 3.06640625, 4.734375, 6.40234375, 8.0703125, 9.73828125, 11.40625, 13.07421875, 14.7421875, 16.41015625, 18.078125, 19.74609375, 21.4140625, 23.08203125, 24.75, 26.41796875, 28.0859375, 29.75390625, 31.421875, 33.08984375, 34.7578125, 36.42578125, 38.09375, 39.76171875, 41.4296875, 43.09765625, 44.765625, 46.43359375, 48.1015625, 49.76953125, 51.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 7.0, 9.0, 9.0, 16.0, 22.0, 22.0, 33.0, 41.0, 45.0, 51.0, 48.0, 60.0, 68.0, 66.0, 57.0, 65.0, 65.0, 46.0, 48.0, 49.0, 33.0, 24.0, 21.0, 23.0, 20.0, 10.0, 11.0, 10.0, 5.0, 6.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.4453125, -14.0758056640625, -13.706298828125, -13.3367919921875, -12.96728515625, -12.5977783203125, -12.228271484375, -11.8587646484375, -11.4892578125, -11.1197509765625, -10.750244140625, -10.3807373046875, -10.01123046875, -9.6417236328125, -9.272216796875, -8.9027099609375, -8.533203125, -8.1636962890625, -7.794189453125, -7.4246826171875, -7.05517578125, -6.6856689453125, -6.316162109375, -5.9466552734375, -5.5771484375, -5.2076416015625, -4.838134765625, -4.4686279296875, -4.09912109375, -3.7296142578125, -3.360107421875, -2.9906005859375, -2.62109375, -2.2515869140625, -1.882080078125, -1.5125732421875, -1.14306640625, -0.7735595703125, -0.404052734375, -0.0345458984375, 0.3349609375, 0.7044677734375, 1.073974609375, 1.4434814453125, 1.81298828125, 2.1824951171875, 2.552001953125, 2.9215087890625, 3.291015625, 3.6605224609375, 4.030029296875, 4.3995361328125, 4.76904296875, 5.1385498046875, 5.508056640625, 5.8775634765625, 6.2470703125, 6.6165771484375, 6.986083984375, 7.3555908203125, 7.72509765625, 8.0946044921875, 8.464111328125, 8.8336181640625, 9.203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 10.0, 15.0, 15.0, 20.0, 29.0, 51.0, 95.0, 134.0, 233.0, 433.0, 924.0, 2253.0, 7380.0, 34283.0, 228244.0, 636665.0, 110562.0, 19248.0, 4723.0, 1625.0, 727.0, 353.0, 200.0, 118.0, 67.0, 53.0, 28.0, 21.0, 9.0, 9.0, 4.0, 7.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.375, -44.677734375, -42.98046875, -41.283203125, -39.5859375, -37.888671875, -36.19140625, -34.494140625, -32.796875, -31.099609375, -29.40234375, -27.705078125, -26.0078125, -24.310546875, -22.61328125, -20.916015625, -19.21875, -17.521484375, -15.82421875, -14.126953125, -12.4296875, -10.732421875, -9.03515625, -7.337890625, -5.640625, -3.943359375, -2.24609375, -0.548828125, 1.1484375, 2.845703125, 4.54296875, 6.240234375, 7.9375, 9.634765625, 11.33203125, 13.029296875, 14.7265625, 16.423828125, 18.12109375, 19.818359375, 21.515625, 23.212890625, 24.91015625, 26.607421875, 28.3046875, 30.001953125, 31.69921875, 33.396484375, 35.09375, 36.791015625, 38.48828125, 40.185546875, 41.8828125, 43.580078125, 45.27734375, 46.974609375, 48.671875, 50.369140625, 52.06640625, 53.763671875, 55.4609375, 57.158203125, 58.85546875, 60.552734375, 62.25]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 5.0, 11.0, 12.0, 18.0, 29.0, 17.0, 36.0, 45.0, 45.0, 54.0, 64.0, 71.0, 71.0, 69.0, 55.0, 66.0, 51.0, 47.0, 41.0, 44.0, 29.0, 32.0, 21.0, 13.0, 14.0, 10.0, 8.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.93359375, -49.3046875, -47.67578125, -46.046875, -44.41796875, -42.7890625, -41.16015625, -39.53125, -37.90234375, -36.2734375, -34.64453125, -33.015625, -31.38671875, -29.7578125, -28.12890625, -26.5, -24.87109375, -23.2421875, -21.61328125, -19.984375, -18.35546875, -16.7265625, -15.09765625, -13.46875, -11.83984375, -10.2109375, -8.58203125, -6.953125, -5.32421875, -3.6953125, -2.06640625, -0.4375, 1.19140625, 2.8203125, 4.44921875, 6.078125, 7.70703125, 9.3359375, 10.96484375, 12.59375, 14.22265625, 15.8515625, 17.48046875, 19.109375, 20.73828125, 22.3671875, 23.99609375, 25.625, 27.25390625, 28.8828125, 30.51171875, 32.140625, 33.76953125, 35.3984375, 37.02734375, 38.65625, 40.28515625, 41.9140625, 43.54296875, 45.171875, 46.80078125, 48.4296875, 50.05859375, 51.6875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 7.0, 14.0, 18.0, 38.0, 54.0, 154.0, 452.0, 2172.0, 19028.0, 591082.0, 418289.0, 14704.0, 1882.0, 385.0, 142.0, 67.0, 33.0, 18.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.109375, -18.989013671875, -17.86865234375, -16.748291015625, -15.6279296875, -14.507568359375, -13.38720703125, -12.266845703125, -11.146484375, -10.026123046875, -8.90576171875, -7.785400390625, -6.6650390625, -5.544677734375, -4.42431640625, -3.303955078125, -2.18359375, -1.063232421875, 0.05712890625, 1.177490234375, 2.2978515625, 3.418212890625, 4.53857421875, 5.658935546875, 6.779296875, 7.899658203125, 9.02001953125, 10.140380859375, 11.2607421875, 12.381103515625, 13.50146484375, 14.621826171875, 15.7421875, 16.862548828125, 17.98291015625, 19.103271484375, 20.2236328125, 21.343994140625, 22.46435546875, 23.584716796875, 24.705078125, 25.825439453125, 26.94580078125, 28.066162109375, 29.1865234375, 30.306884765625, 31.42724609375, 32.547607421875, 33.66796875, 34.788330078125, 35.90869140625, 37.029052734375, 38.1494140625, 39.269775390625, 40.39013671875, 41.510498046875, 42.630859375, 43.751220703125, 44.87158203125, 45.991943359375, 47.1123046875, 48.232666015625, 49.35302734375, 50.473388671875, 51.59375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 7.0, 14.0, 12.0, 12.0, 22.0, 35.0, 52.0, 68.0, 131.0, 186.0, 173.0, 100.0, 52.0, 38.0, 20.0, 14.0, 12.0, 6.0, 7.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036163330078125, -0.0035153627395629883, -0.0034143924713134766, -0.003313422203063965, -0.003212451934814453, -0.0031114816665649414, -0.0030105113983154297, -0.002909541130065918, -0.0028085708618164062, -0.0027076005935668945, -0.002606630325317383, -0.002505660057067871, -0.0024046897888183594, -0.0023037195205688477, -0.002202749252319336, -0.0021017789840698242, -0.0020008087158203125, -0.0018998384475708008, -0.001798868179321289, -0.0016978979110717773, -0.0015969276428222656, -0.001495957374572754, -0.0013949871063232422, -0.0012940168380737305, -0.0011930465698242188, -0.001092076301574707, -0.0009911060333251953, -0.0008901357650756836, -0.0007891654968261719, -0.0006881952285766602, -0.0005872249603271484, -0.0004862546920776367, -0.000385284423828125, -0.0002843141555786133, -0.00018334388732910156, -8.237361907958984e-05, 1.8596649169921875e-05, 0.0001195669174194336, 0.0002205371856689453, 0.00032150745391845703, 0.00042247772216796875, 0.0005234479904174805, 0.0006244182586669922, 0.0007253885269165039, 0.0008263587951660156, 0.0009273290634155273, 0.001028299331665039, 0.0011292695999145508, 0.0012302398681640625, 0.0013312101364135742, 0.001432180404663086, 0.0015331506729125977, 0.0016341209411621094, 0.001735091209411621, 0.0018360614776611328, 0.0019370317459106445, 0.0020380020141601562, 0.002138972282409668, 0.0022399425506591797, 0.0023409128189086914, 0.002441883087158203, 0.002542853355407715, 0.0026438236236572266, 0.0027447938919067383, 0.00284576416015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 17.0, 30.0, 44.0, 68.0, 132.0, 254.0, 723.0, 3066.0, 28442.0, 680764.0, 317174.0, 14690.0, 2077.0, 584.0, 223.0, 106.0, 65.0, 33.0, 22.0, 11.0, 11.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.03125, -37.123046875, -36.21484375, -35.306640625, -34.3984375, -33.490234375, -32.58203125, -31.673828125, -30.765625, -29.857421875, -28.94921875, -28.041015625, -27.1328125, -26.224609375, -25.31640625, -24.408203125, -23.5, -22.591796875, -21.68359375, -20.775390625, -19.8671875, -18.958984375, -18.05078125, -17.142578125, -16.234375, -15.326171875, -14.41796875, -13.509765625, -12.6015625, -11.693359375, -10.78515625, -9.876953125, -8.96875, -8.060546875, -7.15234375, -6.244140625, -5.3359375, -4.427734375, -3.51953125, -2.611328125, -1.703125, -0.794921875, 0.11328125, 1.021484375, 1.9296875, 2.837890625, 3.74609375, 4.654296875, 5.5625, 6.470703125, 7.37890625, 8.287109375, 9.1953125, 10.103515625, 11.01171875, 11.919921875, 12.828125, 13.736328125, 14.64453125, 15.552734375, 16.4609375, 17.369140625, 18.27734375, 19.185546875, 20.09375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 10.0, 6.0, 18.0, 26.0, 49.0, 66.0, 102.0, 161.0, 193.0, 131.0, 93.0, 44.0, 37.0, 19.0, 15.0, 13.0, 10.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.59375, -26.907958984375, -26.22216796875, -25.536376953125, -24.8505859375, -24.164794921875, -23.47900390625, -22.793212890625, -22.107421875, -21.421630859375, -20.73583984375, -20.050048828125, -19.3642578125, -18.678466796875, -17.99267578125, -17.306884765625, -16.62109375, -15.935302734375, -15.24951171875, -14.563720703125, -13.8779296875, -13.192138671875, -12.50634765625, -11.820556640625, -11.134765625, -10.448974609375, -9.76318359375, -9.077392578125, -8.3916015625, -7.705810546875, -7.02001953125, -6.334228515625, -5.6484375, -4.962646484375, -4.27685546875, -3.591064453125, -2.9052734375, -2.219482421875, -1.53369140625, -0.847900390625, -0.162109375, 0.523681640625, 1.20947265625, 1.895263671875, 2.5810546875, 3.266845703125, 3.95263671875, 4.638427734375, 5.32421875, 6.010009765625, 6.69580078125, 7.381591796875, 8.0673828125, 8.753173828125, 9.43896484375, 10.124755859375, 10.810546875, 11.496337890625, 12.18212890625, 12.867919921875, 13.5537109375, 14.239501953125, 14.92529296875, 15.611083984375, 16.296875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 24.0, 38.0, 68.0, 129.0, 157.0, 188.0, 133.0, 116.0, 63.0, 33.0, 19.0, 11.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-307.7582092285156, -297.3272399902344, -286.8962707519531, -276.4653015136719, -266.0343322753906, -255.60336303710938, -245.17239379882812, -234.74142456054688, -224.31045532226562, -213.87948608398438, -203.44851684570312, -193.01754760742188, -182.58657836914062, -172.15560913085938, -161.72463989257812, -151.29367065429688, -140.86270141601562, -130.43173217773438, -120.00076293945312, -109.56979370117188, -99.13882446289062, -88.70785522460938, -78.27688598632812, -67.84591674804688, -57.414947509765625, -46.983978271484375, -36.553009033203125, -26.122039794921875, -15.691070556640625, -5.260101318359375, 5.170867919921875, 15.601837158203125, 26.03277587890625, 36.4637451171875, 46.89471435546875, 57.32568359375, 67.75665283203125, 78.1876220703125, 88.61859130859375, 99.049560546875, 109.48052978515625, 119.9114990234375, 130.34246826171875, 140.7734375, 151.20440673828125, 161.6353759765625, 172.06634521484375, 182.497314453125, 192.92828369140625, 203.3592529296875, 213.79022216796875, 224.22119140625, 234.65216064453125, 245.0831298828125, 255.51409912109375, 265.945068359375, 276.37603759765625, 286.8070068359375, 297.23797607421875, 307.6689453125, 318.09991455078125, 328.5308837890625, 338.96185302734375, 349.392822265625, 359.82379150390625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 9.0, 5.0, 10.0, 12.0, 17.0, 14.0, 24.0, 22.0, 30.0, 30.0, 22.0, 24.0, 44.0, 36.0, 47.0, 30.0, 36.0, 60.0, 42.0, 41.0, 36.0, 52.0, 44.0, 39.0, 37.0, 35.0, 32.0, 32.0, 20.0, 21.0, 14.0, 12.0, 15.0, 12.0, 9.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.6598358154297, -173.86297607421875, -168.0661163330078, -162.26925659179688, -156.47238159179688, -150.67552185058594, -144.878662109375, -139.08180236816406, -133.28494262695312, -127.48808288574219, -121.69121551513672, -115.89435577392578, -110.09748840332031, -104.30062866210938, -98.50376892089844, -92.7069091796875, -86.9100341796875, -81.11317443847656, -75.3163070678711, -69.51944732666016, -63.72258377075195, -57.92572021484375, -52.12886047363281, -46.33199691772461, -40.535133361816406, -34.7382698059082, -28.941408157348633, -23.144546508789062, -17.34768295288086, -11.550819396972656, -5.753959655761719, 0.042903900146484375, 5.839752197265625, 11.636614799499512, 17.4334774017334, 23.23033905029297, 29.027202606201172, 34.824066162109375, 40.62092590332031, 46.417789459228516, 52.21465301513672, 58.01151657104492, 63.808380126953125, 69.60523986816406, 75.402099609375, 81.19896697998047, 86.9958267211914, 92.79269409179688, 98.58955383300781, 104.38641357421875, 110.18328094482422, 115.98014068603516, 121.77700805664062, 127.57386779785156, 133.3707275390625, 139.16758728027344, 144.96444702148438, 150.7613067626953, 156.55816650390625, 162.35504150390625, 168.1519012451172, 173.94876098632812, 179.74562072753906, 185.54248046875, 191.33935546875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 12.0, 8.0, 16.0, 22.0, 44.0, 85.0, 101.0, 226.0, 368.0, 659.0, 1319.0, 2804.0, 6867.0, 20738.0, 91201.0, 3724271.0, 285390.0, 40111.0, 11658.0, 4335.0, 1941.0, 941.0, 481.0, 271.0, 153.0, 87.0, 56.0, 39.0, 26.0, 10.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.125, -46.255859375, -44.38671875, -42.517578125, -40.6484375, -38.779296875, -36.91015625, -35.041015625, -33.171875, -31.302734375, -29.43359375, -27.564453125, -25.6953125, -23.826171875, -21.95703125, -20.087890625, -18.21875, -16.349609375, -14.48046875, -12.611328125, -10.7421875, -8.873046875, -7.00390625, -5.134765625, -3.265625, -1.396484375, 0.47265625, 2.341796875, 4.2109375, 6.080078125, 7.94921875, 9.818359375, 11.6875, 13.556640625, 15.42578125, 17.294921875, 19.1640625, 21.033203125, 22.90234375, 24.771484375, 26.640625, 28.509765625, 30.37890625, 32.248046875, 34.1171875, 35.986328125, 37.85546875, 39.724609375, 41.59375, 43.462890625, 45.33203125, 47.201171875, 49.0703125, 50.939453125, 52.80859375, 54.677734375, 56.546875, 58.416015625, 60.28515625, 62.154296875, 64.0234375, 65.892578125, 67.76171875, 69.630859375, 71.5]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 6.0, 11.0, 8.0, 12.0, 11.0, 13.0, 19.0, 16.0, 26.0, 39.0, 42.0, 47.0, 37.0, 57.0, 60.0, 63.0, 47.0, 57.0, 49.0, 48.0, 46.0, 39.0, 49.0, 37.0, 26.0, 23.0, 21.0, 21.0, 15.0, 13.0, 10.0, 6.0, 5.0, 7.0, 2.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-13.28125, -12.9296875, -12.578125, -12.2265625, -11.875, -11.5234375, -11.171875, -10.8203125, -10.46875, -10.1171875, -9.765625, -9.4140625, -9.0625, -8.7109375, -8.359375, -8.0078125, -7.65625, -7.3046875, -6.953125, -6.6015625, -6.25, -5.8984375, -5.546875, -5.1953125, -4.84375, -4.4921875, -4.140625, -3.7890625, -3.4375, -3.0859375, -2.734375, -2.3828125, -2.03125, -1.6796875, -1.328125, -0.9765625, -0.625, -0.2734375, 0.078125, 0.4296875, 0.78125, 1.1328125, 1.484375, 1.8359375, 2.1875, 2.5390625, 2.890625, 3.2421875, 3.59375, 3.9453125, 4.296875, 4.6484375, 5.0, 5.3515625, 5.703125, 6.0546875, 6.40625, 6.7578125, 7.109375, 7.4609375, 7.8125, 8.1640625, 8.515625, 8.8671875, 9.21875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 4.0, 4.0, 10.0, 5.0, 11.0, 8.0, 20.0, 17.0, 31.0, 35.0, 73.0, 86.0, 151.0, 227.0, 306.0, 543.0, 1083.0, 2347.0, 6281.0, 21723.0, 124652.0, 3699765.0, 283818.0, 37140.0, 9272.0, 3271.0, 1431.0, 789.0, 410.0, 242.0, 150.0, 127.0, 78.0, 50.0, 42.0, 23.0, 18.0, 13.0, 10.0, 5.0, 6.0, 7.0, 3.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.529296875, -43.68359375, -41.837890625, -39.9921875, -38.146484375, -36.30078125, -34.455078125, -32.609375, -30.763671875, -28.91796875, -27.072265625, -25.2265625, -23.380859375, -21.53515625, -19.689453125, -17.84375, -15.998046875, -14.15234375, -12.306640625, -10.4609375, -8.615234375, -6.76953125, -4.923828125, -3.078125, -1.232421875, 0.61328125, 2.458984375, 4.3046875, 6.150390625, 7.99609375, 9.841796875, 11.6875, 13.533203125, 15.37890625, 17.224609375, 19.0703125, 20.916015625, 22.76171875, 24.607421875, 26.453125, 28.298828125, 30.14453125, 31.990234375, 33.8359375, 35.681640625, 37.52734375, 39.373046875, 41.21875, 43.064453125, 44.91015625, 46.755859375, 48.6015625, 50.447265625, 52.29296875, 54.138671875, 55.984375, 57.830078125, 59.67578125, 61.521484375, 63.3671875, 65.212890625, 67.05859375, 68.904296875, 70.75]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 5.0, 12.0, 51.0, 76.0, 175.0, 558.0, 2640.0, 276.0, 121.0, 61.0, 26.0, 23.0, 15.0, 9.0, 4.0, 3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -21.831298828125, -20.80322265625, -19.775146484375, -18.7470703125, -17.718994140625, -16.69091796875, -15.662841796875, -14.634765625, -13.606689453125, -12.57861328125, -11.550537109375, -10.5224609375, -9.494384765625, -8.46630859375, -7.438232421875, -6.41015625, -5.382080078125, -4.35400390625, -3.325927734375, -2.2978515625, -1.269775390625, -0.24169921875, 0.786376953125, 1.814453125, 2.842529296875, 3.87060546875, 4.898681640625, 5.9267578125, 6.954833984375, 7.98291015625, 9.010986328125, 10.0390625, 11.067138671875, 12.09521484375, 13.123291015625, 14.1513671875, 15.179443359375, 16.20751953125, 17.235595703125, 18.263671875, 19.291748046875, 20.31982421875, 21.347900390625, 22.3759765625, 23.404052734375, 24.43212890625, 25.460205078125, 26.48828125, 27.516357421875, 28.54443359375, 29.572509765625, 30.6005859375, 31.628662109375, 32.65673828125, 33.684814453125, 34.712890625, 35.740966796875, 36.76904296875, 37.797119140625, 38.8251953125, 39.853271484375, 40.88134765625, 41.909423828125, 42.9375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 17.0, 21.0, 39.0, 96.0, 188.0, 267.0, 208.0, 97.0, 28.0, 27.0, 8.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.31983947753906, -77.1464614868164, -70.97308349609375, -64.79971313476562, -58.6263313293457, -52.45295333862305, -46.279579162597656, -40.106201171875, -33.932823181152344, -27.759445190429688, -21.586069107055664, -15.41269302368164, -9.239315032958984, -3.065937042236328, 3.1074371337890625, 9.280815124511719, 15.454193115234375, 21.62757110595703, 27.800947189331055, 33.97432327270508, 40.147701263427734, 46.32107925415039, 52.49445343017578, 58.66783142089844, 64.8412094116211, 71.01458740234375, 77.1879653930664, 83.36134338378906, 89.53471374511719, 95.70809936523438, 101.8814697265625, 108.05484771728516, 114.22821044921875, 120.4015884399414, 126.57496643066406, 132.7483367919922, 138.92172241210938, 145.0950927734375, 151.26846313476562, 157.4418487548828, 163.615234375, 169.78860473632812, 175.9619903564453, 182.13536071777344, 188.30874633789062, 194.48211669921875, 200.65548706054688, 206.82887268066406, 213.0022430419922, 219.1756134033203, 225.3489990234375, 231.52236938476562, 237.6957550048828, 243.86912536621094, 250.04251098632812, 256.21588134765625, 262.3892517089844, 268.5626220703125, 274.7359924316406, 280.9093933105469, 287.082763671875, 293.2561340332031, 299.42950439453125, 305.6029052734375, 311.7762756347656]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 9.0, 11.0, 16.0, 28.0, 25.0, 43.0, 27.0, 43.0, 46.0, 50.0, 48.0, 52.0, 60.0, 67.0, 68.0, 62.0, 57.0, 54.0, 40.0, 40.0, 33.0, 34.0, 21.0, 10.0, 8.0, 6.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-79.67032623291016, -77.08490753173828, -74.49949645996094, -71.91407775878906, -69.32865905761719, -66.74324035644531, -64.15782165527344, -61.572410583496094, -58.98699188232422, -56.401573181152344, -53.816158294677734, -51.230743408203125, -48.64532470703125, -46.059906005859375, -43.474491119384766, -40.889076232910156, -38.30365753173828, -35.718238830566406, -33.1328239440918, -30.547407150268555, -27.961990356445312, -25.37657356262207, -22.791156768798828, -20.205739974975586, -17.620323181152344, -15.034906387329102, -12.44948959350586, -9.864072799682617, -7.278656005859375, -4.693239212036133, -2.1078224182128906, 0.47759437561035156, 3.063018798828125, 5.648435592651367, 8.23385238647461, 10.819269180297852, 13.404685974121094, 15.990102767944336, 18.575519561767578, 21.16093635559082, 23.746353149414062, 26.331769943237305, 28.917186737060547, 31.50260353088379, 34.08802032470703, 36.673439025878906, 39.258853912353516, 41.844268798828125, 44.4296875, 47.015106201171875, 49.600521087646484, 52.185935974121094, 54.77135467529297, 57.356773376464844, 59.94218826293945, 62.52760314941406, 65.11302185058594, 67.69844055175781, 70.28385925292969, 72.86927032470703, 75.4546890258789, 78.04010772705078, 80.62551879882812, 83.2109375, 85.79635620117188]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 12.0, 20.0, 14.0, 14.0, 36.0, 66.0, 51.0, 109.0, 181.0, 272.0, 418.0, 703.0, 1067.0, 1724.0, 2995.0, 4961.0, 8674.0, 15564.0, 29308.0, 55707.0, 108213.0, 204782.0, 274999.0, 159669.0, 83656.0, 43175.0, 22577.0, 12143.0, 6952.0, 4060.0, 2492.0, 1466.0, 879.0, 548.0, 343.0, 229.0, 146.0, 102.0, 59.0, 56.0, 28.0, 19.0, 20.0, 17.0, 3.0, 4.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.1875, -28.283935546875, -27.38037109375, -26.476806640625, -25.5732421875, -24.669677734375, -23.76611328125, -22.862548828125, -21.958984375, -21.055419921875, -20.15185546875, -19.248291015625, -18.3447265625, -17.441162109375, -16.53759765625, -15.634033203125, -14.73046875, -13.826904296875, -12.92333984375, -12.019775390625, -11.1162109375, -10.212646484375, -9.30908203125, -8.405517578125, -7.501953125, -6.598388671875, -5.69482421875, -4.791259765625, -3.8876953125, -2.984130859375, -2.08056640625, -1.177001953125, -0.2734375, 0.630126953125, 1.53369140625, 2.437255859375, 3.3408203125, 4.244384765625, 5.14794921875, 6.051513671875, 6.955078125, 7.858642578125, 8.76220703125, 9.665771484375, 10.5693359375, 11.472900390625, 12.37646484375, 13.280029296875, 14.18359375, 15.087158203125, 15.99072265625, 16.894287109375, 17.7978515625, 18.701416015625, 19.60498046875, 20.508544921875, 21.412109375, 22.315673828125, 23.21923828125, 24.122802734375, 25.0263671875, 25.929931640625, 26.83349609375, 27.737060546875, 28.640625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 4.0, 7.0, 10.0, 8.0, 18.0, 14.0, 13.0, 19.0, 24.0, 23.0, 16.0, 23.0, 31.0, 46.0, 37.0, 45.0, 36.0, 56.0, 53.0, 48.0, 41.0, 52.0, 44.0, 38.0, 39.0, 39.0, 27.0, 26.0, 26.0, 28.0, 20.0, 10.0, 16.0, 12.0, 10.0, 9.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.2265625, -10.9078369140625, -10.589111328125, -10.2703857421875, -9.95166015625, -9.6329345703125, -9.314208984375, -8.9954833984375, -8.6767578125, -8.3580322265625, -8.039306640625, -7.7205810546875, -7.40185546875, -7.0831298828125, -6.764404296875, -6.4456787109375, -6.126953125, -5.8082275390625, -5.489501953125, -5.1707763671875, -4.85205078125, -4.5333251953125, -4.214599609375, -3.8958740234375, -3.5771484375, -3.2584228515625, -2.939697265625, -2.6209716796875, -2.30224609375, -1.9835205078125, -1.664794921875, -1.3460693359375, -1.02734375, -0.7086181640625, -0.389892578125, -0.0711669921875, 0.24755859375, 0.5662841796875, 0.885009765625, 1.2037353515625, 1.5224609375, 1.8411865234375, 2.159912109375, 2.4786376953125, 2.79736328125, 3.1160888671875, 3.434814453125, 3.7535400390625, 4.072265625, 4.3909912109375, 4.709716796875, 5.0284423828125, 5.34716796875, 5.6658935546875, 5.984619140625, 6.3033447265625, 6.6220703125, 6.9407958984375, 7.259521484375, 7.5782470703125, 7.89697265625, 8.2156982421875, 8.534423828125, 8.8531494140625, 9.171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 6.0, 4.0, 8.0, 12.0, 22.0, 26.0, 42.0, 44.0, 53.0, 93.0, 137.0, 243.0, 342.0, 519.0, 815.0, 1352.0, 2788.0, 5890.0, 15336.0, 47797.0, 188829.0, 520369.0, 188055.0, 47926.0, 15435.0, 5921.0, 2659.0, 1467.0, 833.0, 520.0, 285.0, 224.0, 146.0, 114.0, 68.0, 52.0, 35.0, 22.0, 16.0, 16.0, 7.0, 12.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -50.31884765625, -48.6689453125, -47.01904296875, -45.369140625, -43.71923828125, -42.0693359375, -40.41943359375, -38.76953125, -37.11962890625, -35.4697265625, -33.81982421875, -32.169921875, -30.52001953125, -28.8701171875, -27.22021484375, -25.5703125, -23.92041015625, -22.2705078125, -20.62060546875, -18.970703125, -17.32080078125, -15.6708984375, -14.02099609375, -12.37109375, -10.72119140625, -9.0712890625, -7.42138671875, -5.771484375, -4.12158203125, -2.4716796875, -0.82177734375, 0.828125, 2.47802734375, 4.1279296875, 5.77783203125, 7.427734375, 9.07763671875, 10.7275390625, 12.37744140625, 14.02734375, 15.67724609375, 17.3271484375, 18.97705078125, 20.626953125, 22.27685546875, 23.9267578125, 25.57666015625, 27.2265625, 28.87646484375, 30.5263671875, 32.17626953125, 33.826171875, 35.47607421875, 37.1259765625, 38.77587890625, 40.42578125, 42.07568359375, 43.7255859375, 45.37548828125, 47.025390625, 48.67529296875, 50.3251953125, 51.97509765625, 53.625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 5.0, 14.0, 11.0, 17.0, 19.0, 27.0, 32.0, 39.0, 48.0, 60.0, 51.0, 82.0, 62.0, 72.0, 66.0, 63.0, 64.0, 41.0, 41.0, 21.0, 27.0, 34.0, 32.0, 11.0, 7.0, 10.0, 11.0, 4.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.6875, -65.359375, -63.03125, -60.703125, -58.375, -56.046875, -53.71875, -51.390625, -49.0625, -46.734375, -44.40625, -42.078125, -39.75, -37.421875, -35.09375, -32.765625, -30.4375, -28.109375, -25.78125, -23.453125, -21.125, -18.796875, -16.46875, -14.140625, -11.8125, -9.484375, -7.15625, -4.828125, -2.5, -0.171875, 2.15625, 4.484375, 6.8125, 9.140625, 11.46875, 13.796875, 16.125, 18.453125, 20.78125, 23.109375, 25.4375, 27.765625, 30.09375, 32.421875, 34.75, 37.078125, 39.40625, 41.734375, 44.0625, 46.390625, 48.71875, 51.046875, 53.375, 55.703125, 58.03125, 60.359375, 62.6875, 65.015625, 67.34375, 69.671875, 72.0, 74.328125, 76.65625, 78.984375, 81.3125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 7.0, 9.0, 12.0, 30.0, 42.0, 83.0, 108.0, 189.0, 281.0, 464.0, 856.0, 2231.0, 7370.0, 43922.0, 517296.0, 427352.0, 37488.0, 6802.0, 1966.0, 849.0, 446.0, 260.0, 167.0, 109.0, 55.0, 42.0, 29.0, 14.0, 10.0, 12.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-36.375, -35.271484375, -34.16796875, -33.064453125, -31.9609375, -30.857421875, -29.75390625, -28.650390625, -27.546875, -26.443359375, -25.33984375, -24.236328125, -23.1328125, -22.029296875, -20.92578125, -19.822265625, -18.71875, -17.615234375, -16.51171875, -15.408203125, -14.3046875, -13.201171875, -12.09765625, -10.994140625, -9.890625, -8.787109375, -7.68359375, -6.580078125, -5.4765625, -4.373046875, -3.26953125, -2.166015625, -1.0625, 0.041015625, 1.14453125, 2.248046875, 3.3515625, 4.455078125, 5.55859375, 6.662109375, 7.765625, 8.869140625, 9.97265625, 11.076171875, 12.1796875, 13.283203125, 14.38671875, 15.490234375, 16.59375, 17.697265625, 18.80078125, 19.904296875, 21.0078125, 22.111328125, 23.21484375, 24.318359375, 25.421875, 26.525390625, 27.62890625, 28.732421875, 29.8359375, 30.939453125, 32.04296875, 33.146484375, 34.25]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 9.0, 22.0, 21.0, 54.0, 66.0, 131.0, 222.0, 206.0, 110.0, 61.0, 49.0, 17.0, 14.0, 8.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0046844482421875, -0.004470229148864746, -0.004256010055541992, -0.004041790962219238, -0.0038275718688964844, -0.0036133527755737305, -0.0033991336822509766, -0.0031849145889282227, -0.0029706954956054688, -0.002756476402282715, -0.002542257308959961, -0.002328038215637207, -0.002113819122314453, -0.0018996000289916992, -0.0016853809356689453, -0.0014711618423461914, -0.0012569427490234375, -0.0010427236557006836, -0.0008285045623779297, -0.0006142854690551758, -0.0004000663757324219, -0.00018584728240966797, 2.8371810913085938e-05, 0.00024259090423583984, 0.00045680999755859375, 0.0006710290908813477, 0.0008852481842041016, 0.0010994672775268555, 0.0013136863708496094, 0.0015279054641723633, 0.0017421245574951172, 0.001956343650817871, 0.002170562744140625, 0.002384781837463379, 0.002599000930786133, 0.0028132200241088867, 0.0030274391174316406, 0.0032416582107543945, 0.0034558773040771484, 0.0036700963973999023, 0.0038843154907226562, 0.00409853458404541, 0.004312753677368164, 0.004526972770690918, 0.004741191864013672, 0.004955410957336426, 0.00516963005065918, 0.005383849143981934, 0.0055980682373046875, 0.005812287330627441, 0.006026506423950195, 0.006240725517272949, 0.006454944610595703, 0.006669163703918457, 0.006883382797241211, 0.007097601890563965, 0.007311820983886719, 0.007526040077209473, 0.0077402591705322266, 0.00795447826385498, 0.008168697357177734, 0.008382916450500488, 0.008597135543823242, 0.008811354637145996, 0.00902557373046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 6.0, 9.0, 9.0, 17.0, 32.0, 55.0, 77.0, 140.0, 244.0, 529.0, 1130.0, 2988.0, 13630.0, 150409.0, 785591.0, 80249.0, 9072.0, 2434.0, 906.0, 454.0, 228.0, 113.0, 79.0, 49.0, 17.0, 23.0, 10.0, 6.0, 9.0, 6.0, 4.0, 8.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-45.65625, -44.43505859375, -43.2138671875, -41.99267578125, -40.771484375, -39.55029296875, -38.3291015625, -37.10791015625, -35.88671875, -34.66552734375, -33.4443359375, -32.22314453125, -31.001953125, -29.78076171875, -28.5595703125, -27.33837890625, -26.1171875, -24.89599609375, -23.6748046875, -22.45361328125, -21.232421875, -20.01123046875, -18.7900390625, -17.56884765625, -16.34765625, -15.12646484375, -13.9052734375, -12.68408203125, -11.462890625, -10.24169921875, -9.0205078125, -7.79931640625, -6.578125, -5.35693359375, -4.1357421875, -2.91455078125, -1.693359375, -0.47216796875, 0.7490234375, 1.97021484375, 3.19140625, 4.41259765625, 5.6337890625, 6.85498046875, 8.076171875, 9.29736328125, 10.5185546875, 11.73974609375, 12.9609375, 14.18212890625, 15.4033203125, 16.62451171875, 17.845703125, 19.06689453125, 20.2880859375, 21.50927734375, 22.73046875, 23.95166015625, 25.1728515625, 26.39404296875, 27.615234375, 28.83642578125, 30.0576171875, 31.27880859375, 32.5]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 19.0, 24.0, 58.0, 58.0, 87.0, 127.0, 126.0, 121.0, 100.0, 92.0, 51.0, 29.0, 22.0, 17.0, 8.0, 6.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.0, -41.884033203125, -40.76806640625, -39.652099609375, -38.5361328125, -37.420166015625, -36.30419921875, -35.188232421875, -34.072265625, -32.956298828125, -31.84033203125, -30.724365234375, -29.6083984375, -28.492431640625, -27.37646484375, -26.260498046875, -25.14453125, -24.028564453125, -22.91259765625, -21.796630859375, -20.6806640625, -19.564697265625, -18.44873046875, -17.332763671875, -16.216796875, -15.100830078125, -13.98486328125, -12.868896484375, -11.7529296875, -10.636962890625, -9.52099609375, -8.405029296875, -7.2890625, -6.173095703125, -5.05712890625, -3.941162109375, -2.8251953125, -1.709228515625, -0.59326171875, 0.522705078125, 1.638671875, 2.754638671875, 3.87060546875, 4.986572265625, 6.1025390625, 7.218505859375, 8.33447265625, 9.450439453125, 10.56640625, 11.682373046875, 12.79833984375, 13.914306640625, 15.0302734375, 16.146240234375, 17.26220703125, 18.378173828125, 19.494140625, 20.610107421875, 21.72607421875, 22.842041015625, 23.9580078125, 25.073974609375, 26.18994140625, 27.305908203125, 28.421875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 7.0, 11.0, 6.0, 18.0, 26.0, 27.0, 37.0, 63.0, 104.0, 87.0, 122.0, 95.0, 98.0, 91.0, 62.0, 50.0, 29.0, 17.0, 9.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-403.4252624511719, -391.63177490234375, -379.8382873535156, -368.0447998046875, -356.25128173828125, -344.4577941894531, -332.664306640625, -320.8708190917969, -309.07733154296875, -297.2838439941406, -285.4903564453125, -273.69683837890625, -261.9033508300781, -250.10986328125, -238.31637573242188, -226.52288818359375, -214.7293701171875, -202.93588256835938, -191.1423797607422, -179.34889221191406, -167.55538940429688, -155.76190185546875, -143.96841430664062, -132.1749267578125, -120.38142395019531, -108.58792877197266, -96.79443359375, -85.00094604492188, -73.20745086669922, -61.41395568847656, -49.62046813964844, -37.82697296142578, -26.033477783203125, -14.239984512329102, -2.446491241455078, 9.347000122070312, 21.14049530029297, 32.933990478515625, 44.72747802734375, 56.520973205566406, 68.31446838378906, 80.10796356201172, 91.90145874023438, 103.6949462890625, 115.48844146728516, 127.28193664550781, 139.07542419433594, 150.86892700195312, 162.66241455078125, 174.45590209960938, 186.24940490722656, 198.0428924560547, 209.83639526367188, 221.6298828125, 233.42337036132812, 245.21685791015625, 257.0103759765625, 268.8038635253906, 280.59735107421875, 292.390869140625, 304.1843566894531, 315.97784423828125, 327.7713317871094, 339.5648193359375, 351.3583068847656]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 9.0, 6.0, 7.0, 18.0, 18.0, 29.0, 27.0, 28.0, 39.0, 51.0, 34.0, 44.0, 69.0, 59.0, 55.0, 66.0, 56.0, 57.0, 41.0, 64.0, 48.0, 33.0, 27.0, 27.0, 32.0, 15.0, 16.0, 6.0, 5.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-480.408447265625, -466.667724609375, -452.927001953125, -439.186279296875, -425.445556640625, -411.704833984375, -397.9641418457031, -384.2234191894531, -370.4826965332031, -356.7419738769531, -343.0012512207031, -329.2605285644531, -315.51983642578125, -301.77911376953125, -288.03839111328125, -274.29766845703125, -260.55694580078125, -246.81622314453125, -233.07550048828125, -219.3347930908203, -205.5940704345703, -191.8533477783203, -178.11264038085938, -164.37191772460938, -150.63119506835938, -136.89047241210938, -123.1497573852539, -109.40904235839844, -95.66831970214844, -81.92759704589844, -68.18688201904297, -54.4461669921875, -40.705413818359375, -26.96469497680664, -13.223976135253906, 0.5167427062988281, 14.257461547851562, 27.998184204101562, 41.73889923095703, 55.4796142578125, 69.2203369140625, 82.9610595703125, 96.70177459716797, 110.44248962402344, 124.18321228027344, 137.92393493652344, 151.66464233398438, 165.40536499023438, 179.14608764648438, 192.88681030273438, 206.62753295898438, 220.3682403564453, 234.1089630126953, 247.8496856689453, 261.59039306640625, 275.33111572265625, 289.07183837890625, 302.81256103515625, 316.55328369140625, 330.29400634765625, 344.03472900390625, 357.77545166015625, 371.5161437988281, 385.2568664550781, 398.9975891113281]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 11.0, 27.0, 24.0, 48.0, 66.0, 98.0, 136.0, 214.0, 307.0, 542.0, 934.0, 1523.0, 2653.0, 4867.0, 9806.0, 21927.0, 60927.0, 309646.0, 3567236.0, 142251.0, 39291.0, 15575.0, 7303.0, 3639.0, 2023.0, 1217.0, 721.0, 416.0, 281.0, 203.0, 111.0, 85.0, 48.0, 35.0, 26.0, 17.0, 7.0, 11.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.625, -63.76611328125, -61.9072265625, -60.04833984375, -58.189453125, -56.33056640625, -54.4716796875, -52.61279296875, -50.75390625, -48.89501953125, -47.0361328125, -45.17724609375, -43.318359375, -41.45947265625, -39.6005859375, -37.74169921875, -35.8828125, -34.02392578125, -32.1650390625, -30.30615234375, -28.447265625, -26.58837890625, -24.7294921875, -22.87060546875, -21.01171875, -19.15283203125, -17.2939453125, -15.43505859375, -13.576171875, -11.71728515625, -9.8583984375, -7.99951171875, -6.140625, -4.28173828125, -2.4228515625, -0.56396484375, 1.294921875, 3.15380859375, 5.0126953125, 6.87158203125, 8.73046875, 10.58935546875, 12.4482421875, 14.30712890625, 16.166015625, 18.02490234375, 19.8837890625, 21.74267578125, 23.6015625, 25.46044921875, 27.3193359375, 29.17822265625, 31.037109375, 32.89599609375, 34.7548828125, 36.61376953125, 38.47265625, 40.33154296875, 42.1904296875, 44.04931640625, 45.908203125, 47.76708984375, 49.6259765625, 51.48486328125, 53.34375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 5.0, 2.0, 9.0, 10.0, 15.0, 17.0, 23.0, 22.0, 35.0, 33.0, 37.0, 54.0, 40.0, 48.0, 50.0, 51.0, 61.0, 58.0, 59.0, 48.0, 52.0, 54.0, 39.0, 33.0, 25.0, 25.0, 22.0, 15.0, 8.0, 14.0, 14.0, 10.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.703125, -18.17919921875, -17.6552734375, -17.13134765625, -16.607421875, -16.08349609375, -15.5595703125, -15.03564453125, -14.51171875, -13.98779296875, -13.4638671875, -12.93994140625, -12.416015625, -11.89208984375, -11.3681640625, -10.84423828125, -10.3203125, -9.79638671875, -9.2724609375, -8.74853515625, -8.224609375, -7.70068359375, -7.1767578125, -6.65283203125, -6.12890625, -5.60498046875, -5.0810546875, -4.55712890625, -4.033203125, -3.50927734375, -2.9853515625, -2.46142578125, -1.9375, -1.41357421875, -0.8896484375, -0.36572265625, 0.158203125, 0.68212890625, 1.2060546875, 1.72998046875, 2.25390625, 2.77783203125, 3.3017578125, 3.82568359375, 4.349609375, 4.87353515625, 5.3974609375, 5.92138671875, 6.4453125, 6.96923828125, 7.4931640625, 8.01708984375, 8.541015625, 9.06494140625, 9.5888671875, 10.11279296875, 10.63671875, 11.16064453125, 11.6845703125, 12.20849609375, 12.732421875, 13.25634765625, 13.7802734375, 14.30419921875, 14.828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 3.0, 0.0, 7.0, 8.0, 9.0, 6.0, 10.0, 20.0, 24.0, 44.0, 70.0, 77.0, 119.0, 151.0, 197.0, 330.0, 482.0, 796.0, 1540.0, 3618.0, 10354.0, 41715.0, 488381.0, 3547022.0, 74418.0, 15295.0, 4768.0, 2014.0, 964.0, 605.0, 330.0, 269.0, 173.0, 124.0, 102.0, 67.0, 48.0, 24.0, 29.0, 20.0, 19.0, 12.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-123.8125, -120.48046875, -117.1484375, -113.81640625, -110.484375, -107.15234375, -103.8203125, -100.48828125, -97.15625, -93.82421875, -90.4921875, -87.16015625, -83.828125, -80.49609375, -77.1640625, -73.83203125, -70.5, -67.16796875, -63.8359375, -60.50390625, -57.171875, -53.83984375, -50.5078125, -47.17578125, -43.84375, -40.51171875, -37.1796875, -33.84765625, -30.515625, -27.18359375, -23.8515625, -20.51953125, -17.1875, -13.85546875, -10.5234375, -7.19140625, -3.859375, -0.52734375, 2.8046875, 6.13671875, 9.46875, 12.80078125, 16.1328125, 19.46484375, 22.796875, 26.12890625, 29.4609375, 32.79296875, 36.125, 39.45703125, 42.7890625, 46.12109375, 49.453125, 52.78515625, 56.1171875, 59.44921875, 62.78125, 66.11328125, 69.4453125, 72.77734375, 76.109375, 79.44140625, 82.7734375, 86.10546875, 89.4375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 8.0, 12.0, 31.0, 45.0, 106.0, 381.0, 2839.0, 372.0, 123.0, 58.0, 28.0, 24.0, 9.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.5, -92.044921875, -89.58984375, -87.134765625, -84.6796875, -82.224609375, -79.76953125, -77.314453125, -74.859375, -72.404296875, -69.94921875, -67.494140625, -65.0390625, -62.583984375, -60.12890625, -57.673828125, -55.21875, -52.763671875, -50.30859375, -47.853515625, -45.3984375, -42.943359375, -40.48828125, -38.033203125, -35.578125, -33.123046875, -30.66796875, -28.212890625, -25.7578125, -23.302734375, -20.84765625, -18.392578125, -15.9375, -13.482421875, -11.02734375, -8.572265625, -6.1171875, -3.662109375, -1.20703125, 1.248046875, 3.703125, 6.158203125, 8.61328125, 11.068359375, 13.5234375, 15.978515625, 18.43359375, 20.888671875, 23.34375, 25.798828125, 28.25390625, 30.708984375, 33.1640625, 35.619140625, 38.07421875, 40.529296875, 42.984375, 45.439453125, 47.89453125, 50.349609375, 52.8046875, 55.259765625, 57.71484375, 60.169921875, 62.625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 7.0, 17.0, 23.0, 37.0, 56.0, 100.0, 130.0, 162.0, 128.0, 115.0, 71.0, 51.0, 37.0, 18.0, 14.0, 7.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-161.06800842285156, -153.37513732910156, -145.68228149414062, -137.98941040039062, -130.29653930664062, -122.60366821289062, -114.91080474853516, -107.21794128417969, -99.52507019042969, -91.83219909667969, -84.13933563232422, -76.44647216796875, -68.75360107421875, -61.060733795166016, -53.36786651611328, -45.67499923706055, -37.98213195800781, -30.289264678955078, -22.596397399902344, -14.90353012084961, -7.210662841796875, 0.4822044372558594, 8.175071716308594, 15.867938995361328, 23.560806274414062, 31.253673553466797, 38.94654083251953, 46.639408111572266, 54.332275390625, 62.025142669677734, 69.71800994873047, 77.41087341308594, 85.10372924804688, 92.79660034179688, 100.48946380615234, 108.18232727050781, 115.87519836425781, 123.56806945800781, 131.26092529296875, 138.95379638671875, 146.64666748046875, 154.33953857421875, 162.03240966796875, 169.7252655029297, 177.4181365966797, 185.1110076904297, 192.80386352539062, 200.49673461914062, 208.18960571289062, 215.88247680664062, 223.57534790039062, 231.26820373535156, 238.96107482910156, 246.65394592285156, 254.3468017578125, 262.0396728515625, 269.7325439453125, 277.4254150390625, 285.1182861328125, 292.8111572265625, 300.5040283203125, 308.1968688964844, 315.8897399902344, 323.5826110839844, 331.2754821777344]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 8.0, 5.0, 7.0, 12.0, 9.0, 19.0, 19.0, 35.0, 23.0, 14.0, 16.0, 28.0, 34.0, 32.0, 28.0, 43.0, 51.0, 39.0, 36.0, 42.0, 42.0, 45.0, 38.0, 37.0, 30.0, 31.0, 25.0, 25.0, 28.0, 26.0, 26.0, 22.0, 26.0, 3.0, 13.0, 14.0, 14.0, 11.0, 10.0, 6.0, 5.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-134.34027099609375, -130.07669067382812, -125.8131103515625, -121.54953002929688, -117.28594970703125, -113.02236938476562, -108.75878143310547, -104.49520111083984, -100.23162078857422, -95.9680404663086, -91.70446014404297, -87.44087982177734, -83.17729187011719, -78.91371154785156, -74.65013122558594, -70.38655090332031, -66.12297058105469, -61.85939025878906, -57.59580993652344, -53.33222579956055, -49.06864547729492, -44.8050651550293, -40.541481018066406, -36.27790069580078, -32.014320373535156, -27.75074005126953, -23.487157821655273, -19.223575592041016, -14.95999526977539, -10.696414947509766, -6.432832717895508, -2.16925048828125, 2.094329833984375, 6.357911109924316, 10.621492385864258, 14.8850736618042, 19.14865493774414, 23.412235260009766, 27.675817489624023, 31.93939971923828, 36.202980041503906, 40.46656036376953, 44.730140686035156, 48.99372482299805, 53.25730514526367, 57.5208854675293, 61.78446960449219, 66.04804992675781, 70.31163024902344, 74.57521057128906, 78.83879089355469, 83.10237121582031, 87.36595153808594, 91.62953186035156, 95.89311981201172, 100.15670013427734, 104.42028045654297, 108.6838607788086, 112.94744110107422, 117.21102142333984, 121.474609375, 125.73818969726562, 130.00177001953125, 134.26535034179688, 138.5289306640625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 14.0, 14.0, 26.0, 36.0, 69.0, 107.0, 212.0, 379.0, 716.0, 1462.0, 3207.0, 7321.0, 18360.0, 51919.0, 166293.0, 411280.0, 260489.0, 80992.0, 26818.0, 10307.0, 4411.0, 2042.0, 967.0, 481.0, 267.0, 149.0, 84.0, 49.0, 29.0, 23.0, 9.0, 12.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.5556640625, -64.236328125, -61.9169921875, -59.59765625, -57.2783203125, -54.958984375, -52.6396484375, -50.3203125, -48.0009765625, -45.681640625, -43.3623046875, -41.04296875, -38.7236328125, -36.404296875, -34.0849609375, -31.765625, -29.4462890625, -27.126953125, -24.8076171875, -22.48828125, -20.1689453125, -17.849609375, -15.5302734375, -13.2109375, -10.8916015625, -8.572265625, -6.2529296875, -3.93359375, -1.6142578125, 0.705078125, 3.0244140625, 5.34375, 7.6630859375, 9.982421875, 12.3017578125, 14.62109375, 16.9404296875, 19.259765625, 21.5791015625, 23.8984375, 26.2177734375, 28.537109375, 30.8564453125, 33.17578125, 35.4951171875, 37.814453125, 40.1337890625, 42.453125, 44.7724609375, 47.091796875, 49.4111328125, 51.73046875, 54.0498046875, 56.369140625, 58.6884765625, 61.0078125, 63.3271484375, 65.646484375, 67.9658203125, 70.28515625, 72.6044921875, 74.923828125, 77.2431640625, 79.5625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 8.0, 8.0, 15.0, 13.0, 20.0, 24.0, 32.0, 46.0, 36.0, 34.0, 59.0, 61.0, 44.0, 44.0, 63.0, 56.0, 53.0, 61.0, 51.0, 34.0, 31.0, 31.0, 21.0, 29.0, 26.0, 26.0, 18.0, 9.0, 10.0, 9.0, 5.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.734375, -22.147216796875, -21.56005859375, -20.972900390625, -20.3857421875, -19.798583984375, -19.21142578125, -18.624267578125, -18.037109375, -17.449951171875, -16.86279296875, -16.275634765625, -15.6884765625, -15.101318359375, -14.51416015625, -13.927001953125, -13.33984375, -12.752685546875, -12.16552734375, -11.578369140625, -10.9912109375, -10.404052734375, -9.81689453125, -9.229736328125, -8.642578125, -8.055419921875, -7.46826171875, -6.881103515625, -6.2939453125, -5.706787109375, -5.11962890625, -4.532470703125, -3.9453125, -3.358154296875, -2.77099609375, -2.183837890625, -1.5966796875, -1.009521484375, -0.42236328125, 0.164794921875, 0.751953125, 1.339111328125, 1.92626953125, 2.513427734375, 3.1005859375, 3.687744140625, 4.27490234375, 4.862060546875, 5.44921875, 6.036376953125, 6.62353515625, 7.210693359375, 7.7978515625, 8.385009765625, 8.97216796875, 9.559326171875, 10.146484375, 10.733642578125, 11.32080078125, 11.907958984375, 12.4951171875, 13.082275390625, 13.66943359375, 14.256591796875, 14.84375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 12.0, 7.0, 11.0, 16.0, 11.0, 29.0, 33.0, 52.0, 70.0, 85.0, 113.0, 159.0, 207.0, 357.0, 534.0, 994.0, 1915.0, 4065.0, 8837.0, 23248.0, 74326.0, 299853.0, 448624.0, 125707.0, 35446.0, 12705.0, 5240.0, 2516.0, 1287.0, 714.0, 432.0, 263.0, 190.0, 119.0, 72.0, 83.0, 57.0, 34.0, 25.0, 26.0, 19.0, 11.0, 12.0, 9.0, 10.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-91.3125, -88.5615234375, -85.810546875, -83.0595703125, -80.30859375, -77.5576171875, -74.806640625, -72.0556640625, -69.3046875, -66.5537109375, -63.802734375, -61.0517578125, -58.30078125, -55.5498046875, -52.798828125, -50.0478515625, -47.296875, -44.5458984375, -41.794921875, -39.0439453125, -36.29296875, -33.5419921875, -30.791015625, -28.0400390625, -25.2890625, -22.5380859375, -19.787109375, -17.0361328125, -14.28515625, -11.5341796875, -8.783203125, -6.0322265625, -3.28125, -0.5302734375, 2.220703125, 4.9716796875, 7.72265625, 10.4736328125, 13.224609375, 15.9755859375, 18.7265625, 21.4775390625, 24.228515625, 26.9794921875, 29.73046875, 32.4814453125, 35.232421875, 37.9833984375, 40.734375, 43.4853515625, 46.236328125, 48.9873046875, 51.73828125, 54.4892578125, 57.240234375, 59.9912109375, 62.7421875, 65.4931640625, 68.244140625, 70.9951171875, 73.74609375, 76.4970703125, 79.248046875, 81.9990234375, 84.75]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 8.0, 4.0, 4.0, 11.0, 11.0, 15.0, 8.0, 22.0, 19.0, 21.0, 19.0, 22.0, 33.0, 27.0, 40.0, 35.0, 43.0, 36.0, 48.0, 54.0, 40.0, 38.0, 39.0, 48.0, 35.0, 44.0, 33.0, 31.0, 27.0, 19.0, 24.0, 25.0, 16.0, 16.0, 11.0, 8.0, 7.0, 3.0, 17.0, 3.0, 7.0, 1.0, 7.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-99.875, -96.8740234375, -93.873046875, -90.8720703125, -87.87109375, -84.8701171875, -81.869140625, -78.8681640625, -75.8671875, -72.8662109375, -69.865234375, -66.8642578125, -63.86328125, -60.8623046875, -57.861328125, -54.8603515625, -51.859375, -48.8583984375, -45.857421875, -42.8564453125, -39.85546875, -36.8544921875, -33.853515625, -30.8525390625, -27.8515625, -24.8505859375, -21.849609375, -18.8486328125, -15.84765625, -12.8466796875, -9.845703125, -6.8447265625, -3.84375, -0.8427734375, 2.158203125, 5.1591796875, 8.16015625, 11.1611328125, 14.162109375, 17.1630859375, 20.1640625, 23.1650390625, 26.166015625, 29.1669921875, 32.16796875, 35.1689453125, 38.169921875, 41.1708984375, 44.171875, 47.1728515625, 50.173828125, 53.1748046875, 56.17578125, 59.1767578125, 62.177734375, 65.1787109375, 68.1796875, 71.1806640625, 74.181640625, 77.1826171875, 80.18359375, 83.1845703125, 86.185546875, 89.1865234375, 92.1875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 7.0, 12.0, 26.0, 44.0, 61.0, 113.0, 189.0, 325.0, 636.0, 1419.0, 3716.0, 12337.0, 58123.0, 501944.0, 404144.0, 48724.0, 10712.0, 3409.0, 1308.0, 561.0, 325.0, 165.0, 106.0, 47.0, 34.0, 21.0, 9.0, 6.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.46875, -44.44384765625, -42.4189453125, -40.39404296875, -38.369140625, -36.34423828125, -34.3193359375, -32.29443359375, -30.26953125, -28.24462890625, -26.2197265625, -24.19482421875, -22.169921875, -20.14501953125, -18.1201171875, -16.09521484375, -14.0703125, -12.04541015625, -10.0205078125, -7.99560546875, -5.970703125, -3.94580078125, -1.9208984375, 0.10400390625, 2.12890625, 4.15380859375, 6.1787109375, 8.20361328125, 10.228515625, 12.25341796875, 14.2783203125, 16.30322265625, 18.328125, 20.35302734375, 22.3779296875, 24.40283203125, 26.427734375, 28.45263671875, 30.4775390625, 32.50244140625, 34.52734375, 36.55224609375, 38.5771484375, 40.60205078125, 42.626953125, 44.65185546875, 46.6767578125, 48.70166015625, 50.7265625, 52.75146484375, 54.7763671875, 56.80126953125, 58.826171875, 60.85107421875, 62.8759765625, 64.90087890625, 66.92578125, 68.95068359375, 70.9755859375, 73.00048828125, 75.025390625, 77.05029296875, 79.0751953125, 81.10009765625, 83.125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 16.0, 20.0, 24.0, 30.0, 47.0, 57.0, 90.0, 95.0, 128.0, 94.0, 89.0, 65.0, 59.0, 46.0, 25.0, 17.0, 11.0, 15.0, 10.0, 6.0, 4.0, 3.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006366729736328125, -0.006158769130706787, -0.005950808525085449, -0.005742847919464111, -0.0055348873138427734, -0.0053269267082214355, -0.005118966102600098, -0.00491100549697876, -0.004703044891357422, -0.004495084285736084, -0.004287123680114746, -0.004079163074493408, -0.0038712024688720703, -0.0036632418632507324, -0.0034552812576293945, -0.0032473206520080566, -0.0030393600463867188, -0.002831399440765381, -0.002623438835144043, -0.002415478229522705, -0.002207517623901367, -0.0019995570182800293, -0.0017915964126586914, -0.0015836358070373535, -0.0013756752014160156, -0.0011677145957946777, -0.0009597539901733398, -0.000751793384552002, -0.0005438327789306641, -0.00033587217330932617, -0.00012791156768798828, 8.004903793334961e-05, 0.0002880096435546875, 0.0004959702491760254, 0.0007039308547973633, 0.0009118914604187012, 0.001119852066040039, 0.001327812671661377, 0.0015357732772827148, 0.0017437338829040527, 0.0019516944885253906, 0.0021596550941467285, 0.0023676156997680664, 0.0025755763053894043, 0.002783536911010742, 0.00299149751663208, 0.003199458122253418, 0.003407418727874756, 0.0036153793334960938, 0.0038233399391174316, 0.0040313005447387695, 0.004239261150360107, 0.004447221755981445, 0.004655182361602783, 0.004863142967224121, 0.005071103572845459, 0.005279064178466797, 0.005487024784088135, 0.005694985389709473, 0.0059029459953308105, 0.0061109066009521484, 0.006318867206573486, 0.006526827812194824, 0.006734788417816162, 0.0069427490234375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 6.0, 18.0, 24.0, 43.0, 49.0, 100.0, 156.0, 264.0, 586.0, 1440.0, 5327.0, 35794.0, 616512.0, 359232.0, 22920.0, 3785.0, 1178.0, 486.0, 237.0, 139.0, 74.0, 66.0, 29.0, 19.0, 12.0, 10.0, 18.0, 2.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.75, -64.1728515625, -61.595703125, -59.0185546875, -56.44140625, -53.8642578125, -51.287109375, -48.7099609375, -46.1328125, -43.5556640625, -40.978515625, -38.4013671875, -35.82421875, -33.2470703125, -30.669921875, -28.0927734375, -25.515625, -22.9384765625, -20.361328125, -17.7841796875, -15.20703125, -12.6298828125, -10.052734375, -7.4755859375, -4.8984375, -2.3212890625, 0.255859375, 2.8330078125, 5.41015625, 7.9873046875, 10.564453125, 13.1416015625, 15.71875, 18.2958984375, 20.873046875, 23.4501953125, 26.02734375, 28.6044921875, 31.181640625, 33.7587890625, 36.3359375, 38.9130859375, 41.490234375, 44.0673828125, 46.64453125, 49.2216796875, 51.798828125, 54.3759765625, 56.953125, 59.5302734375, 62.107421875, 64.6845703125, 67.26171875, 69.8388671875, 72.416015625, 74.9931640625, 77.5703125, 80.1474609375, 82.724609375, 85.3017578125, 87.87890625, 90.4560546875, 93.033203125, 95.6103515625, 98.1875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 10.0, 12.0, 14.0, 17.0, 27.0, 29.0, 41.0, 44.0, 76.0, 91.0, 138.0, 99.0, 85.0, 71.0, 61.0, 38.0, 29.0, 23.0, 27.0, 15.0, 14.0, 11.0, 3.0, 1.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.75, -56.65625, -54.5625, -52.46875, -50.375, -48.28125, -46.1875, -44.09375, -42.0, -39.90625, -37.8125, -35.71875, -33.625, -31.53125, -29.4375, -27.34375, -25.25, -23.15625, -21.0625, -18.96875, -16.875, -14.78125, -12.6875, -10.59375, -8.5, -6.40625, -4.3125, -2.21875, -0.125, 1.96875, 4.0625, 6.15625, 8.25, 10.34375, 12.4375, 14.53125, 16.625, 18.71875, 20.8125, 22.90625, 25.0, 27.09375, 29.1875, 31.28125, 33.375, 35.46875, 37.5625, 39.65625, 41.75, 43.84375, 45.9375, 48.03125, 50.125, 52.21875, 54.3125, 56.40625, 58.5, 60.59375, 62.6875, 64.78125, 66.875, 68.96875, 71.0625, 73.15625, 75.25]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 21.0, 38.0, 65.0, 85.0, 98.0, 167.0, 141.0, 136.0, 87.0, 64.0, 35.0, 19.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-705.160400390625, -678.1300048828125, -651.0995483398438, -624.0691528320312, -597.0387573242188, -570.00830078125, -542.9779052734375, -515.947509765625, -488.91705322265625, -461.8866271972656, -434.8562316894531, -407.8258056640625, -380.7953796386719, -353.76495361328125, -326.73455810546875, -299.7041320800781, -272.6737365722656, -245.64332580566406, -218.61289978027344, -191.58248901367188, -164.55206298828125, -137.5216522216797, -110.49124145507812, -83.4608154296875, -56.43040466308594, -29.399988174438477, -2.3695716857910156, 24.660842895507812, 51.691261291503906, 78.7216796875, 105.75209045410156, 132.7825164794922, 159.81292724609375, 186.8433380126953, 213.87376403808594, 240.9041748046875, 267.9346008300781, 294.96502685546875, 321.99542236328125, 349.0258483886719, 376.0562744140625, 403.0867004394531, 430.1170959472656, 457.14752197265625, 484.1779479980469, 511.2083740234375, 538.23876953125, 565.2691650390625, 592.299560546875, 619.3299560546875, 646.3604125976562, 673.3908081054688, 700.4212036132812, 727.45166015625, 754.4820556640625, 781.512451171875, 808.5429077148438, 835.5733032226562, 862.603759765625, 889.6341552734375, 916.66455078125, 943.6950073242188, 970.7254028320312, 997.755859375, 1024.7862548828125]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 10.0, 2.0, 11.0, 7.0, 16.0, 19.0, 19.0, 28.0, 28.0, 42.0, 36.0, 33.0, 45.0, 41.0, 57.0, 67.0, 77.0, 56.0, 54.0, 54.0, 59.0, 33.0, 43.0, 34.0, 20.0, 23.0, 14.0, 15.0, 9.0, 14.0, 8.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-805.1224975585938, -782.1176147460938, -759.1127319335938, -736.10791015625, -713.10302734375, -690.09814453125, -667.09326171875, -644.08837890625, -621.08349609375, -598.07861328125, -575.07373046875, -552.06884765625, -529.0640258789062, -506.05914306640625, -483.05426025390625, -460.04937744140625, -437.0445556640625, -414.0396728515625, -391.0348205566406, -368.0299377441406, -345.02508544921875, -322.02020263671875, -299.01531982421875, -276.01043701171875, -253.00558471679688, -230.00071716308594, -206.995849609375, -183.990966796875, -160.98609924316406, -137.98123168945312, -114.97634887695312, -91.97148132324219, -68.96661376953125, -45.96174240112305, -22.956871032714844, 0.048004150390625, 23.052871704101562, 46.0577392578125, 69.0626220703125, 92.06748962402344, 115.07235717773438, 138.0772247314453, 161.08209228515625, 184.08697509765625, 207.0918426513672, 230.09671020507812, 253.10159301757812, 276.1064453125, 299.111328125, 322.1162109375, 345.1210632324219, 368.1259460449219, 391.13079833984375, 414.13568115234375, 437.14056396484375, 460.14544677734375, 483.1502990722656, 506.1551818847656, 529.1600341796875, 552.1649169921875, 575.1697998046875, 598.1746826171875, 621.1795654296875, 644.1843872070312, 667.1892700195312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 6.0, 5.0, 15.0, 19.0, 40.0, 57.0, 76.0, 139.0, 210.0, 435.0, 767.0, 1969.0, 7769.0, 4050030.0, 122904.0, 6575.0, 1675.0, 693.0, 367.0, 203.0, 115.0, 61.0, 50.0, 32.0, 17.0, 10.0, 10.0, 6.0, 11.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-336.75, -327.634765625, -318.51953125, -309.404296875, -300.2890625, -291.173828125, -282.05859375, -272.943359375, -263.828125, -254.712890625, -245.59765625, -236.482421875, -227.3671875, -218.251953125, -209.13671875, -200.021484375, -190.90625, -181.791015625, -172.67578125, -163.560546875, -154.4453125, -145.330078125, -136.21484375, -127.099609375, -117.984375, -108.869140625, -99.75390625, -90.638671875, -81.5234375, -72.408203125, -63.29296875, -54.177734375, -45.0625, -35.947265625, -26.83203125, -17.716796875, -8.6015625, 0.513671875, 9.62890625, 18.744140625, 27.859375, 36.974609375, 46.08984375, 55.205078125, 64.3203125, 73.435546875, 82.55078125, 91.666015625, 100.78125, 109.896484375, 119.01171875, 128.126953125, 137.2421875, 146.357421875, 155.47265625, 164.587890625, 173.703125, 182.818359375, 191.93359375, 201.048828125, 210.1640625, 219.279296875, 228.39453125, 237.509765625, 246.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 13.0, 12.0, 13.0, 17.0, 23.0, 44.0, 43.0, 51.0, 57.0, 68.0, 81.0, 70.0, 91.0, 81.0, 63.0, 57.0, 43.0, 42.0, 33.0, 21.0, 18.0, 25.0, 3.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.28125, -42.10107421875, -40.9208984375, -39.74072265625, -38.560546875, -37.38037109375, -36.2001953125, -35.02001953125, -33.83984375, -32.65966796875, -31.4794921875, -30.29931640625, -29.119140625, -27.93896484375, -26.7587890625, -25.57861328125, -24.3984375, -23.21826171875, -22.0380859375, -20.85791015625, -19.677734375, -18.49755859375, -17.3173828125, -16.13720703125, -14.95703125, -13.77685546875, -12.5966796875, -11.41650390625, -10.236328125, -9.05615234375, -7.8759765625, -6.69580078125, -5.515625, -4.33544921875, -3.1552734375, -1.97509765625, -0.794921875, 0.38525390625, 1.5654296875, 2.74560546875, 3.92578125, 5.10595703125, 6.2861328125, 7.46630859375, 8.646484375, 9.82666015625, 11.0068359375, 12.18701171875, 13.3671875, 14.54736328125, 15.7275390625, 16.90771484375, 18.087890625, 19.26806640625, 20.4482421875, 21.62841796875, 22.80859375, 23.98876953125, 25.1689453125, 26.34912109375, 27.529296875, 28.70947265625, 29.8896484375, 31.06982421875, 32.25]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 4.0, 7.0, 7.0, 12.0, 13.0, 19.0, 29.0, 25.0, 34.0, 53.0, 70.0, 121.0, 160.0, 234.0, 380.0, 750.0, 1453.0, 3164.0, 8769.0, 40243.0, 4078977.0, 44123.0, 8984.0, 3324.0, 1445.0, 733.0, 391.0, 248.0, 147.0, 105.0, 71.0, 60.0, 37.0, 29.0, 16.0, 16.0, 5.0, 7.0, 3.0, 1.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.875, -176.6796875, -170.484375, -164.2890625, -158.09375, -151.8984375, -145.703125, -139.5078125, -133.3125, -127.1171875, -120.921875, -114.7265625, -108.53125, -102.3359375, -96.140625, -89.9453125, -83.75, -77.5546875, -71.359375, -65.1640625, -58.96875, -52.7734375, -46.578125, -40.3828125, -34.1875, -27.9921875, -21.796875, -15.6015625, -9.40625, -3.2109375, 2.984375, 9.1796875, 15.375, 21.5703125, 27.765625, 33.9609375, 40.15625, 46.3515625, 52.546875, 58.7421875, 64.9375, 71.1328125, 77.328125, 83.5234375, 89.71875, 95.9140625, 102.109375, 108.3046875, 114.5, 120.6953125, 126.890625, 133.0859375, 139.28125, 145.4765625, 151.671875, 157.8671875, 164.0625, 170.2578125, 176.453125, 182.6484375, 188.84375, 195.0390625, 201.234375, 207.4296875, 213.625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 4.0, 3.0, 2.0, 11.0, 13.0, 39.0, 195.0, 3688.0, 57.0, 26.0, 18.0, 7.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-86.75, -84.8720703125, -82.994140625, -81.1162109375, -79.23828125, -77.3603515625, -75.482421875, -73.6044921875, -71.7265625, -69.8486328125, -67.970703125, -66.0927734375, -64.21484375, -62.3369140625, -60.458984375, -58.5810546875, -56.703125, -54.8251953125, -52.947265625, -51.0693359375, -49.19140625, -47.3134765625, -45.435546875, -43.5576171875, -41.6796875, -39.8017578125, -37.923828125, -36.0458984375, -34.16796875, -32.2900390625, -30.412109375, -28.5341796875, -26.65625, -24.7783203125, -22.900390625, -21.0224609375, -19.14453125, -17.2666015625, -15.388671875, -13.5107421875, -11.6328125, -9.7548828125, -7.876953125, -5.9990234375, -4.12109375, -2.2431640625, -0.365234375, 1.5126953125, 3.390625, 5.2685546875, 7.146484375, 9.0244140625, 10.90234375, 12.7802734375, 14.658203125, 16.5361328125, 18.4140625, 20.2919921875, 22.169921875, 24.0478515625, 25.92578125, 27.8037109375, 29.681640625, 31.5595703125, 33.4375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 14.0, 11.0, 33.0, 89.0, 145.0, 278.0, 230.0, 126.0, 44.0, 17.0, 6.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.8420104980469, -292.5265197753906, -285.21099853515625, -277.8955078125, -270.58001708984375, -263.2644958496094, -255.94900512695312, -248.6334991455078, -241.3179931640625, -234.0024871826172, -226.68699645996094, -219.37149047851562, -212.0559844970703, -204.740478515625, -197.42498779296875, -190.10948181152344, -182.79397583007812, -175.4784698486328, -168.16297912597656, -160.84747314453125, -153.53196716308594, -146.21646118164062, -138.90097045898438, -131.58546447753906, -124.26997375488281, -116.95447540283203, -109.63896942138672, -102.32347106933594, -95.00796508789062, -87.69246673583984, -80.37696838378906, -73.06146240234375, -65.74595642089844, -58.43045425415039, -51.114952087402344, -43.79945373535156, -36.48394775390625, -29.16844940185547, -21.852947235107422, -14.537445068359375, -7.221942901611328, 0.09355878829956055, 7.409060478210449, 14.72456169128418, 22.040063858032227, 29.35556411743164, 36.67106628417969, 43.986568450927734, 51.30207061767578, 58.61757278442383, 65.93307495117188, 73.24857330322266, 80.56407928466797, 87.87957763671875, 95.19508361816406, 102.51058197021484, 109.82608032226562, 117.1415786743164, 124.45708465576172, 131.7725830078125, 139.0880889892578, 146.40359497070312, 153.71908569335938, 161.0345916748047, 168.35009765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 3.0, 3.0, 9.0, 9.0, 15.0, 18.0, 15.0, 30.0, 27.0, 36.0, 33.0, 42.0, 51.0, 45.0, 64.0, 49.0, 68.0, 51.0, 46.0, 52.0, 44.0, 52.0, 36.0, 34.0, 39.0, 24.0, 24.0, 20.0, 16.0, 12.0, 7.0, 9.0, 7.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.61791229248047, -83.47785949707031, -80.33780670166016, -77.19775390625, -74.05770111083984, -70.91764831542969, -67.777587890625, -64.63754272460938, -61.49748611450195, -58.3574333190918, -55.21738052368164, -52.07732391357422, -48.93727111816406, -45.797218322753906, -42.65716552734375, -39.517112731933594, -36.37705993652344, -33.23700714111328, -30.096954345703125, -26.956899642944336, -23.81684684753418, -20.676794052124023, -17.536739349365234, -14.396686553955078, -11.256633758544922, -8.116580963134766, -4.976527214050293, -1.8364734649658203, 1.303579330444336, 4.443632125854492, 7.583686828613281, 10.723739624023438, 13.863792419433594, 17.00384521484375, 20.143898010253906, 23.283952713012695, 26.42400550842285, 29.564058303833008, 32.7041130065918, 35.84416580200195, 38.98421859741211, 42.124271392822266, 45.26432418823242, 48.404380798339844, 51.54443359375, 54.684486389160156, 57.82453918457031, 60.96459197998047, 64.10464477539062, 67.24469757080078, 70.38475036621094, 73.5248031616211, 76.66485595703125, 79.8049087524414, 82.94496154785156, 86.08502197265625, 89.22506713867188, 92.36511993408203, 95.50517272949219, 98.64522552490234, 101.7852783203125, 104.92533111572266, 108.06538391113281, 111.2054443359375, 114.34549713134766]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 12.0, 5.0, 16.0, 25.0, 30.0, 46.0, 74.0, 135.0, 209.0, 325.0, 627.0, 1201.0, 2334.0, 4865.0, 11409.0, 28252.0, 77227.0, 218014.0, 373534.0, 208810.0, 73911.0, 26802.0, 10894.0, 4929.0, 2277.0, 1135.0, 594.0, 311.0, 216.0, 100.0, 73.0, 66.0, 38.0, 16.0, 13.0, 5.0, 10.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.6875, -83.1279296875, -80.568359375, -78.0087890625, -75.44921875, -72.8896484375, -70.330078125, -67.7705078125, -65.2109375, -62.6513671875, -60.091796875, -57.5322265625, -54.97265625, -52.4130859375, -49.853515625, -47.2939453125, -44.734375, -42.1748046875, -39.615234375, -37.0556640625, -34.49609375, -31.9365234375, -29.376953125, -26.8173828125, -24.2578125, -21.6982421875, -19.138671875, -16.5791015625, -14.01953125, -11.4599609375, -8.900390625, -6.3408203125, -3.78125, -1.2216796875, 1.337890625, 3.8974609375, 6.45703125, 9.0166015625, 11.576171875, 14.1357421875, 16.6953125, 19.2548828125, 21.814453125, 24.3740234375, 26.93359375, 29.4931640625, 32.052734375, 34.6123046875, 37.171875, 39.7314453125, 42.291015625, 44.8505859375, 47.41015625, 49.9697265625, 52.529296875, 55.0888671875, 57.6484375, 60.2080078125, 62.767578125, 65.3271484375, 67.88671875, 70.4462890625, 73.005859375, 75.5654296875, 78.125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 8.0, 9.0, 17.0, 8.0, 11.0, 23.0, 28.0, 36.0, 41.0, 48.0, 40.0, 50.0, 60.0, 69.0, 73.0, 68.0, 43.0, 49.0, 60.0, 47.0, 51.0, 36.0, 28.0, 26.0, 18.0, 7.0, 14.0, 4.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-43.0, -41.910888671875, -40.82177734375, -39.732666015625, -38.6435546875, -37.554443359375, -36.46533203125, -35.376220703125, -34.287109375, -33.197998046875, -32.10888671875, -31.019775390625, -29.9306640625, -28.841552734375, -27.75244140625, -26.663330078125, -25.57421875, -24.485107421875, -23.39599609375, -22.306884765625, -21.2177734375, -20.128662109375, -19.03955078125, -17.950439453125, -16.861328125, -15.772216796875, -14.68310546875, -13.593994140625, -12.5048828125, -11.415771484375, -10.32666015625, -9.237548828125, -8.1484375, -7.059326171875, -5.97021484375, -4.881103515625, -3.7919921875, -2.702880859375, -1.61376953125, -0.524658203125, 0.564453125, 1.653564453125, 2.74267578125, 3.831787109375, 4.9208984375, 6.010009765625, 7.09912109375, 8.188232421875, 9.27734375, 10.366455078125, 11.45556640625, 12.544677734375, 13.6337890625, 14.722900390625, 15.81201171875, 16.901123046875, 17.990234375, 19.079345703125, 20.16845703125, 21.257568359375, 22.3466796875, 23.435791015625, 24.52490234375, 25.614013671875, 26.703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 4.0, 14.0, 8.0, 13.0, 21.0, 31.0, 28.0, 42.0, 68.0, 82.0, 99.0, 125.0, 184.0, 304.0, 464.0, 765.0, 1554.0, 3577.0, 10239.0, 37351.0, 194151.0, 600482.0, 152548.0, 30879.0, 8869.0, 3260.0, 1312.0, 691.0, 422.0, 276.0, 174.0, 139.0, 71.0, 77.0, 56.0, 39.0, 39.0, 25.0, 22.0, 8.0, 9.0, 9.0, 10.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-145.0, -140.529296875, -136.05859375, -131.587890625, -127.1171875, -122.646484375, -118.17578125, -113.705078125, -109.234375, -104.763671875, -100.29296875, -95.822265625, -91.3515625, -86.880859375, -82.41015625, -77.939453125, -73.46875, -68.998046875, -64.52734375, -60.056640625, -55.5859375, -51.115234375, -46.64453125, -42.173828125, -37.703125, -33.232421875, -28.76171875, -24.291015625, -19.8203125, -15.349609375, -10.87890625, -6.408203125, -1.9375, 2.533203125, 7.00390625, 11.474609375, 15.9453125, 20.416015625, 24.88671875, 29.357421875, 33.828125, 38.298828125, 42.76953125, 47.240234375, 51.7109375, 56.181640625, 60.65234375, 65.123046875, 69.59375, 74.064453125, 78.53515625, 83.005859375, 87.4765625, 91.947265625, 96.41796875, 100.888671875, 105.359375, 109.830078125, 114.30078125, 118.771484375, 123.2421875, 127.712890625, 132.18359375, 136.654296875, 141.125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 14.0, 13.0, 13.0, 15.0, 17.0, 19.0, 18.0, 24.0, 27.0, 31.0, 33.0, 36.0, 31.0, 47.0, 40.0, 45.0, 57.0, 55.0, 38.0, 52.0, 27.0, 33.0, 36.0, 38.0, 30.0, 31.0, 19.0, 23.0, 24.0, 15.0, 18.0, 8.0, 13.0, 6.0, 9.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-156.0, -151.03515625, -146.0703125, -141.10546875, -136.140625, -131.17578125, -126.2109375, -121.24609375, -116.28125, -111.31640625, -106.3515625, -101.38671875, -96.421875, -91.45703125, -86.4921875, -81.52734375, -76.5625, -71.59765625, -66.6328125, -61.66796875, -56.703125, -51.73828125, -46.7734375, -41.80859375, -36.84375, -31.87890625, -26.9140625, -21.94921875, -16.984375, -12.01953125, -7.0546875, -2.08984375, 2.875, 7.83984375, 12.8046875, 17.76953125, 22.734375, 27.69921875, 32.6640625, 37.62890625, 42.59375, 47.55859375, 52.5234375, 57.48828125, 62.453125, 67.41796875, 72.3828125, 77.34765625, 82.3125, 87.27734375, 92.2421875, 97.20703125, 102.171875, 107.13671875, 112.1015625, 117.06640625, 122.03125, 126.99609375, 131.9609375, 136.92578125, 141.890625, 146.85546875, 151.8203125, 156.78515625, 161.75]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 10.0, 17.0, 22.0, 31.0, 57.0, 98.0, 186.0, 283.0, 648.0, 1522.0, 5126.0, 23035.0, 288949.0, 672642.0, 44166.0, 7733.0, 2259.0, 824.0, 415.0, 217.0, 103.0, 62.0, 43.0, 40.0, 15.0, 12.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-116.8125, -113.6689453125, -110.525390625, -107.3818359375, -104.23828125, -101.0947265625, -97.951171875, -94.8076171875, -91.6640625, -88.5205078125, -85.376953125, -82.2333984375, -79.08984375, -75.9462890625, -72.802734375, -69.6591796875, -66.515625, -63.3720703125, -60.228515625, -57.0849609375, -53.94140625, -50.7978515625, -47.654296875, -44.5107421875, -41.3671875, -38.2236328125, -35.080078125, -31.9365234375, -28.79296875, -25.6494140625, -22.505859375, -19.3623046875, -16.21875, -13.0751953125, -9.931640625, -6.7880859375, -3.64453125, -0.5009765625, 2.642578125, 5.7861328125, 8.9296875, 12.0732421875, 15.216796875, 18.3603515625, 21.50390625, 24.6474609375, 27.791015625, 30.9345703125, 34.078125, 37.2216796875, 40.365234375, 43.5087890625, 46.65234375, 49.7958984375, 52.939453125, 56.0830078125, 59.2265625, 62.3701171875, 65.513671875, 68.6572265625, 71.80078125, 74.9443359375, 78.087890625, 81.2314453125, 84.375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 8.0, 2.0, 8.0, 4.0, 14.0, 14.0, 14.0, 21.0, 36.0, 32.0, 53.0, 57.0, 71.0, 89.0, 91.0, 92.0, 71.0, 72.0, 45.0, 49.0, 41.0, 23.0, 20.0, 10.0, 11.0, 12.0, 8.0, 12.0, 1.0, 5.0, 3.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00719451904296875, -0.006953120231628418, -0.006711721420288086, -0.006470322608947754, -0.006228923797607422, -0.00598752498626709, -0.005746126174926758, -0.005504727363586426, -0.005263328552246094, -0.005021929740905762, -0.00478053092956543, -0.004539132118225098, -0.004297733306884766, -0.004056334495544434, -0.0038149356842041016, -0.0035735368728637695, -0.0033321380615234375, -0.0030907392501831055, -0.0028493404388427734, -0.0026079416275024414, -0.0023665428161621094, -0.0021251440048217773, -0.0018837451934814453, -0.0016423463821411133, -0.0014009475708007812, -0.0011595487594604492, -0.0009181499481201172, -0.0006767511367797852, -0.0004353523254394531, -0.0001939535140991211, 4.744529724121094e-05, 0.00028884410858154297, 0.000530242919921875, 0.000771641731262207, 0.001013040542602539, 0.001254439353942871, 0.0014958381652832031, 0.0017372369766235352, 0.001978635787963867, 0.0022200345993041992, 0.0024614334106445312, 0.0027028322219848633, 0.0029442310333251953, 0.0031856298446655273, 0.0034270286560058594, 0.0036684274673461914, 0.0039098262786865234, 0.0041512250900268555, 0.0043926239013671875, 0.0046340227127075195, 0.0048754215240478516, 0.005116820335388184, 0.005358219146728516, 0.005599617958068848, 0.00584101676940918, 0.006082415580749512, 0.006323814392089844, 0.006565213203430176, 0.006806612014770508, 0.00704801082611084, 0.007289409637451172, 0.007530808448791504, 0.007772207260131836, 0.008013606071472168, 0.0082550048828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 15.0, 20.0, 16.0, 31.0, 46.0, 100.0, 200.0, 478.0, 1529.0, 11237.0, 797383.0, 229869.0, 5758.0, 1108.0, 326.0, 188.0, 93.0, 47.0, 32.0, 19.0, 16.0, 10.0, 9.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.25, -136.955078125, -131.66015625, -126.365234375, -121.0703125, -115.775390625, -110.48046875, -105.185546875, -99.890625, -94.595703125, -89.30078125, -84.005859375, -78.7109375, -73.416015625, -68.12109375, -62.826171875, -57.53125, -52.236328125, -46.94140625, -41.646484375, -36.3515625, -31.056640625, -25.76171875, -20.466796875, -15.171875, -9.876953125, -4.58203125, 0.712890625, 6.0078125, 11.302734375, 16.59765625, 21.892578125, 27.1875, 32.482421875, 37.77734375, 43.072265625, 48.3671875, 53.662109375, 58.95703125, 64.251953125, 69.546875, 74.841796875, 80.13671875, 85.431640625, 90.7265625, 96.021484375, 101.31640625, 106.611328125, 111.90625, 117.201171875, 122.49609375, 127.791015625, 133.0859375, 138.380859375, 143.67578125, 148.970703125, 154.265625, 159.560546875, 164.85546875, 170.150390625, 175.4453125, 180.740234375, 186.03515625, 191.330078125, 196.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 12.0, 4.0, 6.0, 8.0, 16.0, 28.0, 44.0, 61.0, 135.0, 194.0, 181.0, 104.0, 80.0, 45.0, 29.0, 17.0, 13.0, 12.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5, -95.328125, -91.15625, -86.984375, -82.8125, -78.640625, -74.46875, -70.296875, -66.125, -61.953125, -57.78125, -53.609375, -49.4375, -45.265625, -41.09375, -36.921875, -32.75, -28.578125, -24.40625, -20.234375, -16.0625, -11.890625, -7.71875, -3.546875, 0.625, 4.796875, 8.96875, 13.140625, 17.3125, 21.484375, 25.65625, 29.828125, 34.0, 38.171875, 42.34375, 46.515625, 50.6875, 54.859375, 59.03125, 63.203125, 67.375, 71.546875, 75.71875, 79.890625, 84.0625, 88.234375, 92.40625, 96.578125, 100.75, 104.921875, 109.09375, 113.265625, 117.4375, 121.609375, 125.78125, 129.953125, 134.125, 138.296875, 142.46875, 146.640625, 150.8125, 154.984375, 159.15625, 163.328125, 167.5]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 14.0, 36.0, 60.0, 148.0, 237.0, 236.0, 139.0, 72.0, 28.0, 14.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2408.574951171875, -2348.70263671875, -2288.830322265625, -2228.957763671875, -2169.08544921875, -2109.213134765625, -2049.3408203125, -1989.468505859375, -1929.5960693359375, -1869.7237548828125, -1809.851318359375, -1749.97900390625, -1690.106689453125, -1630.2342529296875, -1570.3619384765625, -1510.489501953125, -1450.6171875, -1390.744873046875, -1330.8724365234375, -1271.0001220703125, -1211.127685546875, -1151.25537109375, -1091.383056640625, -1031.5107421875, -971.6383056640625, -911.7659301757812, -851.8935546875, -792.021240234375, -732.1488647460938, -672.2764892578125, -612.4041748046875, -552.5317993164062, -492.6593017578125, -432.78692626953125, -372.9145812988281, -313.042236328125, -253.16986083984375, -193.2974853515625, -133.42514038085938, -73.55279541015625, -13.680419921875, 46.19194030761719, 106.06430053710938, 165.93666076660156, 225.80902099609375, 285.681396484375, 345.5537414550781, 405.42608642578125, 465.2984619140625, 525.1708374023438, 585.043212890625, 644.91552734375, 704.7879028320312, 764.6602783203125, 824.5325927734375, 884.4049682617188, 944.27734375, 1004.1497192382812, 1064.0220947265625, 1123.8944091796875, 1183.766845703125, 1243.63916015625, 1303.511474609375, 1363.3837890625, 1423.2562255859375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 9.0, 6.0, 11.0, 15.0, 24.0, 16.0, 25.0, 22.0, 37.0, 35.0, 39.0, 47.0, 46.0, 58.0, 61.0, 44.0, 62.0, 55.0, 48.0, 36.0, 43.0, 32.0, 28.0, 30.0, 25.0, 20.0, 22.0, 17.0, 19.0, 9.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-888.6234130859375, -859.3818359375, -830.1402587890625, -800.898681640625, -771.6571044921875, -742.41552734375, -713.1739501953125, -683.932373046875, -654.6907958984375, -625.44921875, -596.2076416015625, -566.966064453125, -537.7244873046875, -508.48291015625, -479.2413330078125, -449.999755859375, -420.7581787109375, -391.5166015625, -362.2750244140625, -333.033447265625, -303.7918701171875, -274.55029296875, -245.3087158203125, -216.067138671875, -186.8255615234375, -157.583984375, -128.3424072265625, -99.100830078125, -69.8592529296875, -40.61767578125, -11.3760986328125, 17.865478515625, 47.10699462890625, 76.34857177734375, 105.59014892578125, 134.83172607421875, 164.07330322265625, 193.31488037109375, 222.55645751953125, 251.79803466796875, 281.03961181640625, 310.28118896484375, 339.52276611328125, 368.76434326171875, 398.00592041015625, 427.24749755859375, 456.48907470703125, 485.73065185546875, 514.9722290039062, 544.2138061523438, 573.4553833007812, 602.6969604492188, 631.9385375976562, 661.1801147460938, 690.4216918945312, 719.6632690429688, 748.9048461914062, 778.1464233398438, 807.3880004882812, 836.6295776367188, 865.8711547851562, 895.1127319335938, 924.3543090820312, 953.5958862304688, 982.8374633789062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 11.0, 18.0, 24.0, 23.0, 45.0, 55.0, 107.0, 154.0, 269.0, 569.0, 1483.0, 4676.0, 28810.0, 4131561.0, 20176.0, 3994.0, 1227.0, 501.0, 212.0, 115.0, 68.0, 55.0, 29.0, 19.0, 15.0, 10.0, 9.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-278.5, -271.609375, -264.71875, -257.828125, -250.9375, -244.046875, -237.15625, -230.265625, -223.375, -216.484375, -209.59375, -202.703125, -195.8125, -188.921875, -182.03125, -175.140625, -168.25, -161.359375, -154.46875, -147.578125, -140.6875, -133.796875, -126.90625, -120.015625, -113.125, -106.234375, -99.34375, -92.453125, -85.5625, -78.671875, -71.78125, -64.890625, -58.0, -51.109375, -44.21875, -37.328125, -30.4375, -23.546875, -16.65625, -9.765625, -2.875, 4.015625, 10.90625, 17.796875, 24.6875, 31.578125, 38.46875, 45.359375, 52.25, 59.140625, 66.03125, 72.921875, 79.8125, 86.703125, 93.59375, 100.484375, 107.375, 114.265625, 121.15625, 128.046875, 134.9375, 141.828125, 148.71875, 155.609375, 162.5]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 12.0, 13.0, 20.0, 13.0, 30.0, 16.0, 30.0, 41.0, 40.0, 41.0, 72.0, 52.0, 80.0, 72.0, 74.0, 69.0, 64.0, 44.0, 35.0, 33.0, 24.0, 23.0, 21.0, 21.0, 16.0, 13.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.375, -44.015625, -42.65625, -41.296875, -39.9375, -38.578125, -37.21875, -35.859375, -34.5, -33.140625, -31.78125, -30.421875, -29.0625, -27.703125, -26.34375, -24.984375, -23.625, -22.265625, -20.90625, -19.546875, -18.1875, -16.828125, -15.46875, -14.109375, -12.75, -11.390625, -10.03125, -8.671875, -7.3125, -5.953125, -4.59375, -3.234375, -1.875, -0.515625, 0.84375, 2.203125, 3.5625, 4.921875, 6.28125, 7.640625, 9.0, 10.359375, 11.71875, 13.078125, 14.4375, 15.796875, 17.15625, 18.515625, 19.875, 21.234375, 22.59375, 23.953125, 25.3125, 26.671875, 28.03125, 29.390625, 30.75, 32.109375, 33.46875, 34.828125, 36.1875, 37.546875, 38.90625, 40.265625, 41.625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 11.0, 9.0, 14.0, 18.0, 21.0, 19.0, 32.0, 43.0, 56.0, 111.0, 145.0, 303.0, 546.0, 1156.0, 2993.0, 9472.0, 74295.0, 4078634.0, 18460.0, 4568.0, 1679.0, 695.0, 357.0, 220.0, 118.0, 74.0, 64.0, 44.0, 33.0, 16.0, 19.0, 21.0, 11.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-347.75, -337.875, -328.0, -318.125, -308.25, -298.375, -288.5, -278.625, -268.75, -258.875, -249.0, -239.125, -229.25, -219.375, -209.5, -199.625, -189.75, -179.875, -170.0, -160.125, -150.25, -140.375, -130.5, -120.625, -110.75, -100.875, -91.0, -81.125, -71.25, -61.375, -51.5, -41.625, -31.75, -21.875, -12.0, -2.125, 7.75, 17.625, 27.5, 37.375, 47.25, 57.125, 67.0, 76.875, 86.75, 96.625, 106.5, 116.375, 126.25, 136.125, 146.0, 155.875, 165.75, 175.625, 185.5, 195.375, 205.25, 215.125, 225.0, 234.875, 244.75, 254.625, 264.5, 274.375, 284.25]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 13.0, 14.0, 35.0, 266.0, 3613.0, 52.0, 24.0, 16.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.0625, -94.64111328125, -92.2197265625, -89.79833984375, -87.376953125, -84.95556640625, -82.5341796875, -80.11279296875, -77.69140625, -75.27001953125, -72.8486328125, -70.42724609375, -68.005859375, -65.58447265625, -63.1630859375, -60.74169921875, -58.3203125, -55.89892578125, -53.4775390625, -51.05615234375, -48.634765625, -46.21337890625, -43.7919921875, -41.37060546875, -38.94921875, -36.52783203125, -34.1064453125, -31.68505859375, -29.263671875, -26.84228515625, -24.4208984375, -21.99951171875, -19.578125, -17.15673828125, -14.7353515625, -12.31396484375, -9.892578125, -7.47119140625, -5.0498046875, -2.62841796875, -0.20703125, 2.21435546875, 4.6357421875, 7.05712890625, 9.478515625, 11.89990234375, 14.3212890625, 16.74267578125, 19.1640625, 21.58544921875, 24.0068359375, 26.42822265625, 28.849609375, 31.27099609375, 33.6923828125, 36.11376953125, 38.53515625, 40.95654296875, 43.3779296875, 45.79931640625, 48.220703125, 50.64208984375, 53.0634765625, 55.48486328125, 57.90625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 30.0, 83.0, 237.0, 386.0, 185.0, 51.0, 16.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.79632568359375, -246.5220947265625, -229.24786376953125, -211.9736328125, -194.69940185546875, -177.4251708984375, -160.15093994140625, -142.876708984375, -125.60247802734375, -108.3282470703125, -91.05401611328125, -73.77978515625, -56.50555419921875, -39.2313232421875, -21.95709228515625, -4.682861328125, 12.59136962890625, 29.8656005859375, 47.13983154296875, 64.4140625, 81.68829345703125, 98.9625244140625, 116.23675537109375, 133.510986328125, 150.78521728515625, 168.0594482421875, 185.33367919921875, 202.60791015625, 219.88214111328125, 237.1563720703125, 254.43060302734375, 271.704833984375, 288.9791259765625, 306.25335693359375, 323.527587890625, 340.80181884765625, 358.0760498046875, 375.35028076171875, 392.62451171875, 409.89874267578125, 427.1729736328125, 444.44720458984375, 461.721435546875, 478.99566650390625, 496.2698974609375, 513.5441284179688, 530.818359375, 548.0925903320312, 565.3668212890625, 582.6410522460938, 599.915283203125, 617.1895141601562, 634.4637451171875, 651.7379760742188, 669.01220703125, 686.2864379882812, 703.5606689453125, 720.8348999023438, 738.109130859375, 755.3833618164062, 772.6575927734375, 789.9318237304688, 807.2060546875, 824.4802856445312, 841.7545166015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 8.0, 8.0, 7.0, 25.0, 19.0, 27.0, 27.0, 18.0, 30.0, 30.0, 30.0, 43.0, 49.0, 50.0, 44.0, 52.0, 38.0, 51.0, 54.0, 48.0, 41.0, 37.0, 34.0, 27.0, 32.0, 28.0, 28.0, 19.0, 16.0, 24.0, 13.0, 6.0, 9.0, 7.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.3844985961914, -107.6120834350586, -103.83966827392578, -100.06725311279297, -96.29484558105469, -92.52243041992188, -88.75001525878906, -84.97760009765625, -81.20518493652344, -77.43276977539062, -73.66035461425781, -69.887939453125, -66.11552429199219, -62.34311294555664, -58.570701599121094, -54.79828643798828, -51.02587127685547, -47.253456115722656, -43.481040954589844, -39.7086296081543, -35.936214447021484, -32.16379928588867, -28.391386032104492, -24.618972778320312, -20.8465576171875, -17.074142456054688, -13.301729202270508, -9.529314994812012, -5.756900787353516, -1.9844856262207031, 1.7879276275634766, 5.560340881347656, 9.332763671875, 13.105177879333496, 16.877592086791992, 20.650005340576172, 24.422420501708984, 28.194835662841797, 31.967248916625977, 35.739662170410156, 39.51207733154297, 43.28449249267578, 47.056907653808594, 50.82931900024414, 54.60173416137695, 58.374149322509766, 62.14656066894531, 65.91897583007812, 69.69139099121094, 73.46380615234375, 77.23622131347656, 81.00863647460938, 84.78105163574219, 88.553466796875, 92.32587432861328, 96.0982894897461, 99.8707046508789, 103.64311981201172, 107.41553497314453, 111.18795013427734, 114.96035766601562, 118.73277282714844, 122.50518798828125, 126.27760314941406, 130.05001831054688]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 13.0, 17.0, 23.0, 48.0, 49.0, 85.0, 110.0, 186.0, 301.0, 463.0, 827.0, 1479.0, 2687.0, 4997.0, 9925.0, 20199.0, 42902.0, 97184.0, 222014.0, 317765.0, 179319.0, 78522.0, 34929.0, 16617.0, 8306.0, 4162.0, 2252.0, 1190.0, 730.0, 437.0, 245.0, 188.0, 125.0, 73.0, 49.0, 23.0, 34.0, 24.0, 7.0, 8.0, 12.0, 6.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-64.25, -61.90234375, -59.5546875, -57.20703125, -54.859375, -52.51171875, -50.1640625, -47.81640625, -45.46875, -43.12109375, -40.7734375, -38.42578125, -36.078125, -33.73046875, -31.3828125, -29.03515625, -26.6875, -24.33984375, -21.9921875, -19.64453125, -17.296875, -14.94921875, -12.6015625, -10.25390625, -7.90625, -5.55859375, -3.2109375, -0.86328125, 1.484375, 3.83203125, 6.1796875, 8.52734375, 10.875, 13.22265625, 15.5703125, 17.91796875, 20.265625, 22.61328125, 24.9609375, 27.30859375, 29.65625, 32.00390625, 34.3515625, 36.69921875, 39.046875, 41.39453125, 43.7421875, 46.08984375, 48.4375, 50.78515625, 53.1328125, 55.48046875, 57.828125, 60.17578125, 62.5234375, 64.87109375, 67.21875, 69.56640625, 71.9140625, 74.26171875, 76.609375, 78.95703125, 81.3046875, 83.65234375, 86.0]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 3.0, 9.0, 4.0, 9.0, 8.0, 14.0, 15.0, 22.0, 20.0, 21.0, 35.0, 47.0, 52.0, 60.0, 65.0, 44.0, 64.0, 67.0, 69.0, 65.0, 58.0, 45.0, 38.0, 33.0, 29.0, 28.0, 13.0, 18.0, 10.0, 14.0, 7.0, 5.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.1875, -45.7919921875, -44.396484375, -43.0009765625, -41.60546875, -40.2099609375, -38.814453125, -37.4189453125, -36.0234375, -34.6279296875, -33.232421875, -31.8369140625, -30.44140625, -29.0458984375, -27.650390625, -26.2548828125, -24.859375, -23.4638671875, -22.068359375, -20.6728515625, -19.27734375, -17.8818359375, -16.486328125, -15.0908203125, -13.6953125, -12.2998046875, -10.904296875, -9.5087890625, -8.11328125, -6.7177734375, -5.322265625, -3.9267578125, -2.53125, -1.1357421875, 0.259765625, 1.6552734375, 3.05078125, 4.4462890625, 5.841796875, 7.2373046875, 8.6328125, 10.0283203125, 11.423828125, 12.8193359375, 14.21484375, 15.6103515625, 17.005859375, 18.4013671875, 19.796875, 21.1923828125, 22.587890625, 23.9833984375, 25.37890625, 26.7744140625, 28.169921875, 29.5654296875, 30.9609375, 32.3564453125, 33.751953125, 35.1474609375, 36.54296875, 37.9384765625, 39.333984375, 40.7294921875, 42.125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 12.0, 13.0, 7.0, 20.0, 44.0, 33.0, 53.0, 91.0, 102.0, 189.0, 251.0, 481.0, 819.0, 1731.0, 4351.0, 15427.0, 88751.0, 627866.0, 261675.0, 33338.0, 7719.0, 2663.0, 1203.0, 623.0, 328.0, 224.0, 134.0, 112.0, 75.0, 58.0, 39.0, 25.0, 19.0, 18.0, 21.0, 12.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-214.375, -208.205078125, -202.03515625, -195.865234375, -189.6953125, -183.525390625, -177.35546875, -171.185546875, -165.015625, -158.845703125, -152.67578125, -146.505859375, -140.3359375, -134.166015625, -127.99609375, -121.826171875, -115.65625, -109.486328125, -103.31640625, -97.146484375, -90.9765625, -84.806640625, -78.63671875, -72.466796875, -66.296875, -60.126953125, -53.95703125, -47.787109375, -41.6171875, -35.447265625, -29.27734375, -23.107421875, -16.9375, -10.767578125, -4.59765625, 1.572265625, 7.7421875, 13.912109375, 20.08203125, 26.251953125, 32.421875, 38.591796875, 44.76171875, 50.931640625, 57.1015625, 63.271484375, 69.44140625, 75.611328125, 81.78125, 87.951171875, 94.12109375, 100.291015625, 106.4609375, 112.630859375, 118.80078125, 124.970703125, 131.140625, 137.310546875, 143.48046875, 149.650390625, 155.8203125, 161.990234375, 168.16015625, 174.330078125, 180.5]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 8.0, 7.0, 9.0, 11.0, 10.0, 15.0, 25.0, 22.0, 30.0, 29.0, 33.0, 32.0, 36.0, 46.0, 45.0, 57.0, 64.0, 54.0, 61.0, 48.0, 51.0, 42.0, 44.0, 45.0, 29.0, 24.0, 18.0, 19.0, 18.0, 15.0, 13.0, 11.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-206.375, -199.734375, -193.09375, -186.453125, -179.8125, -173.171875, -166.53125, -159.890625, -153.25, -146.609375, -139.96875, -133.328125, -126.6875, -120.046875, -113.40625, -106.765625, -100.125, -93.484375, -86.84375, -80.203125, -73.5625, -66.921875, -60.28125, -53.640625, -47.0, -40.359375, -33.71875, -27.078125, -20.4375, -13.796875, -7.15625, -0.515625, 6.125, 12.765625, 19.40625, 26.046875, 32.6875, 39.328125, 45.96875, 52.609375, 59.25, 65.890625, 72.53125, 79.171875, 85.8125, 92.453125, 99.09375, 105.734375, 112.375, 119.015625, 125.65625, 132.296875, 138.9375, 145.578125, 152.21875, 158.859375, 165.5, 172.140625, 178.78125, 185.421875, 192.0625, 198.703125, 205.34375, 211.984375, 218.625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 2.0, 8.0, 4.0, 16.0, 21.0, 38.0, 57.0, 84.0, 160.0, 282.0, 540.0, 1250.0, 3285.0, 11081.0, 59179.0, 597620.0, 327474.0, 35385.0, 7615.0, 2501.0, 945.0, 430.0, 225.0, 130.0, 74.0, 48.0, 28.0, 27.0, 18.0, 9.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-129.375, -126.208984375, -123.04296875, -119.876953125, -116.7109375, -113.544921875, -110.37890625, -107.212890625, -104.046875, -100.880859375, -97.71484375, -94.548828125, -91.3828125, -88.216796875, -85.05078125, -81.884765625, -78.71875, -75.552734375, -72.38671875, -69.220703125, -66.0546875, -62.888671875, -59.72265625, -56.556640625, -53.390625, -50.224609375, -47.05859375, -43.892578125, -40.7265625, -37.560546875, -34.39453125, -31.228515625, -28.0625, -24.896484375, -21.73046875, -18.564453125, -15.3984375, -12.232421875, -9.06640625, -5.900390625, -2.734375, 0.431640625, 3.59765625, 6.763671875, 9.9296875, 13.095703125, 16.26171875, 19.427734375, 22.59375, 25.759765625, 28.92578125, 32.091796875, 35.2578125, 38.423828125, 41.58984375, 44.755859375, 47.921875, 51.087890625, 54.25390625, 57.419921875, 60.5859375, 63.751953125, 66.91796875, 70.083984375, 73.25]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 12.0, 10.0, 12.0, 25.0, 14.0, 19.0, 40.0, 54.0, 61.0, 85.0, 89.0, 96.0, 88.0, 93.0, 76.0, 52.0, 42.0, 30.0, 26.0, 27.0, 12.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01181793212890625, -0.011406183242797852, -0.010994434356689453, -0.010582685470581055, -0.010170936584472656, -0.009759187698364258, -0.00934743881225586, -0.008935689926147461, -0.008523941040039062, -0.008112192153930664, -0.007700443267822266, -0.007288694381713867, -0.006876945495605469, -0.00646519660949707, -0.006053447723388672, -0.0056416988372802734, -0.005229949951171875, -0.0048182010650634766, -0.004406452178955078, -0.00399470329284668, -0.0035829544067382812, -0.003171205520629883, -0.0027594566345214844, -0.002347707748413086, -0.0019359588623046875, -0.001524209976196289, -0.0011124610900878906, -0.0007007122039794922, -0.00028896331787109375, 0.0001227855682373047, 0.0005345344543457031, 0.0009462833404541016, 0.0013580322265625, 0.0017697811126708984, 0.002181529998779297, 0.0025932788848876953, 0.0030050277709960938, 0.003416776657104492, 0.0038285255432128906, 0.004240274429321289, 0.0046520233154296875, 0.005063772201538086, 0.005475521087646484, 0.005887269973754883, 0.006299018859863281, 0.00671076774597168, 0.007122516632080078, 0.0075342655181884766, 0.007946014404296875, 0.008357763290405273, 0.008769512176513672, 0.00918126106262207, 0.009593009948730469, 0.010004758834838867, 0.010416507720947266, 0.010828256607055664, 0.011240005493164062, 0.011651754379272461, 0.01206350326538086, 0.012475252151489258, 0.012887001037597656, 0.013298749923706055, 0.013710498809814453, 0.014122247695922852, 0.01453399658203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 6.0, 14.0, 17.0, 13.0, 31.0, 64.0, 72.0, 154.0, 308.0, 660.0, 1612.0, 5538.0, 31498.0, 566033.0, 410223.0, 24741.0, 4854.0, 1451.0, 633.0, 284.0, 131.0, 76.0, 36.0, 32.0, 22.0, 9.0, 12.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-109.625, -105.556640625, -101.48828125, -97.419921875, -93.3515625, -89.283203125, -85.21484375, -81.146484375, -77.078125, -73.009765625, -68.94140625, -64.873046875, -60.8046875, -56.736328125, -52.66796875, -48.599609375, -44.53125, -40.462890625, -36.39453125, -32.326171875, -28.2578125, -24.189453125, -20.12109375, -16.052734375, -11.984375, -7.916015625, -3.84765625, 0.220703125, 4.2890625, 8.357421875, 12.42578125, 16.494140625, 20.5625, 24.630859375, 28.69921875, 32.767578125, 36.8359375, 40.904296875, 44.97265625, 49.041015625, 53.109375, 57.177734375, 61.24609375, 65.314453125, 69.3828125, 73.451171875, 77.51953125, 81.587890625, 85.65625, 89.724609375, 93.79296875, 97.861328125, 101.9296875, 105.998046875, 110.06640625, 114.134765625, 118.203125, 122.271484375, 126.33984375, 130.408203125, 134.4765625, 138.544921875, 142.61328125, 146.681640625, 150.75]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 5.0, 11.0, 17.0, 32.0, 42.0, 50.0, 83.0, 89.0, 118.0, 133.0, 104.0, 100.0, 77.0, 45.0, 33.0, 24.0, 9.0, 8.0, 6.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-109.0625, -105.4658203125, -101.869140625, -98.2724609375, -94.67578125, -91.0791015625, -87.482421875, -83.8857421875, -80.2890625, -76.6923828125, -73.095703125, -69.4990234375, -65.90234375, -62.3056640625, -58.708984375, -55.1123046875, -51.515625, -47.9189453125, -44.322265625, -40.7255859375, -37.12890625, -33.5322265625, -29.935546875, -26.3388671875, -22.7421875, -19.1455078125, -15.548828125, -11.9521484375, -8.35546875, -4.7587890625, -1.162109375, 2.4345703125, 6.03125, 9.6279296875, 13.224609375, 16.8212890625, 20.41796875, 24.0146484375, 27.611328125, 31.2080078125, 34.8046875, 38.4013671875, 41.998046875, 45.5947265625, 49.19140625, 52.7880859375, 56.384765625, 59.9814453125, 63.578125, 67.1748046875, 70.771484375, 74.3681640625, 77.96484375, 81.5615234375, 85.158203125, 88.7548828125, 92.3515625, 95.9482421875, 99.544921875, 103.1416015625, 106.73828125, 110.3349609375, 113.931640625, 117.5283203125, 121.125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 9.0, 23.0, 44.0, 76.0, 118.0, 138.0, 173.0, 148.0, 96.0, 68.0, 44.0, 19.0, 11.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1333.699951171875, -1287.9351806640625, -1242.1705322265625, -1196.40576171875, -1150.6409912109375, -1104.8763427734375, -1059.111572265625, -1013.3468627929688, -967.5821533203125, -921.8174438476562, -876.0526733398438, -830.2879638671875, -784.5232543945312, -738.758544921875, -692.9937744140625, -647.2290649414062, -601.4642944335938, -555.6995849609375, -509.9348449707031, -464.17010498046875, -418.4053955078125, -372.6406555175781, -326.87591552734375, -281.1112060546875, -235.34646606445312, -189.5817413330078, -143.8170166015625, -98.05227661132812, -52.28755187988281, -6.5228271484375, 39.241912841796875, 85.00662231445312, 130.7713623046875, 176.5360870361328, 222.30081176757812, 268.0655517578125, 313.83026123046875, 359.5950012207031, 405.3597412109375, 451.12445068359375, 496.8891906738281, 542.6539306640625, 588.4186401367188, 634.183349609375, 679.9481201171875, 725.7128295898438, 771.4775390625, 817.2423095703125, 863.0070190429688, 908.771728515625, 954.5364990234375, 1000.3012084960938, 1046.06591796875, 1091.8306884765625, 1137.595458984375, 1183.360107421875, 1229.1248779296875, 1274.8896484375, 1320.654296875, 1366.4190673828125, 1412.183837890625, 1457.948486328125, 1503.7132568359375, 1549.47802734375, 1595.24267578125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 6.0, 3.0, 5.0, 8.0, 7.0, 17.0, 9.0, 21.0, 22.0, 27.0, 22.0, 28.0, 31.0, 31.0, 46.0, 37.0, 46.0, 46.0, 41.0, 51.0, 54.0, 42.0, 43.0, 50.0, 37.0, 22.0, 37.0, 42.0, 23.0, 21.0, 25.0, 18.0, 14.0, 10.0, 16.0, 3.0, 3.0, 9.0, 8.0, 4.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-880.0364990234375, -852.17919921875, -824.3219604492188, -796.4647216796875, -768.607421875, -740.7501220703125, -712.8928833007812, -685.03564453125, -657.1783447265625, -629.321044921875, -601.4638061523438, -573.6065673828125, -545.749267578125, -517.8919677734375, -490.03472900390625, -462.1774597167969, -434.3201904296875, -406.4629211425781, -378.60565185546875, -350.7483825683594, -322.89111328125, -295.0338439941406, -267.17657470703125, -239.31930541992188, -211.4620361328125, -183.60476684570312, -155.74749755859375, -127.89022827148438, -100.032958984375, -72.17568969726562, -44.31842041015625, -16.461151123046875, 11.39605712890625, 39.253326416015625, 67.110595703125, 94.96786499023438, 122.82513427734375, 150.68240356445312, 178.5396728515625, 206.39694213867188, 234.25421142578125, 262.1114807128906, 289.96875, 317.8260192871094, 345.68328857421875, 373.5405578613281, 401.3978271484375, 429.2550964355469, 457.11236572265625, 484.9696350097656, 512.826904296875, 540.6842041015625, 568.5414428710938, 596.398681640625, 624.2559814453125, 652.11328125, 679.9705200195312, 707.8277587890625, 735.68505859375, 763.5423583984375, 791.3995971679688, 819.2568359375, 847.1141357421875, 874.971435546875, 902.8286743164062]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 2.0, 6.0, 7.0, 14.0, 15.0, 18.0, 30.0, 44.0, 58.0, 84.0, 114.0, 182.0, 328.0, 600.0, 1450.0, 3884.0, 16202.0, 4150700.0, 14166.0, 3561.0, 1322.0, 563.0, 337.0, 172.0, 115.0, 83.0, 59.0, 41.0, 25.0, 27.0, 12.0, 9.0, 8.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-297.5, -289.111328125, -280.72265625, -272.333984375, -263.9453125, -255.556640625, -247.16796875, -238.779296875, -230.390625, -222.001953125, -213.61328125, -205.224609375, -196.8359375, -188.447265625, -180.05859375, -171.669921875, -163.28125, -154.892578125, -146.50390625, -138.115234375, -129.7265625, -121.337890625, -112.94921875, -104.560546875, -96.171875, -87.783203125, -79.39453125, -71.005859375, -62.6171875, -54.228515625, -45.83984375, -37.451171875, -29.0625, -20.673828125, -12.28515625, -3.896484375, 4.4921875, 12.880859375, 21.26953125, 29.658203125, 38.046875, 46.435546875, 54.82421875, 63.212890625, 71.6015625, 79.990234375, 88.37890625, 96.767578125, 105.15625, 113.544921875, 121.93359375, 130.322265625, 138.7109375, 147.099609375, 155.48828125, 163.876953125, 172.265625, 180.654296875, 189.04296875, 197.431640625, 205.8203125, 214.208984375, 222.59765625, 230.986328125, 239.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 1.0, 6.0, 6.0, 7.0, 8.0, 13.0, 20.0, 30.0, 28.0, 36.0, 57.0, 36.0, 51.0, 47.0, 60.0, 53.0, 66.0, 62.0, 60.0, 50.0, 40.0, 36.0, 36.0, 38.0, 23.0, 30.0, 19.0, 20.0, 11.0, 10.0, 4.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-46.53125, -45.21240234375, -43.8935546875, -42.57470703125, -41.255859375, -39.93701171875, -38.6181640625, -37.29931640625, -35.98046875, -34.66162109375, -33.3427734375, -32.02392578125, -30.705078125, -29.38623046875, -28.0673828125, -26.74853515625, -25.4296875, -24.11083984375, -22.7919921875, -21.47314453125, -20.154296875, -18.83544921875, -17.5166015625, -16.19775390625, -14.87890625, -13.56005859375, -12.2412109375, -10.92236328125, -9.603515625, -8.28466796875, -6.9658203125, -5.64697265625, -4.328125, -3.00927734375, -1.6904296875, -0.37158203125, 0.947265625, 2.26611328125, 3.5849609375, 4.90380859375, 6.22265625, 7.54150390625, 8.8603515625, 10.17919921875, 11.498046875, 12.81689453125, 14.1357421875, 15.45458984375, 16.7734375, 18.09228515625, 19.4111328125, 20.72998046875, 22.048828125, 23.36767578125, 24.6865234375, 26.00537109375, 27.32421875, 28.64306640625, 29.9619140625, 31.28076171875, 32.599609375, 33.91845703125, 35.2373046875, 36.55615234375, 37.875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 5.0, 3.0, 10.0, 17.0, 12.0, 15.0, 26.0, 35.0, 57.0, 78.0, 108.0, 178.0, 271.0, 546.0, 992.0, 1878.0, 4036.0, 10873.0, 143540.0, 4010382.0, 12524.0, 4299.0, 1927.0, 1004.0, 576.0, 314.0, 180.0, 121.0, 83.0, 53.0, 31.0, 24.0, 19.0, 20.0, 10.0, 6.0, 6.0, 2.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-228.0, -220.65625, -213.3125, -205.96875, -198.625, -191.28125, -183.9375, -176.59375, -169.25, -161.90625, -154.5625, -147.21875, -139.875, -132.53125, -125.1875, -117.84375, -110.5, -103.15625, -95.8125, -88.46875, -81.125, -73.78125, -66.4375, -59.09375, -51.75, -44.40625, -37.0625, -29.71875, -22.375, -15.03125, -7.6875, -0.34375, 7.0, 14.34375, 21.6875, 29.03125, 36.375, 43.71875, 51.0625, 58.40625, 65.75, 73.09375, 80.4375, 87.78125, 95.125, 102.46875, 109.8125, 117.15625, 124.5, 131.84375, 139.1875, 146.53125, 153.875, 161.21875, 168.5625, 175.90625, 183.25, 190.59375, 197.9375, 205.28125, 212.625, 219.96875, 227.3125, 234.65625, 242.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 3.0, 10.0, 20.0, 46.0, 3849.0, 65.0, 30.0, 10.0, 8.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.5625, -70.677734375, -68.79296875, -66.908203125, -65.0234375, -63.138671875, -61.25390625, -59.369140625, -57.484375, -55.599609375, -53.71484375, -51.830078125, -49.9453125, -48.060546875, -46.17578125, -44.291015625, -42.40625, -40.521484375, -38.63671875, -36.751953125, -34.8671875, -32.982421875, -31.09765625, -29.212890625, -27.328125, -25.443359375, -23.55859375, -21.673828125, -19.7890625, -17.904296875, -16.01953125, -14.134765625, -12.25, -10.365234375, -8.48046875, -6.595703125, -4.7109375, -2.826171875, -0.94140625, 0.943359375, 2.828125, 4.712890625, 6.59765625, 8.482421875, 10.3671875, 12.251953125, 14.13671875, 16.021484375, 17.90625, 19.791015625, 21.67578125, 23.560546875, 25.4453125, 27.330078125, 29.21484375, 31.099609375, 32.984375, 34.869140625, 36.75390625, 38.638671875, 40.5234375, 42.408203125, 44.29296875, 46.177734375, 48.0625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 15.0, 51.0, 111.0, 212.0, 263.0, 182.0, 86.0, 36.0, 23.0, 7.0, 1.0, 0.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-334.885009765625, -324.16644287109375, -313.4478759765625, -302.72930908203125, -292.0107421875, -281.29217529296875, -270.5736083984375, -259.85504150390625, -249.13648986816406, -238.4179229736328, -227.69935607910156, -216.98080444335938, -206.26223754882812, -195.54367065429688, -184.82510375976562, -174.10653686523438, -163.38796997070312, -152.66940307617188, -141.95083618164062, -131.23226928710938, -120.51371002197266, -109.7951431274414, -99.07658386230469, -88.35801696777344, -77.63945007324219, -66.92088317871094, -56.20232009887695, -45.48375701904297, -34.76519012451172, -24.04662322998047, -13.32806396484375, -2.6094970703125, 8.10906982421875, 18.827634811401367, 29.546199798583984, 40.26476287841797, 50.98332977294922, 61.70189666748047, 72.42045593261719, 83.13902282714844, 93.85758972167969, 104.57615661621094, 115.29472351074219, 126.0132827758789, 136.73184204101562, 147.45040893554688, 158.16897583007812, 168.88754272460938, 179.60610961914062, 190.32467651367188, 201.04324340820312, 211.76181030273438, 222.48037719726562, 233.19894409179688, 243.91749572753906, 254.6360626220703, 265.3546142578125, 276.07318115234375, 286.791748046875, 297.51031494140625, 308.2288818359375, 318.94744873046875, 329.666015625, 340.38458251953125, 351.1031494140625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 2.0, 7.0, 16.0, 17.0, 17.0, 21.0, 19.0, 23.0, 24.0, 33.0, 31.0, 37.0, 37.0, 43.0, 35.0, 45.0, 33.0, 48.0, 40.0, 51.0, 55.0, 48.0, 48.0, 34.0, 28.0, 30.0, 23.0, 22.0, 22.0, 22.0, 10.0, 15.0, 16.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.12903594970703, -105.96149444580078, -102.7939453125, -99.62640380859375, -96.4588623046875, -93.29131317138672, -90.12377166748047, -86.95622253417969, -83.78868103027344, -80.62113952636719, -77.4535903930664, -74.28604888916016, -71.11849975585938, -67.95095825195312, -64.78341674804688, -61.61587142944336, -58.448326110839844, -55.28078079223633, -52.11323547363281, -48.94569396972656, -45.77814865112305, -42.61060333251953, -39.44306182861328, -36.275516510009766, -33.10797119140625, -29.940425872802734, -26.77288246154785, -23.60533905029297, -20.437793731689453, -17.270248413085938, -14.102705001831055, -10.935161590576172, -7.767608642578125, -4.600064277648926, -1.4325199127197266, 1.7350244522094727, 4.902568817138672, 8.070113182067871, 11.23765754699707, 14.405200958251953, 17.57274627685547, 20.740291595458984, 23.907835006713867, 27.07537841796875, 30.242923736572266, 33.41046905517578, 36.57801055908203, 39.74555587768555, 42.91310119628906, 46.08064651489258, 49.248191833496094, 52.415733337402344, 55.58327865600586, 58.750823974609375, 61.918365478515625, 65.08590698242188, 68.25345611572266, 71.4209976196289, 74.58854675292969, 77.75608825683594, 80.92362976074219, 84.09117889404297, 87.25872039794922, 90.42626953125, 93.59381103515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 12.0, 15.0, 13.0, 33.0, 20.0, 34.0, 77.0, 133.0, 275.0, 639.0, 1632.0, 4640.0, 15048.0, 57652.0, 243147.0, 500392.0, 167323.0, 40606.0, 11036.0, 3441.0, 1291.0, 529.0, 227.0, 124.0, 91.0, 43.0, 27.0, 18.0, 15.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.0, -141.625, -137.25, -132.875, -128.5, -124.125, -119.75, -115.375, -111.0, -106.625, -102.25, -97.875, -93.5, -89.125, -84.75, -80.375, -76.0, -71.625, -67.25, -62.875, -58.5, -54.125, -49.75, -45.375, -41.0, -36.625, -32.25, -27.875, -23.5, -19.125, -14.75, -10.375, -6.0, -1.625, 2.75, 7.125, 11.5, 15.875, 20.25, 24.625, 29.0, 33.375, 37.75, 42.125, 46.5, 50.875, 55.25, 59.625, 64.0, 68.375, 72.75, 77.125, 81.5, 85.875, 90.25, 94.625, 99.0, 103.375, 107.75, 112.125, 116.5, 120.875, 125.25, 129.625, 134.0]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 7.0, 6.0, 9.0, 12.0, 15.0, 21.0, 12.0, 28.0, 33.0, 37.0, 41.0, 52.0, 42.0, 50.0, 49.0, 53.0, 56.0, 68.0, 34.0, 51.0, 45.0, 32.0, 37.0, 27.0, 31.0, 22.0, 17.0, 20.0, 25.0, 15.0, 9.0, 10.0, 4.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.21875, -43.81591796875, -42.4130859375, -41.01025390625, -39.607421875, -38.20458984375, -36.8017578125, -35.39892578125, -33.99609375, -32.59326171875, -31.1904296875, -29.78759765625, -28.384765625, -26.98193359375, -25.5791015625, -24.17626953125, -22.7734375, -21.37060546875, -19.9677734375, -18.56494140625, -17.162109375, -15.75927734375, -14.3564453125, -12.95361328125, -11.55078125, -10.14794921875, -8.7451171875, -7.34228515625, -5.939453125, -4.53662109375, -3.1337890625, -1.73095703125, -0.328125, 1.07470703125, 2.4775390625, 3.88037109375, 5.283203125, 6.68603515625, 8.0888671875, 9.49169921875, 10.89453125, 12.29736328125, 13.7001953125, 15.10302734375, 16.505859375, 17.90869140625, 19.3115234375, 20.71435546875, 22.1171875, 23.52001953125, 24.9228515625, 26.32568359375, 27.728515625, 29.13134765625, 30.5341796875, 31.93701171875, 33.33984375, 34.74267578125, 36.1455078125, 37.54833984375, 38.951171875, 40.35400390625, 41.7568359375, 43.15966796875, 44.5625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 9.0, 10.0, 13.0, 13.0, 24.0, 24.0, 41.0, 37.0, 78.0, 136.0, 195.0, 294.0, 508.0, 1093.0, 2545.0, 10985.0, 139413.0, 815916.0, 65944.0, 7184.0, 1956.0, 881.0, 452.0, 263.0, 166.0, 105.0, 72.0, 53.0, 39.0, 26.0, 24.0, 11.0, 9.0, 4.0, 6.0, 7.0, 11.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-275.25, -265.55078125, -255.8515625, -246.15234375, -236.453125, -226.75390625, -217.0546875, -207.35546875, -197.65625, -187.95703125, -178.2578125, -168.55859375, -158.859375, -149.16015625, -139.4609375, -129.76171875, -120.0625, -110.36328125, -100.6640625, -90.96484375, -81.265625, -71.56640625, -61.8671875, -52.16796875, -42.46875, -32.76953125, -23.0703125, -13.37109375, -3.671875, 6.02734375, 15.7265625, 25.42578125, 35.125, 44.82421875, 54.5234375, 64.22265625, 73.921875, 83.62109375, 93.3203125, 103.01953125, 112.71875, 122.41796875, 132.1171875, 141.81640625, 151.515625, 161.21484375, 170.9140625, 180.61328125, 190.3125, 200.01171875, 209.7109375, 219.41015625, 229.109375, 238.80859375, 248.5078125, 258.20703125, 267.90625, 277.60546875, 287.3046875, 297.00390625, 306.703125, 316.40234375, 326.1015625, 335.80078125, 345.5]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 7.0, 8.0, 14.0, 38.0, 21.0, 32.0, 62.0, 63.0, 72.0, 63.0, 89.0, 87.0, 91.0, 70.0, 70.0, 55.0, 42.0, 36.0, 20.0, 27.0, 12.0, 12.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-537.5, -523.55078125, -509.6015625, -495.65234375, -481.703125, -467.75390625, -453.8046875, -439.85546875, -425.90625, -411.95703125, -398.0078125, -384.05859375, -370.109375, -356.16015625, -342.2109375, -328.26171875, -314.3125, -300.36328125, -286.4140625, -272.46484375, -258.515625, -244.56640625, -230.6171875, -216.66796875, -202.71875, -188.76953125, -174.8203125, -160.87109375, -146.921875, -132.97265625, -119.0234375, -105.07421875, -91.125, -77.17578125, -63.2265625, -49.27734375, -35.328125, -21.37890625, -7.4296875, 6.51953125, 20.46875, 34.41796875, 48.3671875, 62.31640625, 76.265625, 90.21484375, 104.1640625, 118.11328125, 132.0625, 146.01171875, 159.9609375, 173.91015625, 187.859375, 201.80859375, 215.7578125, 229.70703125, 243.65625, 257.60546875, 271.5546875, 285.50390625, 299.453125, 313.40234375, 327.3515625, 341.30078125, 355.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 11.0, 11.0, 15.0, 20.0, 26.0, 55.0, 98.0, 270.0, 831.0, 5667.0, 886641.0, 150828.0, 3024.0, 601.0, 198.0, 102.0, 57.0, 28.0, 22.0, 10.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.5, -265.15625, -251.8125, -238.46875, -225.125, -211.78125, -198.4375, -185.09375, -171.75, -158.40625, -145.0625, -131.71875, -118.375, -105.03125, -91.6875, -78.34375, -65.0, -51.65625, -38.3125, -24.96875, -11.625, 1.71875, 15.0625, 28.40625, 41.75, 55.09375, 68.4375, 81.78125, 95.125, 108.46875, 121.8125, 135.15625, 148.5, 161.84375, 175.1875, 188.53125, 201.875, 215.21875, 228.5625, 241.90625, 255.25, 268.59375, 281.9375, 295.28125, 308.625, 321.96875, 335.3125, 348.65625, 362.0, 375.34375, 388.6875, 402.03125, 415.375, 428.71875, 442.0625, 455.40625, 468.75, 482.09375, 495.4375, 508.78125, 522.125, 535.46875, 548.8125, 562.15625, 575.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 10.0, 8.0, 8.0, 14.0, 21.0, 45.0, 39.0, 63.0, 93.0, 124.0, 125.0, 126.0, 99.0, 62.0, 45.0, 40.0, 24.0, 6.0, 10.0, 9.0, 11.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169677734375, -0.01643204689025879, -0.015896320343017578, -0.015360593795776367, -0.014824867248535156, -0.014289140701293945, -0.013753414154052734, -0.013217687606811523, -0.012681961059570312, -0.012146234512329102, -0.01161050796508789, -0.01107478141784668, -0.010539054870605469, -0.010003328323364258, -0.009467601776123047, -0.008931875228881836, -0.008396148681640625, -0.007860422134399414, -0.007324695587158203, -0.006788969039916992, -0.006253242492675781, -0.00571751594543457, -0.005181789398193359, -0.0046460628509521484, -0.0041103363037109375, -0.0035746097564697266, -0.0030388832092285156, -0.0025031566619873047, -0.0019674301147460938, -0.0014317035675048828, -0.0008959770202636719, -0.00036025047302246094, 0.00017547607421875, 0.0007112026214599609, 0.0012469291687011719, 0.0017826557159423828, 0.0023183822631835938, 0.0028541088104248047, 0.0033898353576660156, 0.0039255619049072266, 0.0044612884521484375, 0.0049970149993896484, 0.005532741546630859, 0.00606846809387207, 0.006604194641113281, 0.007139921188354492, 0.007675647735595703, 0.008211374282836914, 0.008747100830078125, 0.009282827377319336, 0.009818553924560547, 0.010354280471801758, 0.010890007019042969, 0.01142573356628418, 0.01196146011352539, 0.012497186660766602, 0.013032913208007812, 0.013568639755249023, 0.014104366302490234, 0.014640092849731445, 0.015175819396972656, 0.015711545944213867, 0.016247272491455078, 0.01678299903869629, 0.0173187255859375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 7.0, 7.0, 13.0, 17.0, 28.0, 39.0, 50.0, 115.0, 163.0, 291.0, 685.0, 1568.0, 4281.0, 15782.0, 131231.0, 828842.0, 50762.0, 9440.0, 2891.0, 1161.0, 500.0, 264.0, 153.0, 77.0, 54.0, 50.0, 25.0, 7.0, 13.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-211.625, -205.955078125, -200.28515625, -194.615234375, -188.9453125, -183.275390625, -177.60546875, -171.935546875, -166.265625, -160.595703125, -154.92578125, -149.255859375, -143.5859375, -137.916015625, -132.24609375, -126.576171875, -120.90625, -115.236328125, -109.56640625, -103.896484375, -98.2265625, -92.556640625, -86.88671875, -81.216796875, -75.546875, -69.876953125, -64.20703125, -58.537109375, -52.8671875, -47.197265625, -41.52734375, -35.857421875, -30.1875, -24.517578125, -18.84765625, -13.177734375, -7.5078125, -1.837890625, 3.83203125, 9.501953125, 15.171875, 20.841796875, 26.51171875, 32.181640625, 37.8515625, 43.521484375, 49.19140625, 54.861328125, 60.53125, 66.201171875, 71.87109375, 77.541015625, 83.2109375, 88.880859375, 94.55078125, 100.220703125, 105.890625, 111.560546875, 117.23046875, 122.900390625, 128.5703125, 134.240234375, 139.91015625, 145.580078125, 151.25]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 5.0, 9.0, 14.0, 14.0, 19.0, 39.0, 64.0, 83.0, 135.0, 132.0, 138.0, 111.0, 91.0, 35.0, 33.0, 16.0, 11.0, 12.0, 8.0, 5.0, 2.0, 1.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.125, -123.498046875, -117.87109375, -112.244140625, -106.6171875, -100.990234375, -95.36328125, -89.736328125, -84.109375, -78.482421875, -72.85546875, -67.228515625, -61.6015625, -55.974609375, -50.34765625, -44.720703125, -39.09375, -33.466796875, -27.83984375, -22.212890625, -16.5859375, -10.958984375, -5.33203125, 0.294921875, 5.921875, 11.548828125, 17.17578125, 22.802734375, 28.4296875, 34.056640625, 39.68359375, 45.310546875, 50.9375, 56.564453125, 62.19140625, 67.818359375, 73.4453125, 79.072265625, 84.69921875, 90.326171875, 95.953125, 101.580078125, 107.20703125, 112.833984375, 118.4609375, 124.087890625, 129.71484375, 135.341796875, 140.96875, 146.595703125, 152.22265625, 157.849609375, 163.4765625, 169.103515625, 174.73046875, 180.357421875, 185.984375, 191.611328125, 197.23828125, 202.865234375, 208.4921875, 214.119140625, 219.74609375, 225.373046875, 231.0]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 29.0, 113.0, 317.0, 340.0, 134.0, 42.0, 10.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4469.40771484375, -4333.720703125, -4198.03369140625, -4062.3466796875, -3926.65966796875, -3790.97265625, -3655.28564453125, -3519.5986328125, -3383.91162109375, -3248.224609375, -3112.53759765625, -2976.8505859375, -2841.16357421875, -2705.4765625, -2569.78955078125, -2434.1025390625, -2298.415771484375, -2162.728759765625, -2027.041748046875, -1891.354736328125, -1755.667724609375, -1619.980712890625, -1484.2938232421875, -1348.6068115234375, -1212.9197998046875, -1077.2327880859375, -941.5457763671875, -805.8588256835938, -670.1718139648438, -534.4848022460938, -398.7978515625, -263.11083984375, -127.423828125, 8.263168334960938, 143.95016479492188, 279.63714599609375, 415.32415771484375, 551.0111694335938, 686.6981201171875, 822.3851318359375, 958.0721435546875, 1093.7591552734375, 1229.4461669921875, 1365.133056640625, 1500.820068359375, 1636.507080078125, 1772.194091796875, 1907.881103515625, 2043.568115234375, 2179.255126953125, 2314.942138671875, 2450.629150390625, 2586.316162109375, 2722.003173828125, 2857.68994140625, 2993.376953125, 3129.06396484375, 3264.7509765625, 3400.43798828125, 3536.125, 3671.81201171875, 3807.4990234375, 3943.18603515625, 4078.873046875, 4214.56005859375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 2.0, 4.0, 10.0, 8.0, 14.0, 27.0, 24.0, 29.0, 35.0, 43.0, 44.0, 50.0, 52.0, 61.0, 73.0, 76.0, 54.0, 55.0, 53.0, 52.0, 33.0, 40.0, 36.0, 21.0, 24.0, 14.0, 13.0, 12.0, 11.0, 12.0, 6.0, 5.0, 2.0, 1.0, 3.0], "bins": [-2195.891357421875, -2146.28857421875, -2096.68603515625, -2047.0833740234375, -1997.480712890625, -1947.8779296875, -1898.2752685546875, -1848.672607421875, -1799.0699462890625, -1749.46728515625, -1699.8646240234375, -1650.261962890625, -1600.6591796875, -1551.0565185546875, -1501.453857421875, -1451.8511962890625, -1402.24853515625, -1352.6458740234375, -1303.043212890625, -1253.4405517578125, -1203.837890625, -1154.235107421875, -1104.6324462890625, -1055.02978515625, -1005.4271240234375, -955.824462890625, -906.2218017578125, -856.6190795898438, -807.0164184570312, -757.4137573242188, -707.81103515625, -658.2083740234375, -608.6058349609375, -559.003173828125, -509.4004821777344, -459.79779052734375, -410.19512939453125, -360.59246826171875, -310.9897766113281, -261.3870849609375, -211.784423828125, -162.18174743652344, -112.57907104492188, -62.97639465332031, -13.37371826171875, 36.22895812988281, 85.83163452148438, 135.434326171875, 185.0369873046875, 234.63966369628906, 284.2423400878906, 333.84503173828125, 383.44769287109375, 433.05035400390625, 482.6530456542969, 532.2557373046875, 581.8583984375, 631.4610595703125, 681.063720703125, 730.6664428710938, 780.2691040039062, 829.8717651367188, 879.4744873046875, 929.0771484375, 978.6798095703125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 4.0, 10.0, 12.0, 10.0, 35.0, 27.0, 47.0, 53.0, 81.0, 129.0, 244.0, 350.0, 691.0, 1499.0, 4595.0, 36203.0, 4128061.0, 16689.0, 3123.0, 1124.0, 516.0, 275.0, 174.0, 108.0, 76.0, 36.0, 29.0, 18.0, 14.0, 8.0, 9.0, 8.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-365.5, -355.96875, -346.4375, -336.90625, -327.375, -317.84375, -308.3125, -298.78125, -289.25, -279.71875, -270.1875, -260.65625, -251.125, -241.59375, -232.0625, -222.53125, -213.0, -203.46875, -193.9375, -184.40625, -174.875, -165.34375, -155.8125, -146.28125, -136.75, -127.21875, -117.6875, -108.15625, -98.625, -89.09375, -79.5625, -70.03125, -60.5, -50.96875, -41.4375, -31.90625, -22.375, -12.84375, -3.3125, 6.21875, 15.75, 25.28125, 34.8125, 44.34375, 53.875, 63.40625, 72.9375, 82.46875, 92.0, 101.53125, 111.0625, 120.59375, 130.125, 139.65625, 149.1875, 158.71875, 168.25, 177.78125, 187.3125, 196.84375, 206.375, 215.90625, 225.4375, 234.96875, 244.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 9.0, 16.0, 16.0, 33.0, 56.0, 104.0, 148.0, 154.0, 148.0, 119.0, 77.0, 47.0, 24.0, 14.0, 16.0, 6.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-205.5, -201.2646484375, -197.029296875, -192.7939453125, -188.55859375, -184.3232421875, -180.087890625, -175.8525390625, -171.6171875, -167.3818359375, -163.146484375, -158.9111328125, -154.67578125, -150.4404296875, -146.205078125, -141.9697265625, -137.734375, -133.4990234375, -129.263671875, -125.0283203125, -120.79296875, -116.5576171875, -112.322265625, -108.0869140625, -103.8515625, -99.6162109375, -95.380859375, -91.1455078125, -86.91015625, -82.6748046875, -78.439453125, -74.2041015625, -69.96875, -65.7333984375, -61.498046875, -57.2626953125, -53.02734375, -48.7919921875, -44.556640625, -40.3212890625, -36.0859375, -31.8505859375, -27.615234375, -23.3798828125, -19.14453125, -14.9091796875, -10.673828125, -6.4384765625, -2.203125, 2.0322265625, 6.267578125, 10.5029296875, 14.73828125, 18.9736328125, 23.208984375, 27.4443359375, 31.6796875, 35.9150390625, 40.150390625, 44.3857421875, 48.62109375, 52.8564453125, 57.091796875, 61.3271484375, 65.5625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 4.0, 8.0, 4.0, 10.0, 15.0, 23.0, 25.0, 30.0, 35.0, 54.0, 69.0, 146.0, 296.0, 666.0, 2116.0, 8738.0, 91898.0, 4064427.0, 19798.0, 3809.0, 1112.0, 446.0, 210.0, 86.0, 51.0, 52.0, 37.0, 18.0, 28.0, 15.0, 11.0, 10.0, 8.0, 3.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-300.0, -288.98046875, -277.9609375, -266.94140625, -255.921875, -244.90234375, -233.8828125, -222.86328125, -211.84375, -200.82421875, -189.8046875, -178.78515625, -167.765625, -156.74609375, -145.7265625, -134.70703125, -123.6875, -112.66796875, -101.6484375, -90.62890625, -79.609375, -68.58984375, -57.5703125, -46.55078125, -35.53125, -24.51171875, -13.4921875, -2.47265625, 8.546875, 19.56640625, 30.5859375, 41.60546875, 52.625, 63.64453125, 74.6640625, 85.68359375, 96.703125, 107.72265625, 118.7421875, 129.76171875, 140.78125, 151.80078125, 162.8203125, 173.83984375, 184.859375, 195.87890625, 206.8984375, 217.91796875, 228.9375, 239.95703125, 250.9765625, 261.99609375, 273.015625, 284.03515625, 295.0546875, 306.07421875, 317.09375, 328.11328125, 339.1328125, 350.15234375, 361.171875, 372.19140625, 383.2109375, 394.23046875, 405.25]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 11.0, 17.0, 41.0, 188.0, 3588.0, 114.0, 45.0, 24.0, 18.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.875, -58.166015625, -53.45703125, -48.748046875, -44.0390625, -39.330078125, -34.62109375, -29.912109375, -25.203125, -20.494140625, -15.78515625, -11.076171875, -6.3671875, -1.658203125, 3.05078125, 7.759765625, 12.46875, 17.177734375, 21.88671875, 26.595703125, 31.3046875, 36.013671875, 40.72265625, 45.431640625, 50.140625, 54.849609375, 59.55859375, 64.267578125, 68.9765625, 73.685546875, 78.39453125, 83.103515625, 87.8125, 92.521484375, 97.23046875, 101.939453125, 106.6484375, 111.357421875, 116.06640625, 120.775390625, 125.484375, 130.193359375, 134.90234375, 139.611328125, 144.3203125, 149.029296875, 153.73828125, 158.447265625, 163.15625, 167.865234375, 172.57421875, 177.283203125, 181.9921875, 186.701171875, 191.41015625, 196.119140625, 200.828125, 205.537109375, 210.24609375, 214.955078125, 219.6640625, 224.373046875, 229.08203125, 233.791015625, 238.5]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 17.0, 22.0, 73.0, 154.0, 271.0, 221.0, 138.0, 63.0, 18.0, 14.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-330.59765625, -309.6024169921875, -288.6071472167969, -267.6119079589844, -246.6166534423828, -225.62139892578125, -204.62615966796875, -183.6309051513672, -162.63565063476562, -141.64039611816406, -120.64514923095703, -99.64990234375, -78.65464782714844, -57.659393310546875, -36.664146423339844, -15.668899536132812, 5.32635498046875, 26.321605682373047, 47.316856384277344, 68.31210327148438, 89.30735778808594, 110.3026123046875, 131.2978515625, 152.29310607910156, 173.28836059570312, 194.2836151123047, 215.27886962890625, 236.27410888671875, 257.26934814453125, 278.2646179199219, 299.2598571777344, 320.255126953125, 341.2503662109375, 362.24560546875, 383.2408752441406, 404.2361145019531, 425.23138427734375, 446.22662353515625, 467.22186279296875, 488.21710205078125, 509.2123718261719, 530.2076416015625, 551.202880859375, 572.1981201171875, 593.193359375, 614.1885986328125, 635.1838989257812, 656.1791381835938, 677.1743774414062, 698.1696166992188, 719.1648559570312, 740.16015625, 761.1553955078125, 782.150634765625, 803.1458740234375, 824.14111328125, 845.1363525390625, 866.131591796875, 887.1268310546875, 908.1221313476562, 929.1173706054688, 950.1126098632812, 971.1078491210938, 992.1030883789062, 1013.098388671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 11.0, 16.0, 28.0, 32.0, 56.0, 98.0, 96.0, 100.0, 102.0, 109.0, 92.0, 94.0, 43.0, 45.0, 34.0, 22.0, 10.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-490.27374267578125, -475.19708251953125, -460.1203918457031, -445.043701171875, -429.967041015625, -414.890380859375, -399.8136901855469, -384.73699951171875, -369.66033935546875, -354.58367919921875, -339.5069885253906, -324.4302978515625, -309.3536376953125, -294.2769775390625, -279.2002868652344, -264.12359619140625, -249.04693603515625, -233.9702606201172, -218.89358520507812, -203.81690979003906, -188.740234375, -173.66355895996094, -158.58688354492188, -143.5102081298828, -128.43353271484375, -113.35685729980469, -98.28018188476562, -83.20350646972656, -68.1268310546875, -53.05015563964844, -37.973480224609375, -22.896804809570312, -7.820098876953125, 7.2565765380859375, 22.333251953125, 37.40992736816406, 52.486602783203125, 67.56327819824219, 82.63995361328125, 97.71662902832031, 112.79330444335938, 127.86997985839844, 142.9466552734375, 158.02333068847656, 173.10000610351562, 188.1766815185547, 203.25335693359375, 218.3300323486328, 233.40670776367188, 248.48338317871094, 263.56005859375, 278.63671875, 293.7134094238281, 308.79010009765625, 323.86676025390625, 338.94342041015625, 354.0201110839844, 369.0968017578125, 384.1734619140625, 399.2501220703125, 414.3268127441406, 429.40350341796875, 444.48016357421875, 459.55682373046875, 474.6335144042969]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 8.0, 10.0, 21.0, 27.0, 24.0, 40.0, 47.0, 91.0, 122.0, 201.0, 320.0, 589.0, 1168.0, 2468.0, 6229.0, 20103.0, 93394.0, 507943.0, 336191.0, 56431.0, 13783.0, 4905.0, 1981.0, 1013.0, 555.0, 309.0, 184.0, 106.0, 78.0, 50.0, 56.0, 28.0, 15.0, 12.0, 11.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-201.75, -195.609375, -189.46875, -183.328125, -177.1875, -171.046875, -164.90625, -158.765625, -152.625, -146.484375, -140.34375, -134.203125, -128.0625, -121.921875, -115.78125, -109.640625, -103.5, -97.359375, -91.21875, -85.078125, -78.9375, -72.796875, -66.65625, -60.515625, -54.375, -48.234375, -42.09375, -35.953125, -29.8125, -23.671875, -17.53125, -11.390625, -5.25, 0.890625, 7.03125, 13.171875, 19.3125, 25.453125, 31.59375, 37.734375, 43.875, 50.015625, 56.15625, 62.296875, 68.4375, 74.578125, 80.71875, 86.859375, 93.0, 99.140625, 105.28125, 111.421875, 117.5625, 123.703125, 129.84375, 135.984375, 142.125, 148.265625, 154.40625, 160.546875, 166.6875, 172.828125, 178.96875, 185.109375, 191.25]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 8.0, 10.0, 18.0, 26.0, 33.0, 62.0, 71.0, 90.0, 93.0, 129.0, 114.0, 91.0, 69.0, 59.0, 35.0, 29.0, 20.0, 17.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-165.5, -162.07666015625, -158.6533203125, -155.22998046875, -151.806640625, -148.38330078125, -144.9599609375, -141.53662109375, -138.11328125, -134.68994140625, -131.2666015625, -127.84326171875, -124.419921875, -120.99658203125, -117.5732421875, -114.14990234375, -110.7265625, -107.30322265625, -103.8798828125, -100.45654296875, -97.033203125, -93.60986328125, -90.1865234375, -86.76318359375, -83.33984375, -79.91650390625, -76.4931640625, -73.06982421875, -69.646484375, -66.22314453125, -62.7998046875, -59.37646484375, -55.953125, -52.52978515625, -49.1064453125, -45.68310546875, -42.259765625, -38.83642578125, -35.4130859375, -31.98974609375, -28.56640625, -25.14306640625, -21.7197265625, -18.29638671875, -14.873046875, -11.44970703125, -8.0263671875, -4.60302734375, -1.1796875, 2.24365234375, 5.6669921875, 9.09033203125, 12.513671875, 15.93701171875, 19.3603515625, 22.78369140625, 26.20703125, 29.63037109375, 33.0537109375, 36.47705078125, 39.900390625, 43.32373046875, 46.7470703125, 50.17041015625, 53.59375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 9.0, 6.0, 14.0, 19.0, 34.0, 42.0, 99.0, 172.0, 385.0, 972.0, 3334.0, 35219.0, 947470.0, 54816.0, 4104.0, 1043.0, 413.0, 166.0, 112.0, 41.0, 29.0, 18.0, 15.0, 14.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.0, -377.2734375, -360.546875, -343.8203125, -327.09375, -310.3671875, -293.640625, -276.9140625, -260.1875, -243.4609375, -226.734375, -210.0078125, -193.28125, -176.5546875, -159.828125, -143.1015625, -126.375, -109.6484375, -92.921875, -76.1953125, -59.46875, -42.7421875, -26.015625, -9.2890625, 7.4375, 24.1640625, 40.890625, 57.6171875, 74.34375, 91.0703125, 107.796875, 124.5234375, 141.25, 157.9765625, 174.703125, 191.4296875, 208.15625, 224.8828125, 241.609375, 258.3359375, 275.0625, 291.7890625, 308.515625, 325.2421875, 341.96875, 358.6953125, 375.421875, 392.1484375, 408.875, 425.6015625, 442.328125, 459.0546875, 475.78125, 492.5078125, 509.234375, 525.9609375, 542.6875, 559.4140625, 576.140625, 592.8671875, 609.59375, 626.3203125, 643.046875, 659.7734375, 676.5]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 19.0, 28.0, 33.0, 46.0, 48.0, 56.0, 70.0, 85.0, 80.0, 73.0, 70.0, 79.0, 65.0, 58.0, 42.0, 36.0, 25.0, 23.0, 21.0, 10.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-360.5, -347.27734375, -334.0546875, -320.83203125, -307.609375, -294.38671875, -281.1640625, -267.94140625, -254.71875, -241.49609375, -228.2734375, -215.05078125, -201.828125, -188.60546875, -175.3828125, -162.16015625, -148.9375, -135.71484375, -122.4921875, -109.26953125, -96.046875, -82.82421875, -69.6015625, -56.37890625, -43.15625, -29.93359375, -16.7109375, -3.48828125, 9.734375, 22.95703125, 36.1796875, 49.40234375, 62.625, 75.84765625, 89.0703125, 102.29296875, 115.515625, 128.73828125, 141.9609375, 155.18359375, 168.40625, 181.62890625, 194.8515625, 208.07421875, 221.296875, 234.51953125, 247.7421875, 260.96484375, 274.1875, 287.41015625, 300.6328125, 313.85546875, 327.078125, 340.30078125, 353.5234375, 366.74609375, 379.96875, 393.19140625, 406.4140625, 419.63671875, 432.859375, 446.08203125, 459.3046875, 472.52734375, 485.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 7.0, 7.0, 2.0, 14.0, 7.0, 14.0, 26.0, 26.0, 44.0, 69.0, 72.0, 135.0, 247.0, 475.0, 1236.0, 4469.0, 29667.0, 613127.0, 373016.0, 20475.0, 3395.0, 1036.0, 399.0, 199.0, 126.0, 61.0, 61.0, 34.0, 27.0, 15.0, 11.0, 10.0, 8.0, 5.0, 4.0, 2.0, 6.0, 4.0, 5.0, 2.0, 0.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-96.375, -93.2578125, -90.140625, -87.0234375, -83.90625, -80.7890625, -77.671875, -74.5546875, -71.4375, -68.3203125, -65.203125, -62.0859375, -58.96875, -55.8515625, -52.734375, -49.6171875, -46.5, -43.3828125, -40.265625, -37.1484375, -34.03125, -30.9140625, -27.796875, -24.6796875, -21.5625, -18.4453125, -15.328125, -12.2109375, -9.09375, -5.9765625, -2.859375, 0.2578125, 3.375, 6.4921875, 9.609375, 12.7265625, 15.84375, 18.9609375, 22.078125, 25.1953125, 28.3125, 31.4296875, 34.546875, 37.6640625, 40.78125, 43.8984375, 47.015625, 50.1328125, 53.25, 56.3671875, 59.484375, 62.6015625, 65.71875, 68.8359375, 71.953125, 75.0703125, 78.1875, 81.3046875, 84.421875, 87.5390625, 90.65625, 93.7734375, 96.890625, 100.0078125, 103.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 10.0, 19.0, 25.0, 28.0, 55.0, 57.0, 81.0, 128.0, 120.0, 109.0, 93.0, 62.0, 55.0, 26.0, 35.0, 20.0, 14.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01458740234375, -0.014152288436889648, -0.013717174530029297, -0.013282060623168945, -0.012846946716308594, -0.012411832809448242, -0.01197671890258789, -0.011541604995727539, -0.011106491088867188, -0.010671377182006836, -0.010236263275146484, -0.009801149368286133, -0.009366035461425781, -0.00893092155456543, -0.008495807647705078, -0.008060693740844727, -0.007625579833984375, -0.0071904659271240234, -0.006755352020263672, -0.00632023811340332, -0.005885124206542969, -0.005450010299682617, -0.005014896392822266, -0.004579782485961914, -0.0041446685791015625, -0.003709554672241211, -0.0032744407653808594, -0.002839326858520508, -0.0024042129516601562, -0.0019690990447998047, -0.0015339851379394531, -0.0010988712310791016, -0.00066375732421875, -0.00022864341735839844, 0.00020647048950195312, 0.0006415843963623047, 0.0010766983032226562, 0.0015118122100830078, 0.0019469261169433594, 0.002382040023803711, 0.0028171539306640625, 0.003252267837524414, 0.0036873817443847656, 0.004122495651245117, 0.004557609558105469, 0.00499272346496582, 0.005427837371826172, 0.0058629512786865234, 0.006298065185546875, 0.0067331790924072266, 0.007168292999267578, 0.00760340690612793, 0.008038520812988281, 0.008473634719848633, 0.008908748626708984, 0.009343862533569336, 0.009778976440429688, 0.010214090347290039, 0.01064920425415039, 0.011084318161010742, 0.011519432067871094, 0.011954545974731445, 0.012389659881591797, 0.012824773788452148, 0.0132598876953125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 7.0, 18.0, 23.0, 26.0, 38.0, 43.0, 76.0, 138.0, 211.0, 375.0, 698.0, 1634.0, 5089.0, 25290.0, 478606.0, 502064.0, 25770.0, 5097.0, 1704.0, 694.0, 341.0, 187.0, 114.0, 93.0, 61.0, 38.0, 26.0, 16.0, 11.0, 12.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-92.6875, -89.3779296875, -86.068359375, -82.7587890625, -79.44921875, -76.1396484375, -72.830078125, -69.5205078125, -66.2109375, -62.9013671875, -59.591796875, -56.2822265625, -52.97265625, -49.6630859375, -46.353515625, -43.0439453125, -39.734375, -36.4248046875, -33.115234375, -29.8056640625, -26.49609375, -23.1865234375, -19.876953125, -16.5673828125, -13.2578125, -9.9482421875, -6.638671875, -3.3291015625, -0.01953125, 3.2900390625, 6.599609375, 9.9091796875, 13.21875, 16.5283203125, 19.837890625, 23.1474609375, 26.45703125, 29.7666015625, 33.076171875, 36.3857421875, 39.6953125, 43.0048828125, 46.314453125, 49.6240234375, 52.93359375, 56.2431640625, 59.552734375, 62.8623046875, 66.171875, 69.4814453125, 72.791015625, 76.1005859375, 79.41015625, 82.7197265625, 86.029296875, 89.3388671875, 92.6484375, 95.9580078125, 99.267578125, 102.5771484375, 105.88671875, 109.1962890625, 112.505859375, 115.8154296875, 119.125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 7.0, 8.0, 3.0, 11.0, 14.0, 14.0, 26.0, 43.0, 79.0, 130.0, 175.0, 149.0, 103.0, 81.0, 55.0, 32.0, 19.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-158.375, -154.3173828125, -150.259765625, -146.2021484375, -142.14453125, -138.0869140625, -134.029296875, -129.9716796875, -125.9140625, -121.8564453125, -117.798828125, -113.7412109375, -109.68359375, -105.6259765625, -101.568359375, -97.5107421875, -93.453125, -89.3955078125, -85.337890625, -81.2802734375, -77.22265625, -73.1650390625, -69.107421875, -65.0498046875, -60.9921875, -56.9345703125, -52.876953125, -48.8193359375, -44.76171875, -40.7041015625, -36.646484375, -32.5888671875, -28.53125, -24.4736328125, -20.416015625, -16.3583984375, -12.30078125, -8.2431640625, -4.185546875, -0.1279296875, 3.9296875, 7.9873046875, 12.044921875, 16.1025390625, 20.16015625, 24.2177734375, 28.275390625, 32.3330078125, 36.390625, 40.4482421875, 44.505859375, 48.5634765625, 52.62109375, 56.6787109375, 60.736328125, 64.7939453125, 68.8515625, 72.9091796875, 76.966796875, 81.0244140625, 85.08203125, 89.1396484375, 93.197265625, 97.2548828125, 101.3125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 5.0, 21.0, 66.0, 152.0, 300.0, 252.0, 137.0, 43.0, 16.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3942.359375, -3841.4501953125, -3740.541015625, -3639.6318359375, -3538.72265625, -3437.8134765625, -3336.904296875, -3235.9951171875, -3135.0859375, -3034.1767578125, -2933.267578125, -2832.3583984375, -2731.44921875, -2630.5400390625, -2529.630859375, -2428.7216796875, -2327.812744140625, -2226.903564453125, -2125.994384765625, -2025.085205078125, -1924.176025390625, -1823.266845703125, -1722.3577880859375, -1621.4486083984375, -1520.5394287109375, -1419.6302490234375, -1318.7210693359375, -1217.81201171875, -1116.90283203125, -1015.9935913085938, -915.08447265625, -814.17529296875, -713.26611328125, -612.35693359375, -511.4477844238281, -410.53863525390625, -309.62945556640625, -208.72027587890625, -107.8111572265625, -6.9019775390625, 94.0072021484375, 194.91636657714844, 295.8255310058594, 396.73468017578125, 497.64385986328125, 598.5530395507812, 699.462158203125, 800.371337890625, 901.280517578125, 1002.189697265625, 1103.098876953125, 1204.008056640625, 1304.917236328125, 1405.826416015625, 1506.7354736328125, 1607.6446533203125, 1708.5538330078125, 1809.4630126953125, 1910.3721923828125, 2011.28125, 2112.1904296875, 2213.099609375, 2314.0087890625, 2414.91796875, 2515.8271484375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 13.0, 11.0, 4.0, 10.0, 10.0, 21.0, 23.0, 33.0, 21.0, 33.0, 29.0, 51.0, 40.0, 49.0, 50.0, 54.0, 40.0, 53.0, 56.0, 44.0, 46.0, 47.0, 44.0, 39.0, 31.0, 26.0, 20.0, 24.0, 15.0, 12.0, 9.0, 10.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1210.9700927734375, -1171.8963623046875, -1132.8226318359375, -1093.7490234375, -1054.67529296875, -1015.6015625, -976.52783203125, -937.4541625976562, -898.3804931640625, -859.3067626953125, -820.2330932617188, -781.1593627929688, -742.085693359375, -703.011962890625, -663.938232421875, -624.8645629882812, -585.7908325195312, -546.7171020507812, -507.6434326171875, -468.5697021484375, -429.49603271484375, -390.42230224609375, -351.3486022949219, -312.27490234375, -273.2012023925781, -234.12750244140625, -195.05380249023438, -155.98008728027344, -116.90638732910156, -77.83268737792969, -38.75897216796875, 0.314727783203125, 39.388427734375, 78.46212768554688, 117.53583526611328, 156.6095428466797, 195.68324279785156, 234.75694274902344, 273.8306579589844, 312.90435791015625, 351.9780578613281, 391.0517578125, 430.1254577636719, 469.19915771484375, 508.27288818359375, 547.3465576171875, 586.4202880859375, 625.4940185546875, 664.5676879882812, 703.6414184570312, 742.715087890625, 781.788818359375, 820.8624877929688, 859.9362182617188, 899.0098876953125, 938.0836181640625, 977.1573486328125, 1016.2310791015625, 1055.3048095703125, 1094.37841796875, 1133.4521484375, 1172.52587890625, 1211.599609375, 1250.67333984375, 1289.7469482421875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 16.0, 11.0, 21.0, 36.0, 49.0, 98.0, 159.0, 310.0, 617.0, 1527.0, 4263.0, 14612.0, 87937.0, 3853853.0, 200460.0, 21747.0, 5475.0, 1782.0, 701.0, 304.0, 126.0, 66.0, 40.0, 25.0, 13.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.125, -180.419921875, -174.71484375, -169.009765625, -163.3046875, -157.599609375, -151.89453125, -146.189453125, -140.484375, -134.779296875, -129.07421875, -123.369140625, -117.6640625, -111.958984375, -106.25390625, -100.548828125, -94.84375, -89.138671875, -83.43359375, -77.728515625, -72.0234375, -66.318359375, -60.61328125, -54.908203125, -49.203125, -43.498046875, -37.79296875, -32.087890625, -26.3828125, -20.677734375, -14.97265625, -9.267578125, -3.5625, 2.142578125, 7.84765625, 13.552734375, 19.2578125, 24.962890625, 30.66796875, 36.373046875, 42.078125, 47.783203125, 53.48828125, 59.193359375, 64.8984375, 70.603515625, 76.30859375, 82.013671875, 87.71875, 93.423828125, 99.12890625, 104.833984375, 110.5390625, 116.244140625, 121.94921875, 127.654296875, 133.359375, 139.064453125, 144.76953125, 150.474609375, 156.1796875, 161.884765625, 167.58984375, 173.294921875, 179.0]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 10.0, 8.0, 8.0, 10.0, 12.0, 27.0, 35.0, 34.0, 55.0, 72.0, 88.0, 90.0, 108.0, 90.0, 70.0, 70.0, 65.0, 44.0, 31.0, 23.0, 17.0, 10.0, 13.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.375, -91.91552734375, -89.4560546875, -86.99658203125, -84.537109375, -82.07763671875, -79.6181640625, -77.15869140625, -74.69921875, -72.23974609375, -69.7802734375, -67.32080078125, -64.861328125, -62.40185546875, -59.9423828125, -57.48291015625, -55.0234375, -52.56396484375, -50.1044921875, -47.64501953125, -45.185546875, -42.72607421875, -40.2666015625, -37.80712890625, -35.34765625, -32.88818359375, -30.4287109375, -27.96923828125, -25.509765625, -23.05029296875, -20.5908203125, -18.13134765625, -15.671875, -13.21240234375, -10.7529296875, -8.29345703125, -5.833984375, -3.37451171875, -0.9150390625, 1.54443359375, 4.00390625, 6.46337890625, 8.9228515625, 11.38232421875, 13.841796875, 16.30126953125, 18.7607421875, 21.22021484375, 23.6796875, 26.13916015625, 28.5986328125, 31.05810546875, 33.517578125, 35.97705078125, 38.4365234375, 40.89599609375, 43.35546875, 45.81494140625, 48.2744140625, 50.73388671875, 53.193359375, 55.65283203125, 58.1123046875, 60.57177734375, 63.03125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 6.0, 14.0, 17.0, 20.0, 39.0, 60.0, 109.0, 198.0, 452.0, 964.0, 2531.0, 8310.0, 41137.0, 1023428.0, 3049595.0, 53608.0, 9424.0, 2578.0, 989.0, 391.0, 159.0, 74.0, 51.0, 27.0, 26.0, 14.0, 13.0, 8.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-226.25, -219.798828125, -213.34765625, -206.896484375, -200.4453125, -193.994140625, -187.54296875, -181.091796875, -174.640625, -168.189453125, -161.73828125, -155.287109375, -148.8359375, -142.384765625, -135.93359375, -129.482421875, -123.03125, -116.580078125, -110.12890625, -103.677734375, -97.2265625, -90.775390625, -84.32421875, -77.873046875, -71.421875, -64.970703125, -58.51953125, -52.068359375, -45.6171875, -39.166015625, -32.71484375, -26.263671875, -19.8125, -13.361328125, -6.91015625, -0.458984375, 5.9921875, 12.443359375, 18.89453125, 25.345703125, 31.796875, 38.248046875, 44.69921875, 51.150390625, 57.6015625, 64.052734375, 70.50390625, 76.955078125, 83.40625, 89.857421875, 96.30859375, 102.759765625, 109.2109375, 115.662109375, 122.11328125, 128.564453125, 135.015625, 141.466796875, 147.91796875, 154.369140625, 160.8203125, 167.271484375, 173.72265625, 180.173828125, 186.625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 14.0, 15.0, 19.0, 29.0, 49.0, 76.0, 122.0, 243.0, 729.0, 1720.0, 567.0, 180.0, 105.0, 61.0, 32.0, 22.0, 16.0, 13.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.0, -231.130859375, -225.26171875, -219.392578125, -213.5234375, -207.654296875, -201.78515625, -195.916015625, -190.046875, -184.177734375, -178.30859375, -172.439453125, -166.5703125, -160.701171875, -154.83203125, -148.962890625, -143.09375, -137.224609375, -131.35546875, -125.486328125, -119.6171875, -113.748046875, -107.87890625, -102.009765625, -96.140625, -90.271484375, -84.40234375, -78.533203125, -72.6640625, -66.794921875, -60.92578125, -55.056640625, -49.1875, -43.318359375, -37.44921875, -31.580078125, -25.7109375, -19.841796875, -13.97265625, -8.103515625, -2.234375, 3.634765625, 9.50390625, 15.373046875, 21.2421875, 27.111328125, 32.98046875, 38.849609375, 44.71875, 50.587890625, 56.45703125, 62.326171875, 68.1953125, 74.064453125, 79.93359375, 85.802734375, 91.671875, 97.541015625, 103.41015625, 109.279296875, 115.1484375, 121.017578125, 126.88671875, 132.755859375, 138.625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 10.0, 34.0, 72.0, 142.0, 197.0, 223.0, 149.0, 73.0, 39.0, 11.0, 9.0, 3.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2369.82861328125, -2318.706787109375, -2267.585205078125, -2216.46337890625, -2165.341552734375, -2114.219970703125, -2063.09814453125, -2011.976318359375, -1960.8546142578125, -1909.73291015625, -1858.611083984375, -1807.4893798828125, -1756.36767578125, -1705.245849609375, -1654.1241455078125, -1603.00244140625, -1551.880615234375, -1500.7589111328125, -1449.6370849609375, -1398.515380859375, -1347.3935546875, -1296.2718505859375, -1245.150146484375, -1194.0283203125, -1142.9066162109375, -1091.784912109375, -1040.6630859375, -989.5413818359375, -938.4196166992188, -887.2978515625, -836.1761474609375, -785.0543823242188, -733.9327392578125, -682.8109741210938, -631.689208984375, -580.5675048828125, -529.4457397460938, -478.323974609375, -427.2022399902344, -376.08050537109375, -324.958740234375, -273.83697509765625, -222.71524047851562, -171.59349060058594, -120.47174072265625, -69.34999084472656, -18.228240966796875, 32.89349365234375, 84.0152587890625, 135.1370086669922, 186.25875854492188, 237.38050842285156, 288.50225830078125, 339.6240234375, 390.7457580566406, 441.86749267578125, 492.9892578125, 544.1110229492188, 595.2327880859375, 646.3544921875, 697.4762573242188, 748.5980224609375, 799.7197265625, 850.8414916992188, 901.9632568359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 5.0, 16.0, 22.0, 21.0, 25.0, 45.0, 48.0, 63.0, 67.0, 83.0, 74.0, 73.0, 79.0, 82.0, 60.0, 62.0, 35.0, 38.0, 23.0, 16.0, 15.0, 11.0, 14.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1056.51171875, -1022.3818969726562, -988.2521362304688, -954.122314453125, -919.9925537109375, -885.8627319335938, -851.73291015625, -817.6031494140625, -783.4733276367188, -749.343505859375, -715.2137451171875, -681.0839233398438, -646.9541015625, -612.8243408203125, -578.6945190429688, -544.564697265625, -510.4349365234375, -476.3051452636719, -442.17535400390625, -408.0455322265625, -373.9157409667969, -339.78594970703125, -305.6561279296875, -271.5263366699219, -237.39654541015625, -203.26675415039062, -169.13694763183594, -135.00714111328125, -100.87734985351562, -66.74755859375, -32.61775207519531, 1.512054443359375, 35.641845703125, 69.77164459228516, 103.90144348144531, 138.03125, 172.16104125976562, 206.29083251953125, 240.42063903808594, 274.5504455566406, 308.68023681640625, 342.8100280761719, 376.9398193359375, 411.06964111328125, 445.1994323730469, 479.3292236328125, 513.4590454101562, 547.5888671875, 581.7186279296875, 615.8484497070312, 649.9782104492188, 684.1080322265625, 718.23779296875, 752.3676147460938, 786.4974365234375, 820.627197265625, 854.7570190429688, 888.8868408203125, 923.0166015625, 957.1464233398438, 991.2762451171875, 1025.406005859375, 1059.5357666015625, 1093.6656494140625, 1127.79541015625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 11.0, 16.0, 19.0, 25.0, 49.0, 77.0, 129.0, 204.0, 374.0, 678.0, 1496.0, 3308.0, 8398.0, 23976.0, 84929.0, 364724.0, 416329.0, 99850.0, 27471.0, 9458.0, 3591.0, 1643.0, 829.0, 368.0, 230.0, 120.0, 66.0, 49.0, 37.0, 22.0, 14.0, 11.0, 9.0, 11.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.625, -125.451171875, -121.27734375, -117.103515625, -112.9296875, -108.755859375, -104.58203125, -100.408203125, -96.234375, -92.060546875, -87.88671875, -83.712890625, -79.5390625, -75.365234375, -71.19140625, -67.017578125, -62.84375, -58.669921875, -54.49609375, -50.322265625, -46.1484375, -41.974609375, -37.80078125, -33.626953125, -29.453125, -25.279296875, -21.10546875, -16.931640625, -12.7578125, -8.583984375, -4.41015625, -0.236328125, 3.9375, 8.111328125, 12.28515625, 16.458984375, 20.6328125, 24.806640625, 28.98046875, 33.154296875, 37.328125, 41.501953125, 45.67578125, 49.849609375, 54.0234375, 58.197265625, 62.37109375, 66.544921875, 70.71875, 74.892578125, 79.06640625, 83.240234375, 87.4140625, 91.587890625, 95.76171875, 99.935546875, 104.109375, 108.283203125, 112.45703125, 116.630859375, 120.8046875, 124.978515625, 129.15234375, 133.326171875, 137.5]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 6.0, 2.0, 9.0, 7.0, 10.0, 14.0, 16.0, 24.0, 29.0, 20.0, 31.0, 39.0, 41.0, 34.0, 45.0, 47.0, 39.0, 66.0, 57.0, 52.0, 58.0, 41.0, 54.0, 39.0, 39.0, 31.0, 25.0, 21.0, 18.0, 20.0, 17.0, 12.0, 9.0, 9.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.40625, -40.947265625, -39.48828125, -38.029296875, -36.5703125, -35.111328125, -33.65234375, -32.193359375, -30.734375, -29.275390625, -27.81640625, -26.357421875, -24.8984375, -23.439453125, -21.98046875, -20.521484375, -19.0625, -17.603515625, -16.14453125, -14.685546875, -13.2265625, -11.767578125, -10.30859375, -8.849609375, -7.390625, -5.931640625, -4.47265625, -3.013671875, -1.5546875, -0.095703125, 1.36328125, 2.822265625, 4.28125, 5.740234375, 7.19921875, 8.658203125, 10.1171875, 11.576171875, 13.03515625, 14.494140625, 15.953125, 17.412109375, 18.87109375, 20.330078125, 21.7890625, 23.248046875, 24.70703125, 26.166015625, 27.625, 29.083984375, 30.54296875, 32.001953125, 33.4609375, 34.919921875, 36.37890625, 37.837890625, 39.296875, 40.755859375, 42.21484375, 43.673828125, 45.1328125, 46.591796875, 48.05078125, 49.509765625, 50.96875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 10.0, 15.0, 26.0, 45.0, 42.0, 80.0, 97.0, 217.0, 371.0, 678.0, 1335.0, 3479.0, 14569.0, 150000.0, 784482.0, 78235.0, 9633.0, 2676.0, 1166.0, 573.0, 297.0, 186.0, 113.0, 65.0, 44.0, 37.0, 30.0, 14.0, 13.0, 7.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.25, -219.2421875, -211.234375, -203.2265625, -195.21875, -187.2109375, -179.203125, -171.1953125, -163.1875, -155.1796875, -147.171875, -139.1640625, -131.15625, -123.1484375, -115.140625, -107.1328125, -99.125, -91.1171875, -83.109375, -75.1015625, -67.09375, -59.0859375, -51.078125, -43.0703125, -35.0625, -27.0546875, -19.046875, -11.0390625, -3.03125, 4.9765625, 12.984375, 20.9921875, 29.0, 37.0078125, 45.015625, 53.0234375, 61.03125, 69.0390625, 77.046875, 85.0546875, 93.0625, 101.0703125, 109.078125, 117.0859375, 125.09375, 133.1015625, 141.109375, 149.1171875, 157.125, 165.1328125, 173.140625, 181.1484375, 189.15625, 197.1640625, 205.171875, 213.1796875, 221.1875, 229.1953125, 237.203125, 245.2109375, 253.21875, 261.2265625, 269.234375, 277.2421875, 285.25]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 9.0, 18.0, 13.0, 18.0, 21.0, 26.0, 20.0, 17.0, 33.0, 35.0, 56.0, 60.0, 51.0, 65.0, 54.0, 62.0, 51.0, 46.0, 43.0, 47.0, 38.0, 40.0, 36.0, 28.0, 24.0, 20.0, 10.0, 9.0, 11.0, 7.0, 6.0, 8.0, 2.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-211.125, -203.275390625, -195.42578125, -187.576171875, -179.7265625, -171.876953125, -164.02734375, -156.177734375, -148.328125, -140.478515625, -132.62890625, -124.779296875, -116.9296875, -109.080078125, -101.23046875, -93.380859375, -85.53125, -77.681640625, -69.83203125, -61.982421875, -54.1328125, -46.283203125, -38.43359375, -30.583984375, -22.734375, -14.884765625, -7.03515625, 0.814453125, 8.6640625, 16.513671875, 24.36328125, 32.212890625, 40.0625, 47.912109375, 55.76171875, 63.611328125, 71.4609375, 79.310546875, 87.16015625, 95.009765625, 102.859375, 110.708984375, 118.55859375, 126.408203125, 134.2578125, 142.107421875, 149.95703125, 157.806640625, 165.65625, 173.505859375, 181.35546875, 189.205078125, 197.0546875, 204.904296875, 212.75390625, 220.603515625, 228.453125, 236.302734375, 244.15234375, 252.001953125, 259.8515625, 267.701171875, 275.55078125, 283.400390625, 291.25]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 3.0, 4.0, 10.0, 8.0, 10.0, 13.0, 15.0, 18.0, 26.0, 41.0, 56.0, 77.0, 167.0, 169.0, 337.0, 602.0, 1172.0, 3023.0, 10078.0, 68011.0, 800126.0, 142270.0, 15057.0, 3966.0, 1497.0, 689.0, 391.0, 230.0, 134.0, 99.0, 74.0, 62.0, 33.0, 17.0, 11.0, 15.0, 12.0, 11.0, 2.0, 8.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.5, -77.955078125, -75.41015625, -72.865234375, -70.3203125, -67.775390625, -65.23046875, -62.685546875, -60.140625, -57.595703125, -55.05078125, -52.505859375, -49.9609375, -47.416015625, -44.87109375, -42.326171875, -39.78125, -37.236328125, -34.69140625, -32.146484375, -29.6015625, -27.056640625, -24.51171875, -21.966796875, -19.421875, -16.876953125, -14.33203125, -11.787109375, -9.2421875, -6.697265625, -4.15234375, -1.607421875, 0.9375, 3.482421875, 6.02734375, 8.572265625, 11.1171875, 13.662109375, 16.20703125, 18.751953125, 21.296875, 23.841796875, 26.38671875, 28.931640625, 31.4765625, 34.021484375, 36.56640625, 39.111328125, 41.65625, 44.201171875, 46.74609375, 49.291015625, 51.8359375, 54.380859375, 56.92578125, 59.470703125, 62.015625, 64.560546875, 67.10546875, 69.650390625, 72.1953125, 74.740234375, 77.28515625, 79.830078125, 82.375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 5.0, 10.0, 15.0, 25.0, 39.0, 55.0, 80.0, 82.0, 130.0, 144.0, 123.0, 91.0, 47.0, 48.0, 32.0, 24.0, 19.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01158905029296875, -0.011128783226013184, -0.010668516159057617, -0.01020824909210205, -0.009747982025146484, -0.009287714958190918, -0.008827447891235352, -0.008367180824279785, -0.007906913757324219, -0.007446646690368652, -0.006986379623413086, -0.0065261125564575195, -0.006065845489501953, -0.005605578422546387, -0.00514531135559082, -0.004685044288635254, -0.0042247772216796875, -0.003764510154724121, -0.0033042430877685547, -0.0028439760208129883, -0.002383708953857422, -0.0019234418869018555, -0.001463174819946289, -0.0010029077529907227, -0.0005426406860351562, -8.237361907958984e-05, 0.00037789344787597656, 0.000838160514831543, 0.0012984275817871094, 0.0017586946487426758, 0.002218961715698242, 0.0026792287826538086, 0.003139495849609375, 0.0035997629165649414, 0.004060029983520508, 0.004520297050476074, 0.004980564117431641, 0.005440831184387207, 0.0059010982513427734, 0.00636136531829834, 0.006821632385253906, 0.007281899452209473, 0.007742166519165039, 0.008202433586120605, 0.008662700653076172, 0.009122967720031738, 0.009583234786987305, 0.010043501853942871, 0.010503768920898438, 0.010964035987854004, 0.01142430305480957, 0.011884570121765137, 0.012344837188720703, 0.01280510425567627, 0.013265371322631836, 0.013725638389587402, 0.014185905456542969, 0.014646172523498535, 0.015106439590454102, 0.015566706657409668, 0.016026973724365234, 0.0164872407913208, 0.016947507858276367, 0.017407774925231934, 0.0178680419921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 8.0, 26.0, 16.0, 20.0, 31.0, 60.0, 71.0, 112.0, 190.0, 304.0, 614.0, 1257.0, 3584.0, 13660.0, 129970.0, 818752.0, 64984.0, 9807.0, 2797.0, 1032.0, 482.0, 258.0, 147.0, 120.0, 75.0, 49.0, 27.0, 20.0, 21.0, 11.0, 5.0, 8.0, 1.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.625, -87.91015625, -85.1953125, -82.48046875, -79.765625, -77.05078125, -74.3359375, -71.62109375, -68.90625, -66.19140625, -63.4765625, -60.76171875, -58.046875, -55.33203125, -52.6171875, -49.90234375, -47.1875, -44.47265625, -41.7578125, -39.04296875, -36.328125, -33.61328125, -30.8984375, -28.18359375, -25.46875, -22.75390625, -20.0390625, -17.32421875, -14.609375, -11.89453125, -9.1796875, -6.46484375, -3.75, -1.03515625, 1.6796875, 4.39453125, 7.109375, 9.82421875, 12.5390625, 15.25390625, 17.96875, 20.68359375, 23.3984375, 26.11328125, 28.828125, 31.54296875, 34.2578125, 36.97265625, 39.6875, 42.40234375, 45.1171875, 47.83203125, 50.546875, 53.26171875, 55.9765625, 58.69140625, 61.40625, 64.12109375, 66.8359375, 69.55078125, 72.265625, 74.98046875, 77.6953125, 80.41015625, 83.125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 15.0, 20.0, 61.0, 57.0, 76.0, 114.0, 130.0, 125.0, 107.0, 92.0, 56.0, 31.0, 24.0, 17.0, 13.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.6875, -94.630859375, -91.57421875, -88.517578125, -85.4609375, -82.404296875, -79.34765625, -76.291015625, -73.234375, -70.177734375, -67.12109375, -64.064453125, -61.0078125, -57.951171875, -54.89453125, -51.837890625, -48.78125, -45.724609375, -42.66796875, -39.611328125, -36.5546875, -33.498046875, -30.44140625, -27.384765625, -24.328125, -21.271484375, -18.21484375, -15.158203125, -12.1015625, -9.044921875, -5.98828125, -2.931640625, 0.125, 3.181640625, 6.23828125, 9.294921875, 12.3515625, 15.408203125, 18.46484375, 21.521484375, 24.578125, 27.634765625, 30.69140625, 33.748046875, 36.8046875, 39.861328125, 42.91796875, 45.974609375, 49.03125, 52.087890625, 55.14453125, 58.201171875, 61.2578125, 64.314453125, 67.37109375, 70.427734375, 73.484375, 76.541015625, 79.59765625, 82.654296875, 85.7109375, 88.767578125, 91.82421875, 94.880859375, 97.9375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 6.0, 7.0, 16.0, 26.0, 27.0, 62.0, 60.0, 95.0, 101.0, 134.0, 129.0, 110.0, 70.0, 54.0, 36.0, 18.0, 12.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-925.6077270507812, -896.558349609375, -867.509033203125, -838.4596557617188, -809.4102783203125, -780.3609619140625, -751.3115844726562, -722.26220703125, -693.212890625, -664.1635131835938, -635.1141967773438, -606.0648193359375, -577.0155029296875, -547.9661254882812, -518.916748046875, -489.8674011230469, -460.81805419921875, -431.7687072753906, -402.7193603515625, -373.66998291015625, -344.6206359863281, -315.5712890625, -286.52191162109375, -257.4725646972656, -228.4232177734375, -199.37387084960938, -170.3245086669922, -141.275146484375, -112.22579956054688, -83.17645263671875, -54.12709045410156, -25.077728271484375, 3.9715576171875, 33.020912170410156, 62.07026672363281, 91.11962127685547, 120.16897583007812, 149.21832275390625, 178.26768493652344, 207.31704711914062, 236.36639404296875, 265.4157409667969, 294.465087890625, 323.51446533203125, 352.5638122558594, 381.6131591796875, 410.66253662109375, 439.7118835449219, 468.76123046875, 497.8105773925781, 526.8599243164062, 555.9093017578125, 584.9586181640625, 614.0079956054688, 643.057373046875, 672.106689453125, 701.1560668945312, 730.2054443359375, 759.2547607421875, 788.3041381835938, 817.353515625, 846.40283203125, 875.4522094726562, 904.5015869140625, 933.5509033203125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 6.0, 9.0, 11.0, 13.0, 14.0, 28.0, 20.0, 33.0, 35.0, 27.0, 41.0, 46.0, 63.0, 59.0, 72.0, 64.0, 67.0, 54.0, 58.0, 49.0, 37.0, 38.0, 31.0, 19.0, 22.0, 23.0, 13.0, 11.0, 13.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1232.1280517578125, -1200.5604248046875, -1168.99267578125, -1137.425048828125, -1105.857421875, -1074.289794921875, -1042.7220458984375, -1011.1544189453125, -979.5867309570312, -948.01904296875, -916.451416015625, -884.8837280273438, -853.3161010742188, -821.7484130859375, -790.1807861328125, -758.6130981445312, -727.04541015625, -695.4777221679688, -663.9100952148438, -632.3424072265625, -600.7747802734375, -569.2070922851562, -537.639404296875, -506.07177734375, -474.504150390625, -442.9364929199219, -411.36883544921875, -379.8011474609375, -348.2334899902344, -316.66583251953125, -285.0981750488281, -253.53050231933594, -221.96282958984375, -190.39517211914062, -158.82749938964844, -127.25984191894531, -95.69217681884766, -64.12451171875, -32.556854248046875, -0.9891815185546875, 30.578475952148438, 62.146141052246094, 93.71380615234375, 125.28146362304688, 156.84912109375, 188.4167938232422, 219.9844512939453, 251.5521240234375, 283.1197814941406, 314.68743896484375, 346.2550964355469, 377.82275390625, 409.39044189453125, 440.9580993652344, 472.5257568359375, 504.09344482421875, 535.6610717773438, 567.228759765625, 598.79638671875, 630.3640747070312, 661.9317016601562, 693.4993896484375, 725.0670166015625, 756.6347045898438, 788.202392578125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 10.0, 14.0, 12.0, 22.0, 23.0, 43.0, 78.0, 156.0, 234.0, 528.0, 1211.0, 3306.0, 11606.0, 69940.0, 3615496.0, 452477.0, 28762.0, 6810.0, 2181.0, 757.0, 299.0, 128.0, 78.0, 50.0, 17.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.25, -141.072265625, -136.89453125, -132.716796875, -128.5390625, -124.361328125, -120.18359375, -116.005859375, -111.828125, -107.650390625, -103.47265625, -99.294921875, -95.1171875, -90.939453125, -86.76171875, -82.583984375, -78.40625, -74.228515625, -70.05078125, -65.873046875, -61.6953125, -57.517578125, -53.33984375, -49.162109375, -44.984375, -40.806640625, -36.62890625, -32.451171875, -28.2734375, -24.095703125, -19.91796875, -15.740234375, -11.5625, -7.384765625, -3.20703125, 0.970703125, 5.1484375, 9.326171875, 13.50390625, 17.681640625, 21.859375, 26.037109375, 30.21484375, 34.392578125, 38.5703125, 42.748046875, 46.92578125, 51.103515625, 55.28125, 59.458984375, 63.63671875, 67.814453125, 71.9921875, 76.169921875, 80.34765625, 84.525390625, 88.703125, 92.880859375, 97.05859375, 101.236328125, 105.4140625, 109.591796875, 113.76953125, 117.947265625, 122.125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 11.0, 7.0, 36.0, 51.0, 83.0, 85.0, 116.0, 118.0, 121.0, 123.0, 90.0, 60.0, 40.0, 21.0, 11.0, 6.0, 8.0, 1.0, 4.0, 4.0, 3.0, 2.0], "bins": [-162.375, -159.11083984375, -155.8466796875, -152.58251953125, -149.318359375, -146.05419921875, -142.7900390625, -139.52587890625, -136.26171875, -132.99755859375, -129.7333984375, -126.46923828125, -123.205078125, -119.94091796875, -116.6767578125, -113.41259765625, -110.1484375, -106.88427734375, -103.6201171875, -100.35595703125, -97.091796875, -93.82763671875, -90.5634765625, -87.29931640625, -84.03515625, -80.77099609375, -77.5068359375, -74.24267578125, -70.978515625, -67.71435546875, -64.4501953125, -61.18603515625, -57.921875, -54.65771484375, -51.3935546875, -48.12939453125, -44.865234375, -41.60107421875, -38.3369140625, -35.07275390625, -31.80859375, -28.54443359375, -25.2802734375, -22.01611328125, -18.751953125, -15.48779296875, -12.2236328125, -8.95947265625, -5.6953125, -2.43115234375, 0.8330078125, 4.09716796875, 7.361328125, 10.62548828125, 13.8896484375, 17.15380859375, 20.41796875, 23.68212890625, 26.9462890625, 30.21044921875, 33.474609375, 36.73876953125, 40.0029296875, 43.26708984375, 46.53125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 4.0, 9.0, 14.0, 35.0, 54.0, 97.0, 202.0, 455.0, 1229.0, 3028.0, 8414.0, 30164.0, 207266.0, 3668932.0, 227422.0, 32031.0, 9071.0, 3312.0, 1286.0, 636.0, 301.0, 135.0, 75.0, 34.0, 28.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.0, -136.79296875, -132.5859375, -128.37890625, -124.171875, -119.96484375, -115.7578125, -111.55078125, -107.34375, -103.13671875, -98.9296875, -94.72265625, -90.515625, -86.30859375, -82.1015625, -77.89453125, -73.6875, -69.48046875, -65.2734375, -61.06640625, -56.859375, -52.65234375, -48.4453125, -44.23828125, -40.03125, -35.82421875, -31.6171875, -27.41015625, -23.203125, -18.99609375, -14.7890625, -10.58203125, -6.375, -2.16796875, 2.0390625, 6.24609375, 10.453125, 14.66015625, 18.8671875, 23.07421875, 27.28125, 31.48828125, 35.6953125, 39.90234375, 44.109375, 48.31640625, 52.5234375, 56.73046875, 60.9375, 65.14453125, 69.3515625, 73.55859375, 77.765625, 81.97265625, 86.1796875, 90.38671875, 94.59375, 98.80078125, 103.0078125, 107.21484375, 111.421875, 115.62890625, 119.8359375, 124.04296875, 128.25]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 4.0, 13.0, 14.0, 9.0, 10.0, 29.0, 41.0, 48.0, 89.0, 147.0, 342.0, 835.0, 1234.0, 653.0, 232.0, 123.0, 75.0, 58.0, 28.0, 17.0, 7.0, 19.0, 6.0, 9.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.4375, -91.5107421875, -87.583984375, -83.6572265625, -79.73046875, -75.8037109375, -71.876953125, -67.9501953125, -64.0234375, -60.0966796875, -56.169921875, -52.2431640625, -48.31640625, -44.3896484375, -40.462890625, -36.5361328125, -32.609375, -28.6826171875, -24.755859375, -20.8291015625, -16.90234375, -12.9755859375, -9.048828125, -5.1220703125, -1.1953125, 2.7314453125, 6.658203125, 10.5849609375, 14.51171875, 18.4384765625, 22.365234375, 26.2919921875, 30.21875, 34.1455078125, 38.072265625, 41.9990234375, 45.92578125, 49.8525390625, 53.779296875, 57.7060546875, 61.6328125, 65.5595703125, 69.486328125, 73.4130859375, 77.33984375, 81.2666015625, 85.193359375, 89.1201171875, 93.046875, 96.9736328125, 100.900390625, 104.8271484375, 108.75390625, 112.6806640625, 116.607421875, 120.5341796875, 124.4609375, 128.3876953125, 132.314453125, 136.2412109375, 140.16796875, 144.0947265625, 148.021484375, 151.9482421875, 155.875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 10.0, 33.0, 122.0, 307.0, 332.0, 145.0, 39.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1947.9063720703125, -1885.4173583984375, -1822.9283447265625, -1760.4393310546875, -1697.9503173828125, -1635.4613037109375, -1572.9722900390625, -1510.4832763671875, -1447.9942626953125, -1385.5052490234375, -1323.0162353515625, -1260.5272216796875, -1198.0382080078125, -1135.5491943359375, -1073.0601806640625, -1010.5711669921875, -948.0821533203125, -885.5931396484375, -823.1041259765625, -760.6151123046875, -698.1260986328125, -635.6370849609375, -573.1480712890625, -510.6590576171875, -448.1700439453125, -385.6810302734375, -323.1920166015625, -260.7030029296875, -198.2139892578125, -135.7249755859375, -73.2359619140625, -10.7469482421875, 51.7421875, 114.231201171875, 176.72021484375, 239.209228515625, 301.6982421875, 364.187255859375, 426.67626953125, 489.165283203125, 551.654296875, 614.143310546875, 676.63232421875, 739.121337890625, 801.6103515625, 864.099365234375, 926.58837890625, 989.077392578125, 1051.56640625, 1114.055419921875, 1176.54443359375, 1239.033447265625, 1301.5224609375, 1364.011474609375, 1426.50048828125, 1488.989501953125, 1551.478515625, 1613.967529296875, 1676.45654296875, 1738.945556640625, 1801.4345703125, 1863.923583984375, 1926.41259765625, 1988.901611328125, 2051.390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 9.0, 17.0, 14.0, 12.0, 19.0, 35.0, 39.0, 55.0, 54.0, 54.0, 79.0, 80.0, 89.0, 76.0, 77.0, 51.0, 50.0, 42.0, 29.0, 42.0, 24.0, 15.0, 14.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-648.71923828125, -625.78662109375, -602.85400390625, -579.92138671875, -556.98876953125, -534.05615234375, -511.12353515625, -488.19091796875, -465.25830078125, -442.32568359375, -419.39306640625, -396.46044921875, -373.52783203125, -350.59521484375, -327.66259765625, -304.72998046875, -281.7973327636719, -258.8647155761719, -235.93209838867188, -212.99948120117188, -190.06686401367188, -167.13424682617188, -144.2016143798828, -121.26899719238281, -98.33638000488281, -75.40376281738281, -52.47114181518555, -29.53852081298828, -6.605903625488281, 16.32671356201172, 39.25933837890625, 62.19195556640625, 85.12457275390625, 108.05718994140625, 130.98980712890625, 153.92242431640625, 176.85504150390625, 199.78765869140625, 222.7202911376953, 245.6529083251953, 268.58551025390625, 291.51812744140625, 314.45074462890625, 337.38336181640625, 360.31597900390625, 383.24859619140625, 406.18121337890625, 429.11383056640625, 452.0464782714844, 474.9790954589844, 497.9117126464844, 520.8443603515625, 543.7769775390625, 566.7095947265625, 589.6422119140625, 612.5748291015625, 635.5074462890625, 658.4400634765625, 681.3726806640625, 704.3052978515625, 727.2379150390625, 750.1705322265625, 773.1031494140625, 796.0357666015625, 818.9683837890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 11.0, 10.0, 16.0, 16.0, 30.0, 47.0, 79.0, 139.0, 243.0, 391.0, 717.0, 1248.0, 2599.0, 5626.0, 13175.0, 33375.0, 93165.0, 283104.0, 389361.0, 142548.0, 49194.0, 18593.0, 7717.0, 3457.0, 1687.0, 872.0, 489.0, 236.0, 133.0, 102.0, 52.0, 36.0, 35.0, 17.0, 11.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.6875, -84.783203125, -81.87890625, -78.974609375, -76.0703125, -73.166015625, -70.26171875, -67.357421875, -64.453125, -61.548828125, -58.64453125, -55.740234375, -52.8359375, -49.931640625, -47.02734375, -44.123046875, -41.21875, -38.314453125, -35.41015625, -32.505859375, -29.6015625, -26.697265625, -23.79296875, -20.888671875, -17.984375, -15.080078125, -12.17578125, -9.271484375, -6.3671875, -3.462890625, -0.55859375, 2.345703125, 5.25, 8.154296875, 11.05859375, 13.962890625, 16.8671875, 19.771484375, 22.67578125, 25.580078125, 28.484375, 31.388671875, 34.29296875, 37.197265625, 40.1015625, 43.005859375, 45.91015625, 48.814453125, 51.71875, 54.623046875, 57.52734375, 60.431640625, 63.3359375, 66.240234375, 69.14453125, 72.048828125, 74.953125, 77.857421875, 80.76171875, 83.666015625, 86.5703125, 89.474609375, 92.37890625, 95.283203125, 98.1875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 7.0, 6.0, 15.0, 19.0, 22.0, 34.0, 40.0, 47.0, 58.0, 77.0, 64.0, 70.0, 76.0, 74.0, 67.0, 51.0, 70.0, 37.0, 36.0, 37.0, 17.0, 21.0, 19.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-76.0, -74.06982421875, -72.1396484375, -70.20947265625, -68.279296875, -66.34912109375, -64.4189453125, -62.48876953125, -60.55859375, -58.62841796875, -56.6982421875, -54.76806640625, -52.837890625, -50.90771484375, -48.9775390625, -47.04736328125, -45.1171875, -43.18701171875, -41.2568359375, -39.32666015625, -37.396484375, -35.46630859375, -33.5361328125, -31.60595703125, -29.67578125, -27.74560546875, -25.8154296875, -23.88525390625, -21.955078125, -20.02490234375, -18.0947265625, -16.16455078125, -14.234375, -12.30419921875, -10.3740234375, -8.44384765625, -6.513671875, -4.58349609375, -2.6533203125, -0.72314453125, 1.20703125, 3.13720703125, 5.0673828125, 6.99755859375, 8.927734375, 10.85791015625, 12.7880859375, 14.71826171875, 16.6484375, 18.57861328125, 20.5087890625, 22.43896484375, 24.369140625, 26.29931640625, 28.2294921875, 30.15966796875, 32.08984375, 34.02001953125, 35.9501953125, 37.88037109375, 39.810546875, 41.74072265625, 43.6708984375, 45.60107421875, 47.53125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 12.0, 14.0, 17.0, 13.0, 28.0, 49.0, 66.0, 88.0, 172.0, 211.0, 437.0, 673.0, 1246.0, 2809.0, 7509.0, 28436.0, 141475.0, 639752.0, 176376.0, 33864.0, 8850.0, 3076.0, 1406.0, 755.0, 407.0, 255.0, 168.0, 100.0, 80.0, 61.0, 36.0, 24.0, 24.0, 12.0, 9.0, 13.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-148.25, -143.552734375, -138.85546875, -134.158203125, -129.4609375, -124.763671875, -120.06640625, -115.369140625, -110.671875, -105.974609375, -101.27734375, -96.580078125, -91.8828125, -87.185546875, -82.48828125, -77.791015625, -73.09375, -68.396484375, -63.69921875, -59.001953125, -54.3046875, -49.607421875, -44.91015625, -40.212890625, -35.515625, -30.818359375, -26.12109375, -21.423828125, -16.7265625, -12.029296875, -7.33203125, -2.634765625, 2.0625, 6.759765625, 11.45703125, 16.154296875, 20.8515625, 25.548828125, 30.24609375, 34.943359375, 39.640625, 44.337890625, 49.03515625, 53.732421875, 58.4296875, 63.126953125, 67.82421875, 72.521484375, 77.21875, 81.916015625, 86.61328125, 91.310546875, 96.0078125, 100.705078125, 105.40234375, 110.099609375, 114.796875, 119.494140625, 124.19140625, 128.888671875, 133.5859375, 138.283203125, 142.98046875, 147.677734375, 152.375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 6.0, 9.0, 10.0, 10.0, 17.0, 19.0, 22.0, 27.0, 19.0, 26.0, 31.0, 42.0, 31.0, 43.0, 41.0, 40.0, 60.0, 58.0, 54.0, 39.0, 41.0, 45.0, 39.0, 39.0, 25.0, 38.0, 25.0, 31.0, 20.0, 10.0, 16.0, 7.0, 9.0, 8.0, 7.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-120.375, -115.201171875, -110.02734375, -104.853515625, -99.6796875, -94.505859375, -89.33203125, -84.158203125, -78.984375, -73.810546875, -68.63671875, -63.462890625, -58.2890625, -53.115234375, -47.94140625, -42.767578125, -37.59375, -32.419921875, -27.24609375, -22.072265625, -16.8984375, -11.724609375, -6.55078125, -1.376953125, 3.796875, 8.970703125, 14.14453125, 19.318359375, 24.4921875, 29.666015625, 34.83984375, 40.013671875, 45.1875, 50.361328125, 55.53515625, 60.708984375, 65.8828125, 71.056640625, 76.23046875, 81.404296875, 86.578125, 91.751953125, 96.92578125, 102.099609375, 107.2734375, 112.447265625, 117.62109375, 122.794921875, 127.96875, 133.142578125, 138.31640625, 143.490234375, 148.6640625, 153.837890625, 159.01171875, 164.185546875, 169.359375, 174.533203125, 179.70703125, 184.880859375, 190.0546875, 195.228515625, 200.40234375, 205.576171875, 210.75]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 12.0, 13.0, 23.0, 25.0, 43.0, 81.0, 174.0, 343.0, 981.0, 3939.0, 32048.0, 715418.0, 276973.0, 14829.0, 2352.0, 680.0, 308.0, 120.0, 58.0, 51.0, 27.0, 16.0, 17.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.75, -89.0390625, -86.328125, -83.6171875, -80.90625, -78.1953125, -75.484375, -72.7734375, -70.0625, -67.3515625, -64.640625, -61.9296875, -59.21875, -56.5078125, -53.796875, -51.0859375, -48.375, -45.6640625, -42.953125, -40.2421875, -37.53125, -34.8203125, -32.109375, -29.3984375, -26.6875, -23.9765625, -21.265625, -18.5546875, -15.84375, -13.1328125, -10.421875, -7.7109375, -5.0, -2.2890625, 0.421875, 3.1328125, 5.84375, 8.5546875, 11.265625, 13.9765625, 16.6875, 19.3984375, 22.109375, 24.8203125, 27.53125, 30.2421875, 32.953125, 35.6640625, 38.375, 41.0859375, 43.796875, 46.5078125, 49.21875, 51.9296875, 54.640625, 57.3515625, 60.0625, 62.7734375, 65.484375, 68.1953125, 70.90625, 73.6171875, 76.328125, 79.0390625, 81.75]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 9.0, 6.0, 16.0, 9.0, 14.0, 13.0, 26.0, 21.0, 23.0, 29.0, 44.0, 50.0, 52.0, 72.0, 57.0, 62.0, 79.0, 62.0, 52.0, 52.0, 39.0, 37.0, 31.0, 27.0, 29.0, 20.0, 12.0, 14.0, 8.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00856781005859375, -0.008333981037139893, -0.008100152015686035, -0.007866322994232178, -0.00763249397277832, -0.007398664951324463, -0.0071648359298706055, -0.006931006908416748, -0.006697177886962891, -0.006463348865509033, -0.006229519844055176, -0.005995690822601318, -0.005761861801147461, -0.0055280327796936035, -0.005294203758239746, -0.005060374736785889, -0.004826545715332031, -0.004592716693878174, -0.004358887672424316, -0.004125058650970459, -0.0038912296295166016, -0.003657400608062744, -0.0034235715866088867, -0.0031897425651550293, -0.002955913543701172, -0.0027220845222473145, -0.002488255500793457, -0.0022544264793395996, -0.002020597457885742, -0.0017867684364318848, -0.0015529394149780273, -0.00131911039352417, -0.0010852813720703125, -0.0008514523506164551, -0.0006176233291625977, -0.00038379430770874023, -0.0001499652862548828, 8.386373519897461e-05, 0.00031769275665283203, 0.0005515217781066895, 0.0007853507995605469, 0.0010191798210144043, 0.0012530088424682617, 0.0014868378639221191, 0.0017206668853759766, 0.001954495906829834, 0.0021883249282836914, 0.002422153949737549, 0.0026559829711914062, 0.0028898119926452637, 0.003123641014099121, 0.0033574700355529785, 0.003591299057006836, 0.0038251280784606934, 0.004058957099914551, 0.004292786121368408, 0.004526615142822266, 0.004760444164276123, 0.0049942731857299805, 0.005228102207183838, 0.005461931228637695, 0.005695760250091553, 0.00592958927154541, 0.006163418292999268, 0.006397247314453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 13.0, 19.0, 32.0, 84.0, 161.0, 323.0, 1093.0, 5842.0, 109859.0, 899518.0, 27614.0, 2785.0, 722.0, 254.0, 106.0, 59.0, 29.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.5, -96.8203125, -93.140625, -89.4609375, -85.78125, -82.1015625, -78.421875, -74.7421875, -71.0625, -67.3828125, -63.703125, -60.0234375, -56.34375, -52.6640625, -48.984375, -45.3046875, -41.625, -37.9453125, -34.265625, -30.5859375, -26.90625, -23.2265625, -19.546875, -15.8671875, -12.1875, -8.5078125, -4.828125, -1.1484375, 2.53125, 6.2109375, 9.890625, 13.5703125, 17.25, 20.9296875, 24.609375, 28.2890625, 31.96875, 35.6484375, 39.328125, 43.0078125, 46.6875, 50.3671875, 54.046875, 57.7265625, 61.40625, 65.0859375, 68.765625, 72.4453125, 76.125, 79.8046875, 83.484375, 87.1640625, 90.84375, 94.5234375, 98.203125, 101.8828125, 105.5625, 109.2421875, 112.921875, 116.6015625, 120.28125, 123.9609375, 127.640625, 131.3203125, 135.0]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 15.0, 21.0, 22.0, 38.0, 54.0, 68.0, 80.0, 88.0, 102.0, 90.0, 91.0, 75.0, 67.0, 54.0, 31.0, 20.0, 25.0, 9.0, 9.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.6875, -44.7509765625, -42.814453125, -40.8779296875, -38.94140625, -37.0048828125, -35.068359375, -33.1318359375, -31.1953125, -29.2587890625, -27.322265625, -25.3857421875, -23.44921875, -21.5126953125, -19.576171875, -17.6396484375, -15.703125, -13.7666015625, -11.830078125, -9.8935546875, -7.95703125, -6.0205078125, -4.083984375, -2.1474609375, -0.2109375, 1.7255859375, 3.662109375, 5.5986328125, 7.53515625, 9.4716796875, 11.408203125, 13.3447265625, 15.28125, 17.2177734375, 19.154296875, 21.0908203125, 23.02734375, 24.9638671875, 26.900390625, 28.8369140625, 30.7734375, 32.7099609375, 34.646484375, 36.5830078125, 38.51953125, 40.4560546875, 42.392578125, 44.3291015625, 46.265625, 48.2021484375, 50.138671875, 52.0751953125, 54.01171875, 55.9482421875, 57.884765625, 59.8212890625, 61.7578125, 63.6943359375, 65.630859375, 67.5673828125, 69.50390625, 71.4404296875, 73.376953125, 75.3134765625, 77.25]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 12.0, 10.0, 50.0, 89.0, 184.0, 287.0, 187.0, 98.0, 38.0, 17.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1955.6322021484375, -1907.310546875, -1858.989013671875, -1810.6673583984375, -1762.345703125, -1714.024169921875, -1665.7025146484375, -1617.380859375, -1569.059326171875, -1520.7376708984375, -1472.4161376953125, -1424.094482421875, -1375.77294921875, -1327.4512939453125, -1279.129638671875, -1230.80810546875, -1182.4864501953125, -1134.164794921875, -1085.84326171875, -1037.5216064453125, -989.2000122070312, -940.87841796875, -892.5567626953125, -844.2351684570312, -795.91357421875, -747.5919799804688, -699.2703857421875, -650.94873046875, -602.6271362304688, -554.3055419921875, -505.9839172363281, -457.66229248046875, -409.340576171875, -361.01898193359375, -312.6973571777344, -264.375732421875, -216.05413818359375, -167.73252868652344, -119.41091918945312, -71.08929443359375, -22.7677001953125, 25.553909301757812, 73.87551879882812, 122.19712829589844, 170.51873779296875, 218.84034729003906, 267.1619567871094, 315.48358154296875, 363.80517578125, 412.12677001953125, 460.4483947753906, 508.77001953125, 557.0916137695312, 605.4132080078125, 653.73486328125, 702.0564575195312, 750.3780517578125, 798.6996459960938, 847.021240234375, 895.3428955078125, 943.6644897460938, 991.986083984375, 1040.3077392578125, 1088.62939453125, 1136.950927734375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 10.0, 10.0, 12.0, 19.0, 14.0, 28.0, 19.0, 16.0, 31.0, 22.0, 32.0, 31.0, 39.0, 46.0, 46.0, 41.0, 56.0, 65.0, 51.0, 52.0, 49.0, 48.0, 31.0, 29.0, 29.0, 32.0, 26.0, 17.0, 15.0, 16.0, 12.0, 9.0, 13.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-662.2112426757812, -640.7745971679688, -619.3379516601562, -597.9013061523438, -576.4646606445312, -555.0280151367188, -533.59130859375, -512.1546630859375, -490.7180480957031, -469.2814025878906, -447.8447570800781, -426.4080810546875, -404.971435546875, -383.5347900390625, -362.09814453125, -340.6614990234375, -319.224853515625, -297.7882080078125, -276.3515625, -254.91490173339844, -233.47825622558594, -212.04161071777344, -190.60494995117188, -169.16830444335938, -147.73165893554688, -126.29501342773438, -104.85836029052734, -83.42170715332031, -61.98506164550781, -40.54841613769531, -19.11175537109375, 2.32489013671875, 23.7615966796875, 45.198246002197266, 66.63489532470703, 88.07154846191406, 109.50819396972656, 130.94483947753906, 152.38150024414062, 173.81814575195312, 195.25479125976562, 216.69143676757812, 238.12808227539062, 259.56475830078125, 281.00140380859375, 302.43804931640625, 323.87469482421875, 345.31134033203125, 366.74798583984375, 388.18463134765625, 409.62127685546875, 431.05792236328125, 452.49456787109375, 473.93121337890625, 495.3678894042969, 516.8045654296875, 538.2412109375, 559.6778564453125, 581.114501953125, 602.5511474609375, 623.98779296875, 645.4244384765625, 666.861083984375, 688.2977294921875, 709.734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 6.0, 12.0, 18.0, 22.0, 53.0, 64.0, 92.0, 138.0, 217.0, 375.0, 663.0, 1463.0, 3369.0, 8995.0, 27265.0, 111247.0, 937328.0, 2716356.0, 304310.0, 55715.0, 15976.0, 5763.0, 2346.0, 1107.0, 597.0, 288.0, 177.0, 100.0, 80.0, 42.0, 24.0, 19.0, 14.0, 8.0, 13.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.84375, -57.72705078125, -55.6103515625, -53.49365234375, -51.376953125, -49.26025390625, -47.1435546875, -45.02685546875, -42.91015625, -40.79345703125, -38.6767578125, -36.56005859375, -34.443359375, -32.32666015625, -30.2099609375, -28.09326171875, -25.9765625, -23.85986328125, -21.7431640625, -19.62646484375, -17.509765625, -15.39306640625, -13.2763671875, -11.15966796875, -9.04296875, -6.92626953125, -4.8095703125, -2.69287109375, -0.576171875, 1.54052734375, 3.6572265625, 5.77392578125, 7.890625, 10.00732421875, 12.1240234375, 14.24072265625, 16.357421875, 18.47412109375, 20.5908203125, 22.70751953125, 24.82421875, 26.94091796875, 29.0576171875, 31.17431640625, 33.291015625, 35.40771484375, 37.5244140625, 39.64111328125, 41.7578125, 43.87451171875, 45.9912109375, 48.10791015625, 50.224609375, 52.34130859375, 54.4580078125, 56.57470703125, 58.69140625, 60.80810546875, 62.9248046875, 65.04150390625, 67.158203125, 69.27490234375, 71.3916015625, 73.50830078125, 75.625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 10.0, 13.0, 17.0, 26.0, 34.0, 34.0, 38.0, 52.0, 45.0, 42.0, 58.0, 60.0, 61.0, 60.0, 69.0, 51.0, 54.0, 41.0, 44.0, 32.0, 30.0, 28.0, 17.0, 16.0, 13.0, 10.0, 14.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.05126953125, -31.6650390625, -30.27880859375, -28.892578125, -27.50634765625, -26.1201171875, -24.73388671875, -23.34765625, -21.96142578125, -20.5751953125, -19.18896484375, -17.802734375, -16.41650390625, -15.0302734375, -13.64404296875, -12.2578125, -10.87158203125, -9.4853515625, -8.09912109375, -6.712890625, -5.32666015625, -3.9404296875, -2.55419921875, -1.16796875, 0.21826171875, 1.6044921875, 2.99072265625, 4.376953125, 5.76318359375, 7.1494140625, 8.53564453125, 9.921875, 11.30810546875, 12.6943359375, 14.08056640625, 15.466796875, 16.85302734375, 18.2392578125, 19.62548828125, 21.01171875, 22.39794921875, 23.7841796875, 25.17041015625, 26.556640625, 27.94287109375, 29.3291015625, 30.71533203125, 32.1015625, 33.48779296875, 34.8740234375, 36.26025390625, 37.646484375, 39.03271484375, 40.4189453125, 41.80517578125, 43.19140625, 44.57763671875, 45.9638671875, 47.35009765625, 48.736328125, 50.12255859375, 51.5087890625, 52.89501953125, 54.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 1.0, 11.0, 26.0, 20.0, 27.0, 43.0, 79.0, 125.0, 185.0, 391.0, 726.0, 1716.0, 4611.0, 16342.0, 81534.0, 1161903.0, 2782073.0, 117344.0, 18917.0, 5118.0, 1629.0, 648.0, 347.0, 165.0, 92.0, 56.0, 48.0, 25.0, 20.0, 11.0, 8.0, 7.0, 3.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-138.5, -134.8662109375, -131.232421875, -127.5986328125, -123.96484375, -120.3310546875, -116.697265625, -113.0634765625, -109.4296875, -105.7958984375, -102.162109375, -98.5283203125, -94.89453125, -91.2607421875, -87.626953125, -83.9931640625, -80.359375, -76.7255859375, -73.091796875, -69.4580078125, -65.82421875, -62.1904296875, -58.556640625, -54.9228515625, -51.2890625, -47.6552734375, -44.021484375, -40.3876953125, -36.75390625, -33.1201171875, -29.486328125, -25.8525390625, -22.21875, -18.5849609375, -14.951171875, -11.3173828125, -7.68359375, -4.0498046875, -0.416015625, 3.2177734375, 6.8515625, 10.4853515625, 14.119140625, 17.7529296875, 21.38671875, 25.0205078125, 28.654296875, 32.2880859375, 35.921875, 39.5556640625, 43.189453125, 46.8232421875, 50.45703125, 54.0908203125, 57.724609375, 61.3583984375, 64.9921875, 68.6259765625, 72.259765625, 75.8935546875, 79.52734375, 83.1611328125, 86.794921875, 90.4287109375, 94.0625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 12.0, 16.0, 14.0, 16.0, 30.0, 27.0, 30.0, 40.0, 67.0, 67.0, 142.0, 189.0, 293.0, 503.0, 799.0, 659.0, 390.0, 270.0, 140.0, 96.0, 75.0, 38.0, 44.0, 31.0, 14.0, 10.0, 10.0, 8.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.75, -94.66796875, -91.5859375, -88.50390625, -85.421875, -82.33984375, -79.2578125, -76.17578125, -73.09375, -70.01171875, -66.9296875, -63.84765625, -60.765625, -57.68359375, -54.6015625, -51.51953125, -48.4375, -45.35546875, -42.2734375, -39.19140625, -36.109375, -33.02734375, -29.9453125, -26.86328125, -23.78125, -20.69921875, -17.6171875, -14.53515625, -11.453125, -8.37109375, -5.2890625, -2.20703125, 0.875, 3.95703125, 7.0390625, 10.12109375, 13.203125, 16.28515625, 19.3671875, 22.44921875, 25.53125, 28.61328125, 31.6953125, 34.77734375, 37.859375, 40.94140625, 44.0234375, 47.10546875, 50.1875, 53.26953125, 56.3515625, 59.43359375, 62.515625, 65.59765625, 68.6796875, 71.76171875, 74.84375, 77.92578125, 81.0078125, 84.08984375, 87.171875, 90.25390625, 93.3359375, 96.41796875, 99.5]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 5.0, 17.0, 27.0, 85.0, 232.0, 317.0, 178.0, 98.0, 18.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2697.83203125, -2643.29443359375, -2588.757080078125, -2534.219482421875, -2479.681884765625, -2425.14453125, -2370.60693359375, -2316.0693359375, -2261.531982421875, -2206.994384765625, -2152.45703125, -2097.91943359375, -2043.3819580078125, -1988.844482421875, -1934.306884765625, -1879.7694091796875, -1825.2318115234375, -1770.6943359375, -1716.15673828125, -1661.6192626953125, -1607.081787109375, -1552.544189453125, -1498.0067138671875, -1443.46923828125, -1388.931640625, -1334.3941650390625, -1279.8565673828125, -1225.319091796875, -1170.7816162109375, -1116.244140625, -1061.70654296875, -1007.1690673828125, -952.6315307617188, -898.093994140625, -843.5565185546875, -789.0189819335938, -734.4814453125, -679.9439697265625, -625.4064331054688, -570.868896484375, -516.3314208984375, -461.7939147949219, -407.25640869140625, -352.7188720703125, -298.1813659667969, -243.64385986328125, -189.1063232421875, -134.56881713867188, -80.03131103515625, -25.493797302246094, 29.043716430664062, 83.58123779296875, 138.11874389648438, 192.65625, 247.19378662109375, 301.7312927246094, 356.268798828125, 410.8063049316406, 465.34381103515625, 519.88134765625, 574.4188232421875, 628.9563598632812, 683.493896484375, 738.0313720703125, 792.5689086914062]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 6.0, 7.0, 13.0, 10.0, 23.0, 27.0, 28.0, 35.0, 22.0, 36.0, 48.0, 61.0, 55.0, 67.0, 52.0, 43.0, 54.0, 56.0, 58.0, 47.0, 40.0, 37.0, 36.0, 30.0, 27.0, 17.0, 11.0, 7.0, 5.0, 12.0, 4.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-604.5279541015625, -584.8312377929688, -565.134521484375, -545.4378662109375, -525.7411499023438, -506.04443359375, -486.34771728515625, -466.6510009765625, -446.9543151855469, -427.2575988769531, -407.5609130859375, -387.86419677734375, -368.16748046875, -348.4707946777344, -328.7740783691406, -309.077392578125, -289.38067626953125, -269.6839599609375, -249.98727416992188, -230.29055786132812, -210.59385681152344, -190.89715576171875, -171.200439453125, -151.5037384033203, -131.80703735351562, -112.11033630371094, -92.41362762451172, -72.7169189453125, -53.02021789550781, -33.323516845703125, -13.626808166503906, 6.0699005126953125, 25.7666015625, 45.46330642700195, 65.1600112915039, 84.85671997070312, 104.55342102050781, 124.2501220703125, 143.94683837890625, 163.64353942871094, 183.34024047851562, 203.0369415283203, 222.733642578125, 242.43035888671875, 262.1270751953125, 281.8237609863281, 301.5204772949219, 321.2171630859375, 340.91387939453125, 360.610595703125, 380.3072814941406, 400.0039978027344, 419.70068359375, 439.39739990234375, 459.0941162109375, 478.79083251953125, 498.4875183105469, 518.1842041015625, 537.8809204101562, 557.57763671875, 577.2743530273438, 596.9710693359375, 616.667724609375, 636.3644409179688, 656.0611572265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 12.0, 11.0, 17.0, 19.0, 46.0, 75.0, 95.0, 209.0, 424.0, 989.0, 2447.0, 7167.0, 22755.0, 78838.0, 261565.0, 431087.0, 170768.0, 49593.0, 14545.0, 4770.0, 1619.0, 742.0, 334.0, 167.0, 97.0, 51.0, 28.0, 31.0, 21.0, 10.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-114.9375, -111.7724609375, -108.607421875, -105.4423828125, -102.27734375, -99.1123046875, -95.947265625, -92.7822265625, -89.6171875, -86.4521484375, -83.287109375, -80.1220703125, -76.95703125, -73.7919921875, -70.626953125, -67.4619140625, -64.296875, -61.1318359375, -57.966796875, -54.8017578125, -51.63671875, -48.4716796875, -45.306640625, -42.1416015625, -38.9765625, -35.8115234375, -32.646484375, -29.4814453125, -26.31640625, -23.1513671875, -19.986328125, -16.8212890625, -13.65625, -10.4912109375, -7.326171875, -4.1611328125, -0.99609375, 2.1689453125, 5.333984375, 8.4990234375, 11.6640625, 14.8291015625, 17.994140625, 21.1591796875, 24.32421875, 27.4892578125, 30.654296875, 33.8193359375, 36.984375, 40.1494140625, 43.314453125, 46.4794921875, 49.64453125, 52.8095703125, 55.974609375, 59.1396484375, 62.3046875, 65.4697265625, 68.634765625, 71.7998046875, 74.96484375, 78.1298828125, 81.294921875, 84.4599609375, 87.625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 10.0, 5.0, 9.0, 12.0, 16.0, 25.0, 33.0, 32.0, 41.0, 27.0, 49.0, 57.0, 61.0, 60.0, 59.0, 69.0, 56.0, 56.0, 52.0, 68.0, 44.0, 34.0, 30.0, 28.0, 18.0, 14.0, 12.0, 13.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.80419921875, -39.2958984375, -37.78759765625, -36.279296875, -34.77099609375, -33.2626953125, -31.75439453125, -30.24609375, -28.73779296875, -27.2294921875, -25.72119140625, -24.212890625, -22.70458984375, -21.1962890625, -19.68798828125, -18.1796875, -16.67138671875, -15.1630859375, -13.65478515625, -12.146484375, -10.63818359375, -9.1298828125, -7.62158203125, -6.11328125, -4.60498046875, -3.0966796875, -1.58837890625, -0.080078125, 1.42822265625, 2.9365234375, 4.44482421875, 5.953125, 7.46142578125, 8.9697265625, 10.47802734375, 11.986328125, 13.49462890625, 15.0029296875, 16.51123046875, 18.01953125, 19.52783203125, 21.0361328125, 22.54443359375, 24.052734375, 25.56103515625, 27.0693359375, 28.57763671875, 30.0859375, 31.59423828125, 33.1025390625, 34.61083984375, 36.119140625, 37.62744140625, 39.1357421875, 40.64404296875, 42.15234375, 43.66064453125, 45.1689453125, 46.67724609375, 48.185546875, 49.69384765625, 51.2021484375, 52.71044921875, 54.21875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 7.0, 4.0, 9.0, 8.0, 15.0, 21.0, 24.0, 44.0, 42.0, 66.0, 123.0, 188.0, 232.0, 364.0, 561.0, 975.0, 1630.0, 3516.0, 9829.0, 46755.0, 348884.0, 554582.0, 60182.0, 11794.0, 3952.0, 1895.0, 965.0, 592.0, 405.0, 278.0, 179.0, 114.0, 93.0, 65.0, 38.0, 28.0, 21.0, 23.0, 11.0, 6.0, 10.0, 3.0, 3.0, 10.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-131.25, -126.734375, -122.21875, -117.703125, -113.1875, -108.671875, -104.15625, -99.640625, -95.125, -90.609375, -86.09375, -81.578125, -77.0625, -72.546875, -68.03125, -63.515625, -59.0, -54.484375, -49.96875, -45.453125, -40.9375, -36.421875, -31.90625, -27.390625, -22.875, -18.359375, -13.84375, -9.328125, -4.8125, -0.296875, 4.21875, 8.734375, 13.25, 17.765625, 22.28125, 26.796875, 31.3125, 35.828125, 40.34375, 44.859375, 49.375, 53.890625, 58.40625, 62.921875, 67.4375, 71.953125, 76.46875, 80.984375, 85.5, 90.015625, 94.53125, 99.046875, 103.5625, 108.078125, 112.59375, 117.109375, 121.625, 126.140625, 130.65625, 135.171875, 139.6875, 144.203125, 148.71875, 153.234375, 157.75]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 7.0, 4.0, 11.0, 14.0, 10.0, 28.0, 26.0, 28.0, 37.0, 42.0, 42.0, 47.0, 47.0, 58.0, 58.0, 65.0, 54.0, 58.0, 59.0, 36.0, 30.0, 51.0, 21.0, 31.0, 30.0, 18.0, 9.0, 18.0, 7.0, 11.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-182.125, -176.130859375, -170.13671875, -164.142578125, -158.1484375, -152.154296875, -146.16015625, -140.166015625, -134.171875, -128.177734375, -122.18359375, -116.189453125, -110.1953125, -104.201171875, -98.20703125, -92.212890625, -86.21875, -80.224609375, -74.23046875, -68.236328125, -62.2421875, -56.248046875, -50.25390625, -44.259765625, -38.265625, -32.271484375, -26.27734375, -20.283203125, -14.2890625, -8.294921875, -2.30078125, 3.693359375, 9.6875, 15.681640625, 21.67578125, 27.669921875, 33.6640625, 39.658203125, 45.65234375, 51.646484375, 57.640625, 63.634765625, 69.62890625, 75.623046875, 81.6171875, 87.611328125, 93.60546875, 99.599609375, 105.59375, 111.587890625, 117.58203125, 123.576171875, 129.5703125, 135.564453125, 141.55859375, 147.552734375, 153.546875, 159.541015625, 165.53515625, 171.529296875, 177.5234375, 183.517578125, 189.51171875, 195.505859375, 201.5]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 4.0, 8.0, 10.0, 14.0, 18.0, 24.0, 37.0, 65.0, 117.0, 186.0, 442.0, 1505.0, 8550.0, 232771.0, 784187.0, 17078.0, 2279.0, 635.0, 281.0, 115.0, 58.0, 44.0, 21.0, 23.0, 15.0, 12.0, 11.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.25, -85.416015625, -82.58203125, -79.748046875, -76.9140625, -74.080078125, -71.24609375, -68.412109375, -65.578125, -62.744140625, -59.91015625, -57.076171875, -54.2421875, -51.408203125, -48.57421875, -45.740234375, -42.90625, -40.072265625, -37.23828125, -34.404296875, -31.5703125, -28.736328125, -25.90234375, -23.068359375, -20.234375, -17.400390625, -14.56640625, -11.732421875, -8.8984375, -6.064453125, -3.23046875, -0.396484375, 2.4375, 5.271484375, 8.10546875, 10.939453125, 13.7734375, 16.607421875, 19.44140625, 22.275390625, 25.109375, 27.943359375, 30.77734375, 33.611328125, 36.4453125, 39.279296875, 42.11328125, 44.947265625, 47.78125, 50.615234375, 53.44921875, 56.283203125, 59.1171875, 61.951171875, 64.78515625, 67.619140625, 70.453125, 73.287109375, 76.12109375, 78.955078125, 81.7890625, 84.623046875, 87.45703125, 90.291015625, 93.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 9.0, 25.0, 22.0, 28.0, 30.0, 34.0, 55.0, 66.0, 92.0, 115.0, 112.0, 88.0, 53.0, 48.0, 35.0, 41.0, 27.0, 25.0, 13.0, 8.0, 15.0, 13.0, 6.0, 4.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010528564453125, -0.0102006196975708, -0.009872674942016602, -0.009544730186462402, -0.009216785430908203, -0.008888840675354004, -0.008560895919799805, -0.008232951164245605, -0.007905006408691406, -0.007577061653137207, -0.007249116897583008, -0.006921172142028809, -0.006593227386474609, -0.00626528263092041, -0.005937337875366211, -0.005609393119812012, -0.0052814483642578125, -0.004953503608703613, -0.004625558853149414, -0.004297614097595215, -0.003969669342041016, -0.0036417245864868164, -0.003313779830932617, -0.002985835075378418, -0.0026578903198242188, -0.0023299455642700195, -0.0020020008087158203, -0.001674056053161621, -0.0013461112976074219, -0.0010181665420532227, -0.0006902217864990234, -0.0003622770309448242, -3.4332275390625e-05, 0.0002936124801635742, 0.0006215572357177734, 0.0009495019912719727, 0.0012774467468261719, 0.001605391502380371, 0.0019333362579345703, 0.0022612810134887695, 0.0025892257690429688, 0.002917170524597168, 0.003245115280151367, 0.0035730600357055664, 0.0039010047912597656, 0.004228949546813965, 0.004556894302368164, 0.004884839057922363, 0.0052127838134765625, 0.005540728569030762, 0.005868673324584961, 0.00619661808013916, 0.006524562835693359, 0.006852507591247559, 0.007180452346801758, 0.007508397102355957, 0.007836341857910156, 0.008164286613464355, 0.008492231369018555, 0.008820176124572754, 0.009148120880126953, 0.009476065635681152, 0.009804010391235352, 0.01013195514678955, 0.01045989990234375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 7.0, 16.0, 18.0, 19.0, 36.0, 50.0, 95.0, 164.0, 260.0, 581.0, 1311.0, 3451.0, 13189.0, 171773.0, 815860.0, 32161.0, 5975.0, 1895.0, 828.0, 349.0, 177.0, 104.0, 77.0, 49.0, 31.0, 17.0, 13.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.0625, -72.7333984375, -70.404296875, -68.0751953125, -65.74609375, -63.4169921875, -61.087890625, -58.7587890625, -56.4296875, -54.1005859375, -51.771484375, -49.4423828125, -47.11328125, -44.7841796875, -42.455078125, -40.1259765625, -37.796875, -35.4677734375, -33.138671875, -30.8095703125, -28.48046875, -26.1513671875, -23.822265625, -21.4931640625, -19.1640625, -16.8349609375, -14.505859375, -12.1767578125, -9.84765625, -7.5185546875, -5.189453125, -2.8603515625, -0.53125, 1.7978515625, 4.126953125, 6.4560546875, 8.78515625, 11.1142578125, 13.443359375, 15.7724609375, 18.1015625, 20.4306640625, 22.759765625, 25.0888671875, 27.41796875, 29.7470703125, 32.076171875, 34.4052734375, 36.734375, 39.0634765625, 41.392578125, 43.7216796875, 46.05078125, 48.3798828125, 50.708984375, 53.0380859375, 55.3671875, 57.6962890625, 60.025390625, 62.3544921875, 64.68359375, 67.0126953125, 69.341796875, 71.6708984375, 74.0]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 0.0, 3.0, 5.0, 7.0, 7.0, 5.0, 7.0, 8.0, 17.0, 27.0, 42.0, 38.0, 58.0, 93.0, 122.0, 142.0, 129.0, 96.0, 58.0, 39.0, 26.0, 21.0, 9.0, 10.0, 6.0, 9.0, 5.0, 2.0, 1.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1875, -54.396484375, -52.60546875, -50.814453125, -49.0234375, -47.232421875, -45.44140625, -43.650390625, -41.859375, -40.068359375, -38.27734375, -36.486328125, -34.6953125, -32.904296875, -31.11328125, -29.322265625, -27.53125, -25.740234375, -23.94921875, -22.158203125, -20.3671875, -18.576171875, -16.78515625, -14.994140625, -13.203125, -11.412109375, -9.62109375, -7.830078125, -6.0390625, -4.248046875, -2.45703125, -0.666015625, 1.125, 2.916015625, 4.70703125, 6.498046875, 8.2890625, 10.080078125, 11.87109375, 13.662109375, 15.453125, 17.244140625, 19.03515625, 20.826171875, 22.6171875, 24.408203125, 26.19921875, 27.990234375, 29.78125, 31.572265625, 33.36328125, 35.154296875, 36.9453125, 38.736328125, 40.52734375, 42.318359375, 44.109375, 45.900390625, 47.69140625, 49.482421875, 51.2734375, 53.064453125, 54.85546875, 56.646484375, 58.4375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 13.0, 36.0, 51.0, 112.0, 209.0, 239.0, 149.0, 88.0, 45.0, 22.0, 18.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1324.128662109375, -1288.4403076171875, -1252.751953125, -1217.0635986328125, -1181.375244140625, -1145.686767578125, -1109.99853515625, -1074.31005859375, -1038.6217041015625, -1002.933349609375, -967.2449951171875, -931.556640625, -895.8682250976562, -860.1798706054688, -824.4915161132812, -788.8031616210938, -753.1148071289062, -717.4264526367188, -681.7380981445312, -646.0496826171875, -610.361328125, -574.6729736328125, -538.984619140625, -503.2962646484375, -467.6078796386719, -431.9195251464844, -396.23114013671875, -360.54278564453125, -324.85443115234375, -289.1660461425781, -253.47769165039062, -217.78932189941406, -182.10089111328125, -146.4125213623047, -110.72415924072266, -75.03579711914062, -39.34742736816406, -3.6590576171875, 32.029296875, 67.71766662597656, 103.40603637695312, 139.0944061279297, 174.78277587890625, 210.47113037109375, 246.1595001220703, 281.8478698730469, 317.5362243652344, 353.224609375, 388.9129638671875, 424.601318359375, 460.2897033691406, 495.9780578613281, 531.6664428710938, 567.3547973632812, 603.0431518554688, 638.7315063476562, 674.419921875, 710.1082763671875, 745.796630859375, 781.4849853515625, 817.1734008789062, 852.8617553710938, 888.5501098632812, 924.2384643554688, 959.9268188476562]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 17.0, 23.0, 30.0, 23.0, 31.0, 36.0, 28.0, 26.0, 43.0, 62.0, 66.0, 73.0, 79.0, 71.0, 53.0, 23.0, 28.0, 31.0, 24.0, 31.0, 27.0, 20.0, 24.0, 19.0, 13.0, 10.0, 7.0, 9.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-619.3637084960938, -598.286865234375, -577.2100219726562, -556.1331787109375, -535.0562744140625, -513.9794311523438, -492.902587890625, -471.82574462890625, -450.7489013671875, -429.67205810546875, -408.5951843261719, -387.5183410644531, -366.4414978027344, -345.3646240234375, -324.28778076171875, -303.2109375, -282.1340637207031, -261.0572204589844, -239.98036193847656, -218.90350341796875, -197.82666015625, -176.7498016357422, -155.67294311523438, -134.59609985351562, -113.51924133300781, -92.44239044189453, -71.36553955078125, -50.28868103027344, -29.211830139160156, -8.134979248046875, 12.941879272460938, 34.01872253417969, 55.0955810546875, 76.17243194580078, 97.24928283691406, 118.32614135742188, 139.40298461914062, 160.47984313964844, 181.55670166015625, 202.633544921875, 223.7104034423828, 244.78726196289062, 265.8641052246094, 286.94097900390625, 308.017822265625, 329.09466552734375, 350.1715087890625, 371.24835205078125, 392.3252258300781, 413.4020690917969, 434.47894287109375, 455.5557861328125, 476.63262939453125, 497.70947265625, 518.786376953125, 539.8631591796875, 560.9400634765625, 582.0169067382812, 603.09375, 624.170654296875, 645.2474975585938, 666.3243408203125, 687.4011840820312, 708.47802734375, 729.5548706054688]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 12.0, 11.0, 17.0, 27.0, 24.0, 48.0, 64.0, 96.0, 208.0, 494.0, 1687.0, 8416.0, 74574.0, 2573819.0, 1478479.0, 47538.0, 6465.0, 1385.0, 402.0, 173.0, 89.0, 46.0, 48.0, 25.0, 19.0, 20.0, 14.0, 11.0, 12.0, 5.0, 8.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-105.9375, -102.9033203125, -99.869140625, -96.8349609375, -93.80078125, -90.7666015625, -87.732421875, -84.6982421875, -81.6640625, -78.6298828125, -75.595703125, -72.5615234375, -69.52734375, -66.4931640625, -63.458984375, -60.4248046875, -57.390625, -54.3564453125, -51.322265625, -48.2880859375, -45.25390625, -42.2197265625, -39.185546875, -36.1513671875, -33.1171875, -30.0830078125, -27.048828125, -24.0146484375, -20.98046875, -17.9462890625, -14.912109375, -11.8779296875, -8.84375, -5.8095703125, -2.775390625, 0.2587890625, 3.29296875, 6.3271484375, 9.361328125, 12.3955078125, 15.4296875, 18.4638671875, 21.498046875, 24.5322265625, 27.56640625, 30.6005859375, 33.634765625, 36.6689453125, 39.703125, 42.7373046875, 45.771484375, 48.8056640625, 51.83984375, 54.8740234375, 57.908203125, 60.9423828125, 63.9765625, 67.0107421875, 70.044921875, 73.0791015625, 76.11328125, 79.1474609375, 82.181640625, 85.2158203125, 88.25]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 13.0, 16.0, 20.0, 17.0, 16.0, 20.0, 19.0, 32.0, 36.0, 33.0, 40.0, 27.0, 35.0, 40.0, 44.0, 45.0, 55.0, 37.0, 55.0, 44.0, 49.0, 31.0, 43.0, 32.0, 40.0, 22.0, 27.0, 22.0, 15.0, 10.0, 10.0, 11.0, 7.0, 10.0, 5.0, 6.0, 2.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.515625, -30.446044921875, -29.37646484375, -28.306884765625, -27.2373046875, -26.167724609375, -25.09814453125, -24.028564453125, -22.958984375, -21.889404296875, -20.81982421875, -19.750244140625, -18.6806640625, -17.611083984375, -16.54150390625, -15.471923828125, -14.40234375, -13.332763671875, -12.26318359375, -11.193603515625, -10.1240234375, -9.054443359375, -7.98486328125, -6.915283203125, -5.845703125, -4.776123046875, -3.70654296875, -2.636962890625, -1.5673828125, -0.497802734375, 0.57177734375, 1.641357421875, 2.7109375, 3.780517578125, 4.85009765625, 5.919677734375, 6.9892578125, 8.058837890625, 9.12841796875, 10.197998046875, 11.267578125, 12.337158203125, 13.40673828125, 14.476318359375, 15.5458984375, 16.615478515625, 17.68505859375, 18.754638671875, 19.82421875, 20.893798828125, 21.96337890625, 23.032958984375, 24.1025390625, 25.172119140625, 26.24169921875, 27.311279296875, 28.380859375, 29.450439453125, 30.52001953125, 31.589599609375, 32.6591796875, 33.728759765625, 34.79833984375, 35.867919921875, 36.9375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 6.0, 12.0, 23.0, 37.0, 67.0, 98.0, 229.0, 483.0, 1264.0, 4188.0, 18627.0, 133569.0, 3444162.0, 543268.0, 38576.0, 6862.0, 1718.0, 569.0, 226.0, 131.0, 59.0, 28.0, 20.0, 13.0, 15.0, 7.0, 4.0, 2.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.6875, -121.2919921875, -117.896484375, -114.5009765625, -111.10546875, -107.7099609375, -104.314453125, -100.9189453125, -97.5234375, -94.1279296875, -90.732421875, -87.3369140625, -83.94140625, -80.5458984375, -77.150390625, -73.7548828125, -70.359375, -66.9638671875, -63.568359375, -60.1728515625, -56.77734375, -53.3818359375, -49.986328125, -46.5908203125, -43.1953125, -39.7998046875, -36.404296875, -33.0087890625, -29.61328125, -26.2177734375, -22.822265625, -19.4267578125, -16.03125, -12.6357421875, -9.240234375, -5.8447265625, -2.44921875, 0.9462890625, 4.341796875, 7.7373046875, 11.1328125, 14.5283203125, 17.923828125, 21.3193359375, 24.71484375, 28.1103515625, 31.505859375, 34.9013671875, 38.296875, 41.6923828125, 45.087890625, 48.4833984375, 51.87890625, 55.2744140625, 58.669921875, 62.0654296875, 65.4609375, 68.8564453125, 72.251953125, 75.6474609375, 79.04296875, 82.4384765625, 85.833984375, 89.2294921875, 92.625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 6.0, 10.0, 13.0, 13.0, 19.0, 19.0, 19.0, 24.0, 32.0, 40.0, 66.0, 93.0, 173.0, 266.0, 415.0, 645.0, 714.0, 523.0, 350.0, 204.0, 121.0, 90.0, 52.0, 38.0, 30.0, 28.0, 12.0, 13.0, 12.0, 11.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-91.3125, -88.7861328125, -86.259765625, -83.7333984375, -81.20703125, -78.6806640625, -76.154296875, -73.6279296875, -71.1015625, -68.5751953125, -66.048828125, -63.5224609375, -60.99609375, -58.4697265625, -55.943359375, -53.4169921875, -50.890625, -48.3642578125, -45.837890625, -43.3115234375, -40.78515625, -38.2587890625, -35.732421875, -33.2060546875, -30.6796875, -28.1533203125, -25.626953125, -23.1005859375, -20.57421875, -18.0478515625, -15.521484375, -12.9951171875, -10.46875, -7.9423828125, -5.416015625, -2.8896484375, -0.36328125, 2.1630859375, 4.689453125, 7.2158203125, 9.7421875, 12.2685546875, 14.794921875, 17.3212890625, 19.84765625, 22.3740234375, 24.900390625, 27.4267578125, 29.953125, 32.4794921875, 35.005859375, 37.5322265625, 40.05859375, 42.5849609375, 45.111328125, 47.6376953125, 50.1640625, 52.6904296875, 55.216796875, 57.7431640625, 60.26953125, 62.7958984375, 65.322265625, 67.8486328125, 70.375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 10.0, 40.0, 159.0, 357.0, 294.0, 96.0, 28.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-977.974609375, -926.07958984375, -874.1845703125, -822.28955078125, -770.39453125, -718.49951171875, -666.6045532226562, -614.7095336914062, -562.8145141601562, -510.91949462890625, -459.02447509765625, -407.1294860839844, -355.2344665527344, -303.3394470214844, -251.4444580078125, -199.5494384765625, -147.6544189453125, -95.75940704345703, -43.86439514160156, 8.030609130859375, 59.925628662109375, 111.82064819335938, 163.71563720703125, 215.61065673828125, 267.50567626953125, 319.40069580078125, 371.29571533203125, 423.1907043457031, 475.0857238769531, 526.980712890625, 578.875732421875, 630.770751953125, 682.665771484375, 734.560791015625, 786.455810546875, 838.350830078125, 890.245849609375, 942.140869140625, 994.0358276367188, 1045.930908203125, 1097.825927734375, 1149.720947265625, 1201.615966796875, 1253.510986328125, 1305.406005859375, 1357.301025390625, 1409.196044921875, 1461.091064453125, 1512.9859619140625, 1564.8809814453125, 1616.7760009765625, 1668.6710205078125, 1720.5660400390625, 1772.4610595703125, 1824.35595703125, 1876.2509765625, 1928.14599609375, 1980.041015625, 2031.93603515625, 2083.8310546875, 2135.72607421875, 2187.62109375, 2239.51611328125, 2291.4111328125, 2343.30615234375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 9.0, 10.0, 9.0, 17.0, 19.0, 20.0, 18.0, 30.0, 43.0, 33.0, 44.0, 45.0, 48.0, 45.0, 61.0, 55.0, 55.0, 62.0, 37.0, 28.0, 55.0, 51.0, 22.0, 40.0, 20.0, 23.0, 22.0, 13.0, 13.0, 7.0, 7.0, 7.0, 5.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-544.79833984375, -530.513916015625, -516.2295532226562, -501.94512939453125, -487.6607360839844, -473.3763427734375, -459.0919189453125, -444.8075256347656, -430.52313232421875, -416.2387390136719, -401.9543151855469, -387.669921875, -373.3855285644531, -359.10113525390625, -344.81671142578125, -330.5323181152344, -316.2478942871094, -301.9635009765625, -287.6790771484375, -273.3946838378906, -259.11029052734375, -244.8258819580078, -230.54147338867188, -216.257080078125, -201.97267150878906, -187.68826293945312, -173.40386962890625, -159.1194610595703, -144.83505249023438, -130.5506591796875, -116.26625061035156, -101.98184967041016, -87.69744873046875, -73.41304779052734, -59.12864303588867, -44.84423828125, -30.559837341308594, -16.275436401367188, -1.99102783203125, 12.293373107910156, 26.577774047851562, 40.86217498779297, 55.14657974243164, 69.43098449707031, 83.71538543701172, 97.99978637695312, 112.28419494628906, 126.56859588623047, 140.85299682617188, 155.1374053955078, 169.4217987060547, 183.70620727539062, 197.9906005859375, 212.27500915527344, 226.55941772460938, 240.84381103515625, 255.1282196044922, 269.4126281738281, 283.697021484375, 297.9814453125, 312.2658386230469, 326.55023193359375, 340.83465576171875, 355.1190490722656, 369.4034423828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 14.0, 9.0, 14.0, 24.0, 36.0, 59.0, 126.0, 204.0, 341.0, 733.0, 1486.0, 3127.0, 6994.0, 17783.0, 45166.0, 124096.0, 336255.0, 322463.0, 117349.0, 42986.0, 16589.0, 6740.0, 2994.0, 1405.0, 723.0, 363.0, 216.0, 116.0, 58.0, 30.0, 22.0, 14.0, 8.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.6875, -67.2822265625, -64.876953125, -62.4716796875, -60.06640625, -57.6611328125, -55.255859375, -52.8505859375, -50.4453125, -48.0400390625, -45.634765625, -43.2294921875, -40.82421875, -38.4189453125, -36.013671875, -33.6083984375, -31.203125, -28.7978515625, -26.392578125, -23.9873046875, -21.58203125, -19.1767578125, -16.771484375, -14.3662109375, -11.9609375, -9.5556640625, -7.150390625, -4.7451171875, -2.33984375, 0.0654296875, 2.470703125, 4.8759765625, 7.28125, 9.6865234375, 12.091796875, 14.4970703125, 16.90234375, 19.3076171875, 21.712890625, 24.1181640625, 26.5234375, 28.9287109375, 31.333984375, 33.7392578125, 36.14453125, 38.5498046875, 40.955078125, 43.3603515625, 45.765625, 48.1708984375, 50.576171875, 52.9814453125, 55.38671875, 57.7919921875, 60.197265625, 62.6025390625, 65.0078125, 67.4130859375, 69.818359375, 72.2236328125, 74.62890625, 77.0341796875, 79.439453125, 81.8447265625, 84.25]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 5.0, 14.0, 13.0, 15.0, 11.0, 19.0, 19.0, 18.0, 16.0, 30.0, 32.0, 39.0, 37.0, 45.0, 36.0, 38.0, 44.0, 46.0, 45.0, 53.0, 49.0, 48.0, 47.0, 30.0, 29.0, 35.0, 32.0, 25.0, 19.0, 29.0, 9.0, 16.0, 9.0, 13.0, 4.0, 6.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.6875, -33.60986328125, -32.5322265625, -31.45458984375, -30.376953125, -29.29931640625, -28.2216796875, -27.14404296875, -26.06640625, -24.98876953125, -23.9111328125, -22.83349609375, -21.755859375, -20.67822265625, -19.6005859375, -18.52294921875, -17.4453125, -16.36767578125, -15.2900390625, -14.21240234375, -13.134765625, -12.05712890625, -10.9794921875, -9.90185546875, -8.82421875, -7.74658203125, -6.6689453125, -5.59130859375, -4.513671875, -3.43603515625, -2.3583984375, -1.28076171875, -0.203125, 0.87451171875, 1.9521484375, 3.02978515625, 4.107421875, 5.18505859375, 6.2626953125, 7.34033203125, 8.41796875, 9.49560546875, 10.5732421875, 11.65087890625, 12.728515625, 13.80615234375, 14.8837890625, 15.96142578125, 17.0390625, 18.11669921875, 19.1943359375, 20.27197265625, 21.349609375, 22.42724609375, 23.5048828125, 24.58251953125, 25.66015625, 26.73779296875, 27.8154296875, 28.89306640625, 29.970703125, 31.04833984375, 32.1259765625, 33.20361328125, 34.28125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 12.0, 15.0, 13.0, 21.0, 35.0, 37.0, 73.0, 105.0, 144.0, 196.0, 290.0, 468.0, 665.0, 1183.0, 2424.0, 6100.0, 24295.0, 161664.0, 715766.0, 107112.0, 18050.0, 4939.0, 2028.0, 1011.0, 628.0, 388.0, 294.0, 174.0, 120.0, 82.0, 60.0, 32.0, 42.0, 19.0, 20.0, 8.0, 6.0, 3.0, 9.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-127.25, -122.921875, -118.59375, -114.265625, -109.9375, -105.609375, -101.28125, -96.953125, -92.625, -88.296875, -83.96875, -79.640625, -75.3125, -70.984375, -66.65625, -62.328125, -58.0, -53.671875, -49.34375, -45.015625, -40.6875, -36.359375, -32.03125, -27.703125, -23.375, -19.046875, -14.71875, -10.390625, -6.0625, -1.734375, 2.59375, 6.921875, 11.25, 15.578125, 19.90625, 24.234375, 28.5625, 32.890625, 37.21875, 41.546875, 45.875, 50.203125, 54.53125, 58.859375, 63.1875, 67.515625, 71.84375, 76.171875, 80.5, 84.828125, 89.15625, 93.484375, 97.8125, 102.140625, 106.46875, 110.796875, 115.125, 119.453125, 123.78125, 128.109375, 132.4375, 136.765625, 141.09375, 145.421875, 149.75]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 5.0, 7.0, 12.0, 10.0, 10.0, 19.0, 22.0, 20.0, 23.0, 38.0, 33.0, 42.0, 47.0, 47.0, 44.0, 43.0, 52.0, 68.0, 59.0, 63.0, 50.0, 40.0, 39.0, 37.0, 36.0, 21.0, 22.0, 14.0, 13.0, 10.0, 10.0, 8.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.25, -147.60546875, -142.9609375, -138.31640625, -133.671875, -129.02734375, -124.3828125, -119.73828125, -115.09375, -110.44921875, -105.8046875, -101.16015625, -96.515625, -91.87109375, -87.2265625, -82.58203125, -77.9375, -73.29296875, -68.6484375, -64.00390625, -59.359375, -54.71484375, -50.0703125, -45.42578125, -40.78125, -36.13671875, -31.4921875, -26.84765625, -22.203125, -17.55859375, -12.9140625, -8.26953125, -3.625, 1.01953125, 5.6640625, 10.30859375, 14.953125, 19.59765625, 24.2421875, 28.88671875, 33.53125, 38.17578125, 42.8203125, 47.46484375, 52.109375, 56.75390625, 61.3984375, 66.04296875, 70.6875, 75.33203125, 79.9765625, 84.62109375, 89.265625, 93.91015625, 98.5546875, 103.19921875, 107.84375, 112.48828125, 117.1328125, 121.77734375, 126.421875, 131.06640625, 135.7109375, 140.35546875, 145.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 9.0, 19.0, 25.0, 27.0, 27.0, 59.0, 102.0, 179.0, 351.0, 929.0, 3009.0, 17881.0, 295587.0, 691010.0, 32855.0, 4240.0, 1199.0, 492.0, 205.0, 114.0, 67.0, 37.0, 25.0, 28.0, 14.0, 9.0, 12.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.5615234375, -40.029296875, -38.4970703125, -36.96484375, -35.4326171875, -33.900390625, -32.3681640625, -30.8359375, -29.3037109375, -27.771484375, -26.2392578125, -24.70703125, -23.1748046875, -21.642578125, -20.1103515625, -18.578125, -17.0458984375, -15.513671875, -13.9814453125, -12.44921875, -10.9169921875, -9.384765625, -7.8525390625, -6.3203125, -4.7880859375, -3.255859375, -1.7236328125, -0.19140625, 1.3408203125, 2.873046875, 4.4052734375, 5.9375, 7.4697265625, 9.001953125, 10.5341796875, 12.06640625, 13.5986328125, 15.130859375, 16.6630859375, 18.1953125, 19.7275390625, 21.259765625, 22.7919921875, 24.32421875, 25.8564453125, 27.388671875, 28.9208984375, 30.453125, 31.9853515625, 33.517578125, 35.0498046875, 36.58203125, 38.1142578125, 39.646484375, 41.1787109375, 42.7109375, 44.2431640625, 45.775390625, 47.3076171875, 48.83984375, 50.3720703125, 51.904296875, 53.4365234375, 54.96875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 1.0, 4.0, 5.0, 7.0, 13.0, 15.0, 28.0, 24.0, 39.0, 40.0, 51.0, 54.0, 82.0, 80.0, 88.0, 80.0, 75.0, 65.0, 44.0, 33.0, 35.0, 22.0, 22.0, 21.0, 14.0, 11.0, 12.0, 8.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006832122802734375, -0.006602585315704346, -0.006373047828674316, -0.006143510341644287, -0.005913972854614258, -0.0056844353675842285, -0.005454897880554199, -0.00522536039352417, -0.004995822906494141, -0.004766285419464111, -0.004536747932434082, -0.004307210445404053, -0.0040776729583740234, -0.003848135471343994, -0.003618597984313965, -0.0033890604972839355, -0.0031595230102539062, -0.002929985523223877, -0.0027004480361938477, -0.0024709105491638184, -0.002241373062133789, -0.0020118355751037598, -0.0017822980880737305, -0.0015527606010437012, -0.0013232231140136719, -0.0010936856269836426, -0.0008641481399536133, -0.000634610652923584, -0.0004050731658935547, -0.0001755356788635254, 5.4001808166503906e-05, 0.0002835392951965332, 0.0005130767822265625, 0.0007426142692565918, 0.0009721517562866211, 0.0012016892433166504, 0.0014312267303466797, 0.001660764217376709, 0.0018903017044067383, 0.0021198391914367676, 0.002349376678466797, 0.002578914165496826, 0.0028084516525268555, 0.0030379891395568848, 0.003267526626586914, 0.0034970641136169434, 0.0037266016006469727, 0.003956139087677002, 0.004185676574707031, 0.0044152140617370605, 0.00464475154876709, 0.004874289035797119, 0.0051038265228271484, 0.005333364009857178, 0.005562901496887207, 0.005792438983917236, 0.006021976470947266, 0.006251513957977295, 0.006481051445007324, 0.0067105889320373535, 0.006940126419067383, 0.007169663906097412, 0.007399201393127441, 0.007628738880157471, 0.0078582763671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 26.0, 38.0, 52.0, 87.0, 150.0, 298.0, 531.0, 1023.0, 2398.0, 7236.0, 36491.0, 366737.0, 576405.0, 44002.0, 8025.0, 2616.0, 1072.0, 540.0, 292.0, 178.0, 114.0, 76.0, 50.0, 26.0, 24.0, 11.0, 13.0, 3.0, 6.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.03125, -37.884765625, -36.73828125, -35.591796875, -34.4453125, -33.298828125, -32.15234375, -31.005859375, -29.859375, -28.712890625, -27.56640625, -26.419921875, -25.2734375, -24.126953125, -22.98046875, -21.833984375, -20.6875, -19.541015625, -18.39453125, -17.248046875, -16.1015625, -14.955078125, -13.80859375, -12.662109375, -11.515625, -10.369140625, -9.22265625, -8.076171875, -6.9296875, -5.783203125, -4.63671875, -3.490234375, -2.34375, -1.197265625, -0.05078125, 1.095703125, 2.2421875, 3.388671875, 4.53515625, 5.681640625, 6.828125, 7.974609375, 9.12109375, 10.267578125, 11.4140625, 12.560546875, 13.70703125, 14.853515625, 16.0, 17.146484375, 18.29296875, 19.439453125, 20.5859375, 21.732421875, 22.87890625, 24.025390625, 25.171875, 26.318359375, 27.46484375, 28.611328125, 29.7578125, 30.904296875, 32.05078125, 33.197265625, 34.34375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 8.0, 9.0, 14.0, 12.0, 21.0, 25.0, 37.0, 56.0, 58.0, 72.0, 82.0, 85.0, 88.0, 97.0, 70.0, 59.0, 48.0, 53.0, 26.0, 23.0, 11.0, 12.0, 13.0, 10.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -18.697265625, -17.67578125, -16.654296875, -15.6328125, -14.611328125, -13.58984375, -12.568359375, -11.546875, -10.525390625, -9.50390625, -8.482421875, -7.4609375, -6.439453125, -5.41796875, -4.396484375, -3.375, -2.353515625, -1.33203125, -0.310546875, 0.7109375, 1.732421875, 2.75390625, 3.775390625, 4.796875, 5.818359375, 6.83984375, 7.861328125, 8.8828125, 9.904296875, 10.92578125, 11.947265625, 12.96875, 13.990234375, 15.01171875, 16.033203125, 17.0546875, 18.076171875, 19.09765625, 20.119140625, 21.140625, 22.162109375, 23.18359375, 24.205078125, 25.2265625, 26.248046875, 27.26953125, 28.291015625, 29.3125, 30.333984375, 31.35546875, 32.376953125, 33.3984375, 34.419921875, 35.44140625, 36.462890625, 37.484375, 38.505859375, 39.52734375, 40.548828125, 41.5703125, 42.591796875, 43.61328125, 44.634765625, 45.65625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 7.0, 7.0, 18.0, 40.0, 102.0, 143.0, 250.0, 178.0, 113.0, 62.0, 27.0, 23.0, 9.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1023.83837890625, -996.6572875976562, -969.4762573242188, -942.295166015625, -915.1141357421875, -887.9330444335938, -860.751953125, -833.5709228515625, -806.3898315429688, -779.208740234375, -752.0277099609375, -724.8466186523438, -697.66552734375, -670.4844970703125, -643.3034057617188, -616.122314453125, -588.9412841796875, -561.7601928710938, -534.5791625976562, -507.3980712890625, -480.2170104980469, -453.03594970703125, -425.8548583984375, -398.6737976074219, -371.49273681640625, -344.3116760253906, -317.130615234375, -289.94952392578125, -262.7684631347656, -235.58740234375, -208.4063262939453, -181.22525024414062, -154.044189453125, -126.86312103271484, -99.68205261230469, -72.50098419189453, -45.319915771484375, -18.13885498046875, 9.042221069335938, 36.223297119140625, 63.40435791015625, 90.5854263305664, 117.76649475097656, 144.94757080078125, 172.12863159179688, 199.3096923828125, 226.4907684326172, 253.67184448242188, 280.8529052734375, 308.0339660644531, 335.21502685546875, 362.3961181640625, 389.5771789550781, 416.75823974609375, 443.9393310546875, 471.1203918457031, 498.30145263671875, 525.4825439453125, 552.66357421875, 579.8446655273438, 607.0257568359375, 634.206787109375, 661.3878784179688, 688.5689697265625, 715.75]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 10.0, 9.0, 13.0, 13.0, 18.0, 17.0, 18.0, 17.0, 17.0, 20.0, 28.0, 32.0, 25.0, 27.0, 29.0, 54.0, 58.0, 63.0, 69.0, 71.0, 39.0, 34.0, 32.0, 28.0, 23.0, 25.0, 23.0, 16.0, 16.0, 18.0, 23.0, 11.0, 12.0, 7.0, 15.0, 11.0, 6.0, 4.0, 7.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-435.8338317871094, -420.75042724609375, -405.6670227050781, -390.5836181640625, -375.50018310546875, -360.4167785644531, -345.3333740234375, -330.2499694824219, -315.16656494140625, -300.0831604003906, -284.999755859375, -269.91632080078125, -254.83291625976562, -239.74951171875, -224.66610717773438, -209.58270263671875, -194.499267578125, -179.41586303710938, -164.3324432373047, -149.24903869628906, -134.16561889648438, -119.08221435546875, -103.99880981445312, -88.91539764404297, -73.83198547363281, -58.748573303222656, -43.665164947509766, -28.581756591796875, -13.498344421386719, 1.5850677490234375, 16.668472290039062, 31.75188446044922, 46.8353271484375, 61.918739318847656, 77.00215148925781, 92.08555603027344, 107.1689682006836, 122.25238037109375, 137.33578491210938, 152.419189453125, 167.5026092529297, 182.5860137939453, 197.66943359375, 212.75283813476562, 227.83624267578125, 242.91966247558594, 258.0030517578125, 273.08648681640625, 288.1698913574219, 303.2532958984375, 318.3367004394531, 333.42010498046875, 348.5035400390625, 363.5869445800781, 378.67034912109375, 393.7537536621094, 408.837158203125, 423.9205627441406, 439.00396728515625, 454.08740234375, 469.1708068847656, 484.25421142578125, 499.3376159667969, 514.4210205078125, 529.5044555664062]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 11.0, 8.0, 9.0, 13.0, 15.0, 21.0, 37.0, 73.0, 97.0, 157.0, 255.0, 492.0, 1217.0, 3425.0, 12862.0, 84572.0, 1454561.0, 2457943.0, 152626.0, 18433.0, 4612.0, 1530.0, 571.0, 288.0, 158.0, 105.0, 65.0, 31.0, 26.0, 14.0, 15.0, 8.0, 10.0, 8.0, 6.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46875, -60.6376953125, -58.806640625, -56.9755859375, -55.14453125, -53.3134765625, -51.482421875, -49.6513671875, -47.8203125, -45.9892578125, -44.158203125, -42.3271484375, -40.49609375, -38.6650390625, -36.833984375, -35.0029296875, -33.171875, -31.3408203125, -29.509765625, -27.6787109375, -25.84765625, -24.0166015625, -22.185546875, -20.3544921875, -18.5234375, -16.6923828125, -14.861328125, -13.0302734375, -11.19921875, -9.3681640625, -7.537109375, -5.7060546875, -3.875, -2.0439453125, -0.212890625, 1.6181640625, 3.44921875, 5.2802734375, 7.111328125, 8.9423828125, 10.7734375, 12.6044921875, 14.435546875, 16.2666015625, 18.09765625, 19.9287109375, 21.759765625, 23.5908203125, 25.421875, 27.2529296875, 29.083984375, 30.9150390625, 32.74609375, 34.5771484375, 36.408203125, 38.2392578125, 40.0703125, 41.9013671875, 43.732421875, 45.5634765625, 47.39453125, 49.2255859375, 51.056640625, 52.8876953125, 54.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 9.0, 13.0, 15.0, 14.0, 13.0, 18.0, 16.0, 21.0, 24.0, 27.0, 19.0, 44.0, 54.0, 43.0, 48.0, 38.0, 43.0, 46.0, 45.0, 53.0, 43.0, 40.0, 35.0, 34.0, 41.0, 25.0, 22.0, 16.0, 24.0, 19.0, 28.0, 7.0, 11.0, 13.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.0, -26.05078125, -25.1015625, -24.15234375, -23.203125, -22.25390625, -21.3046875, -20.35546875, -19.40625, -18.45703125, -17.5078125, -16.55859375, -15.609375, -14.66015625, -13.7109375, -12.76171875, -11.8125, -10.86328125, -9.9140625, -8.96484375, -8.015625, -7.06640625, -6.1171875, -5.16796875, -4.21875, -3.26953125, -2.3203125, -1.37109375, -0.421875, 0.52734375, 1.4765625, 2.42578125, 3.375, 4.32421875, 5.2734375, 6.22265625, 7.171875, 8.12109375, 9.0703125, 10.01953125, 10.96875, 11.91796875, 12.8671875, 13.81640625, 14.765625, 15.71484375, 16.6640625, 17.61328125, 18.5625, 19.51171875, 20.4609375, 21.41015625, 22.359375, 23.30859375, 24.2578125, 25.20703125, 26.15625, 27.10546875, 28.0546875, 29.00390625, 29.953125, 30.90234375, 31.8515625, 32.80078125, 33.75]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 11.0, 23.0, 24.0, 53.0, 91.0, 189.0, 477.0, 1571.0, 9157.0, 153733.0, 3925292.0, 93276.0, 7632.0, 1660.0, 580.0, 243.0, 117.0, 56.0, 37.0, 22.0, 20.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-143.375, -139.328125, -135.28125, -131.234375, -127.1875, -123.140625, -119.09375, -115.046875, -111.0, -106.953125, -102.90625, -98.859375, -94.8125, -90.765625, -86.71875, -82.671875, -78.625, -74.578125, -70.53125, -66.484375, -62.4375, -58.390625, -54.34375, -50.296875, -46.25, -42.203125, -38.15625, -34.109375, -30.0625, -26.015625, -21.96875, -17.921875, -13.875, -9.828125, -5.78125, -1.734375, 2.3125, 6.359375, 10.40625, 14.453125, 18.5, 22.546875, 26.59375, 30.640625, 34.6875, 38.734375, 42.78125, 46.828125, 50.875, 54.921875, 58.96875, 63.015625, 67.0625, 71.109375, 75.15625, 79.203125, 83.25, 87.296875, 91.34375, 95.390625, 99.4375, 103.484375, 107.53125, 111.578125, 115.625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 6.0, 10.0, 20.0, 21.0, 45.0, 65.0, 112.0, 242.0, 506.0, 901.0, 941.0, 581.0, 282.0, 117.0, 58.0, 57.0, 36.0, 16.0, 9.0, 16.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.0625, -87.1591796875, -84.255859375, -81.3525390625, -78.44921875, -75.5458984375, -72.642578125, -69.7392578125, -66.8359375, -63.9326171875, -61.029296875, -58.1259765625, -55.22265625, -52.3193359375, -49.416015625, -46.5126953125, -43.609375, -40.7060546875, -37.802734375, -34.8994140625, -31.99609375, -29.0927734375, -26.189453125, -23.2861328125, -20.3828125, -17.4794921875, -14.576171875, -11.6728515625, -8.76953125, -5.8662109375, -2.962890625, -0.0595703125, 2.84375, 5.7470703125, 8.650390625, 11.5537109375, 14.45703125, 17.3603515625, 20.263671875, 23.1669921875, 26.0703125, 28.9736328125, 31.876953125, 34.7802734375, 37.68359375, 40.5869140625, 43.490234375, 46.3935546875, 49.296875, 52.2001953125, 55.103515625, 58.0068359375, 60.91015625, 63.8134765625, 66.716796875, 69.6201171875, 72.5234375, 75.4267578125, 78.330078125, 81.2333984375, 84.13671875, 87.0400390625, 89.943359375, 92.8466796875, 95.75]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 17.0, 28.0, 87.0, 182.0, 293.0, 222.0, 93.0, 31.0, 14.0, 8.0, 10.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-614.099609375, -585.4658203125, -556.8320922851562, -528.1983032226562, -499.56451416015625, -470.9307556152344, -442.2969970703125, -413.6632080078125, -385.0294494628906, -356.39569091796875, -327.76190185546875, -299.1281433105469, -270.494384765625, -241.860595703125, -213.22683715820312, -184.5930633544922, -155.95928955078125, -127.32551574707031, -98.6917495727539, -70.0579833984375, -41.42420959472656, -12.790435791015625, 15.84332275390625, 44.47709655761719, 73.11087036132812, 101.74464416503906, 130.37841796875, 159.01217651367188, 187.6459503173828, 216.27972412109375, 244.91348266601562, 273.5472412109375, 302.1810302734375, 330.8147888183594, 359.4485778808594, 388.08233642578125, 416.71612548828125, 445.3498840332031, 473.983642578125, 502.617431640625, 531.251220703125, 559.885009765625, 588.5187377929688, 617.1525268554688, 645.7863159179688, 674.4200439453125, 703.0538330078125, 731.6876220703125, 760.3213500976562, 788.9551391601562, 817.5888671875, 846.22265625, 874.8564453125, 903.490234375, 932.1239624023438, 960.7577514648438, 989.3914794921875, 1018.0252685546875, 1046.6590576171875, 1075.292724609375, 1103.926513671875, 1132.560302734375, 1161.194091796875, 1189.827880859375, 1218.461669921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 9.0, 10.0, 15.0, 23.0, 22.0, 29.0, 46.0, 42.0, 64.0, 61.0, 75.0, 81.0, 75.0, 55.0, 68.0, 63.0, 55.0, 38.0, 51.0, 26.0, 21.0, 26.0, 16.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-503.86358642578125, -488.7021484375, -473.54071044921875, -458.3792724609375, -443.21783447265625, -428.056396484375, -412.89495849609375, -397.7334899902344, -382.5720520019531, -367.4106140136719, -352.2491760253906, -337.0877380371094, -321.9263000488281, -306.76483154296875, -291.6033935546875, -276.44195556640625, -261.280517578125, -246.11907958984375, -230.9576416015625, -215.79620361328125, -200.63475036621094, -185.4733123779297, -170.31187438964844, -155.15042114257812, -139.989013671875, -124.82757568359375, -109.66613006591797, -94.50469207763672, -79.34324645996094, -64.18180847167969, -49.02037048339844, -33.858924865722656, -18.697479248046875, -3.536038398742676, 11.625402450561523, 26.786842346191406, 41.94828414916992, 57.10972595214844, 72.27116394042969, 87.43260955810547, 102.59404754638672, 117.75548553466797, 132.91693115234375, 148.078369140625, 163.23980712890625, 178.4012451171875, 193.56268310546875, 208.72413635253906, 223.8855743408203, 239.04701232910156, 254.2084503173828, 269.3699035644531, 284.5313415527344, 299.6927795410156, 314.8542175292969, 330.0156555175781, 345.1770935058594, 360.3385314941406, 375.4999694824219, 390.6614074707031, 405.8228454589844, 420.98431396484375, 436.145751953125, 451.30718994140625, 466.4686279296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 4.0, 1.0, 11.0, 17.0, 28.0, 51.0, 81.0, 133.0, 212.0, 358.0, 569.0, 961.0, 1622.0, 2962.0, 5450.0, 10448.0, 19924.0, 40315.0, 82503.0, 161201.0, 248435.0, 221466.0, 125345.0, 62682.0, 30474.0, 15320.0, 7925.0, 4211.0, 2436.0, 1427.0, 727.0, 492.0, 272.0, 189.0, 110.0, 71.0, 42.0, 31.0, 14.0, 16.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -36.90625, -35.625, -34.34375, -33.0625, -31.78125, -30.5, -29.21875, -27.9375, -26.65625, -25.375, -24.09375, -22.8125, -21.53125, -20.25, -18.96875, -17.6875, -16.40625, -15.125, -13.84375, -12.5625, -11.28125, -10.0, -8.71875, -7.4375, -6.15625, -4.875, -3.59375, -2.3125, -1.03125, 0.25, 1.53125, 2.8125, 4.09375, 5.375, 6.65625, 7.9375, 9.21875, 10.5, 11.78125, 13.0625, 14.34375, 15.625, 16.90625, 18.1875, 19.46875, 20.75, 22.03125, 23.3125, 24.59375, 25.875, 27.15625, 28.4375, 29.71875, 31.0, 32.28125, 33.5625, 34.84375, 36.125, 37.40625, 38.6875, 39.96875, 41.25, 42.53125, 43.8125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 7.0, 8.0, 6.0, 1.0, 11.0, 11.0, 16.0, 20.0, 19.0, 12.0, 26.0, 26.0, 28.0, 40.0, 30.0, 38.0, 36.0, 49.0, 38.0, 44.0, 46.0, 49.0, 39.0, 52.0, 34.0, 44.0, 35.0, 35.0, 37.0, 20.0, 18.0, 22.0, 24.0, 15.0, 23.0, 6.0, 8.0, 4.0, 8.0, 3.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.0, -26.0556640625, -25.111328125, -24.1669921875, -23.22265625, -22.2783203125, -21.333984375, -20.3896484375, -19.4453125, -18.5009765625, -17.556640625, -16.6123046875, -15.66796875, -14.7236328125, -13.779296875, -12.8349609375, -11.890625, -10.9462890625, -10.001953125, -9.0576171875, -8.11328125, -7.1689453125, -6.224609375, -5.2802734375, -4.3359375, -3.3916015625, -2.447265625, -1.5029296875, -0.55859375, 0.3857421875, 1.330078125, 2.2744140625, 3.21875, 4.1630859375, 5.107421875, 6.0517578125, 6.99609375, 7.9404296875, 8.884765625, 9.8291015625, 10.7734375, 11.7177734375, 12.662109375, 13.6064453125, 14.55078125, 15.4951171875, 16.439453125, 17.3837890625, 18.328125, 19.2724609375, 20.216796875, 21.1611328125, 22.10546875, 23.0498046875, 23.994140625, 24.9384765625, 25.8828125, 26.8271484375, 27.771484375, 28.7158203125, 29.66015625, 30.6044921875, 31.548828125, 32.4931640625, 33.4375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 18.0, 20.0, 21.0, 40.0, 49.0, 62.0, 88.0, 110.0, 161.0, 258.0, 450.0, 965.0, 2351.0, 7271.0, 27072.0, 119814.0, 577664.0, 238709.0, 53259.0, 13045.0, 3931.0, 1458.0, 668.0, 343.0, 188.0, 148.0, 97.0, 72.0, 42.0, 48.0, 30.0, 16.0, 10.0, 10.0, 12.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.25, -66.7529296875, -64.255859375, -61.7587890625, -59.26171875, -56.7646484375, -54.267578125, -51.7705078125, -49.2734375, -46.7763671875, -44.279296875, -41.7822265625, -39.28515625, -36.7880859375, -34.291015625, -31.7939453125, -29.296875, -26.7998046875, -24.302734375, -21.8056640625, -19.30859375, -16.8115234375, -14.314453125, -11.8173828125, -9.3203125, -6.8232421875, -4.326171875, -1.8291015625, 0.66796875, 3.1650390625, 5.662109375, 8.1591796875, 10.65625, 13.1533203125, 15.650390625, 18.1474609375, 20.64453125, 23.1416015625, 25.638671875, 28.1357421875, 30.6328125, 33.1298828125, 35.626953125, 38.1240234375, 40.62109375, 43.1181640625, 45.615234375, 48.1123046875, 50.609375, 53.1064453125, 55.603515625, 58.1005859375, 60.59765625, 63.0947265625, 65.591796875, 68.0888671875, 70.5859375, 73.0830078125, 75.580078125, 78.0771484375, 80.57421875, 83.0712890625, 85.568359375, 88.0654296875, 90.5625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 12.0, 13.0, 8.0, 17.0, 14.0, 16.0, 20.0, 21.0, 40.0, 40.0, 57.0, 61.0, 41.0, 51.0, 53.0, 43.0, 47.0, 56.0, 58.0, 45.0, 54.0, 42.0, 20.0, 32.0, 25.0, 20.0, 11.0, 15.0, 16.0, 18.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-130.0, -126.23046875, -122.4609375, -118.69140625, -114.921875, -111.15234375, -107.3828125, -103.61328125, -99.84375, -96.07421875, -92.3046875, -88.53515625, -84.765625, -80.99609375, -77.2265625, -73.45703125, -69.6875, -65.91796875, -62.1484375, -58.37890625, -54.609375, -50.83984375, -47.0703125, -43.30078125, -39.53125, -35.76171875, -31.9921875, -28.22265625, -24.453125, -20.68359375, -16.9140625, -13.14453125, -9.375, -5.60546875, -1.8359375, 1.93359375, 5.703125, 9.47265625, 13.2421875, 17.01171875, 20.78125, 24.55078125, 28.3203125, 32.08984375, 35.859375, 39.62890625, 43.3984375, 47.16796875, 50.9375, 54.70703125, 58.4765625, 62.24609375, 66.015625, 69.78515625, 73.5546875, 77.32421875, 81.09375, 84.86328125, 88.6328125, 92.40234375, 96.171875, 99.94140625, 103.7109375, 107.48046875, 111.25]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 12.0, 18.0, 22.0, 27.0, 39.0, 66.0, 103.0, 125.0, 271.0, 400.0, 822.0, 1756.0, 4029.0, 10401.0, 30396.0, 97004.0, 418798.0, 339864.0, 96333.0, 29896.0, 10515.0, 4005.0, 1722.0, 803.0, 421.0, 241.0, 137.0, 79.0, 67.0, 44.0, 32.0, 22.0, 12.0, 10.0, 11.0, 14.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.609375, -17.07568359375, -16.5419921875, -16.00830078125, -15.474609375, -14.94091796875, -14.4072265625, -13.87353515625, -13.33984375, -12.80615234375, -12.2724609375, -11.73876953125, -11.205078125, -10.67138671875, -10.1376953125, -9.60400390625, -9.0703125, -8.53662109375, -8.0029296875, -7.46923828125, -6.935546875, -6.40185546875, -5.8681640625, -5.33447265625, -4.80078125, -4.26708984375, -3.7333984375, -3.19970703125, -2.666015625, -2.13232421875, -1.5986328125, -1.06494140625, -0.53125, 0.00244140625, 0.5361328125, 1.06982421875, 1.603515625, 2.13720703125, 2.6708984375, 3.20458984375, 3.73828125, 4.27197265625, 4.8056640625, 5.33935546875, 5.873046875, 6.40673828125, 6.9404296875, 7.47412109375, 8.0078125, 8.54150390625, 9.0751953125, 9.60888671875, 10.142578125, 10.67626953125, 11.2099609375, 11.74365234375, 12.27734375, 12.81103515625, 13.3447265625, 13.87841796875, 14.412109375, 14.94580078125, 15.4794921875, 16.01318359375, 16.546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 6.0, 7.0, 5.0, 11.0, 14.0, 21.0, 25.0, 40.0, 46.0, 55.0, 69.0, 80.0, 93.0, 77.0, 80.0, 68.0, 67.0, 54.0, 36.0, 27.0, 25.0, 20.0, 16.0, 8.0, 6.0, 7.0, 10.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006084442138671875, -0.005868673324584961, -0.005652904510498047, -0.005437135696411133, -0.005221366882324219, -0.005005598068237305, -0.004789829254150391, -0.0045740604400634766, -0.0043582916259765625, -0.0041425228118896484, -0.003926753997802734, -0.0037109851837158203, -0.0034952163696289062, -0.003279447555541992, -0.003063678741455078, -0.002847909927368164, -0.00263214111328125, -0.002416372299194336, -0.002200603485107422, -0.001984834671020508, -0.0017690658569335938, -0.0015532970428466797, -0.0013375282287597656, -0.0011217594146728516, -0.0009059906005859375, -0.0006902217864990234, -0.0004744529724121094, -0.0002586841583251953, -4.291534423828125e-05, 0.0001728534698486328, 0.0003886222839355469, 0.0006043910980224609, 0.000820159912109375, 0.001035928726196289, 0.0012516975402832031, 0.0014674663543701172, 0.0016832351684570312, 0.0018990039825439453, 0.0021147727966308594, 0.0023305416107177734, 0.0025463104248046875, 0.0027620792388916016, 0.0029778480529785156, 0.0031936168670654297, 0.0034093856811523438, 0.003625154495239258, 0.003840923309326172, 0.004056692123413086, 0.0042724609375, 0.004488229751586914, 0.004703998565673828, 0.004919767379760742, 0.005135536193847656, 0.00535130500793457, 0.005567073822021484, 0.0057828426361083984, 0.0059986114501953125, 0.0062143802642822266, 0.006430149078369141, 0.006645917892456055, 0.006861686706542969, 0.007077455520629883, 0.007293224334716797, 0.007508993148803711, 0.007724761962890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 10.0, 10.0, 17.0, 21.0, 30.0, 46.0, 72.0, 82.0, 155.0, 234.0, 481.0, 913.0, 2133.0, 5888.0, 20097.0, 92156.0, 557163.0, 286809.0, 60209.0, 14234.0, 4281.0, 1727.0, 792.0, 407.0, 228.0, 110.0, 87.0, 54.0, 29.0, 28.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.375, -23.610107421875, -22.84521484375, -22.080322265625, -21.3154296875, -20.550537109375, -19.78564453125, -19.020751953125, -18.255859375, -17.490966796875, -16.72607421875, -15.961181640625, -15.1962890625, -14.431396484375, -13.66650390625, -12.901611328125, -12.13671875, -11.371826171875, -10.60693359375, -9.842041015625, -9.0771484375, -8.312255859375, -7.54736328125, -6.782470703125, -6.017578125, -5.252685546875, -4.48779296875, -3.722900390625, -2.9580078125, -2.193115234375, -1.42822265625, -0.663330078125, 0.1015625, 0.866455078125, 1.63134765625, 2.396240234375, 3.1611328125, 3.926025390625, 4.69091796875, 5.455810546875, 6.220703125, 6.985595703125, 7.75048828125, 8.515380859375, 9.2802734375, 10.045166015625, 10.81005859375, 11.574951171875, 12.33984375, 13.104736328125, 13.86962890625, 14.634521484375, 15.3994140625, 16.164306640625, 16.92919921875, 17.694091796875, 18.458984375, 19.223876953125, 19.98876953125, 20.753662109375, 21.5185546875, 22.283447265625, 23.04833984375, 23.813232421875, 24.578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 12.0, 12.0, 26.0, 28.0, 27.0, 40.0, 60.0, 49.0, 54.0, 87.0, 86.0, 89.0, 90.0, 70.0, 57.0, 47.0, 30.0, 31.0, 32.0, 21.0, 8.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.90625, -26.087890625, -25.26953125, -24.451171875, -23.6328125, -22.814453125, -21.99609375, -21.177734375, -20.359375, -19.541015625, -18.72265625, -17.904296875, -17.0859375, -16.267578125, -15.44921875, -14.630859375, -13.8125, -12.994140625, -12.17578125, -11.357421875, -10.5390625, -9.720703125, -8.90234375, -8.083984375, -7.265625, -6.447265625, -5.62890625, -4.810546875, -3.9921875, -3.173828125, -2.35546875, -1.537109375, -0.71875, 0.099609375, 0.91796875, 1.736328125, 2.5546875, 3.373046875, 4.19140625, 5.009765625, 5.828125, 6.646484375, 7.46484375, 8.283203125, 9.1015625, 9.919921875, 10.73828125, 11.556640625, 12.375, 13.193359375, 14.01171875, 14.830078125, 15.6484375, 16.466796875, 17.28515625, 18.103515625, 18.921875, 19.740234375, 20.55859375, 21.376953125, 22.1953125, 23.013671875, 23.83203125, 24.650390625, 25.46875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 8.0, 33.0, 93.0, 192.0, 367.0, 173.0, 76.0, 23.0, 13.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1051.0025634765625, -1020.4654541015625, -989.9284057617188, -959.3912963867188, -928.8541870117188, -898.317138671875, -867.780029296875, -837.242919921875, -806.705810546875, -776.168701171875, -745.6316528320312, -715.0945434570312, -684.5574340820312, -654.0203857421875, -623.4832763671875, -592.9461669921875, -562.4091186523438, -531.8720092773438, -501.3349304199219, -470.7978515625, -440.2607421875, -409.7236633300781, -379.18658447265625, -348.64947509765625, -318.1123962402344, -287.5753173828125, -257.0382080078125, -226.50112915039062, -195.9640350341797, -165.42694091796875, -134.88986206054688, -104.35276794433594, -73.815673828125, -43.27858352661133, -12.741493225097656, 17.79559326171875, 48.33268737792969, 78.86978149414062, 109.4068603515625, 139.94395446777344, 170.48104858398438, 201.0181427001953, 231.55523681640625, 262.0923156738281, 292.62939453125, 323.16650390625, 353.7035827636719, 384.24066162109375, 414.77777099609375, 445.3148498535156, 475.8519592285156, 506.3890380859375, 536.9261474609375, 567.4632568359375, 598.0003051757812, 628.5374145507812, 659.074462890625, 689.611572265625, 720.1486206054688, 750.6857299804688, 781.2228393554688, 811.7598876953125, 842.2969970703125, 872.8341064453125, 903.3712158203125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 6.0, 6.0, 6.0, 12.0, 9.0, 11.0, 14.0, 21.0, 24.0, 22.0, 37.0, 30.0, 29.0, 41.0, 44.0, 75.0, 96.0, 82.0, 69.0, 45.0, 49.0, 40.0, 31.0, 29.0, 32.0, 30.0, 18.0, 12.0, 23.0, 8.0, 9.0, 10.0, 12.0, 4.0, 4.0, 5.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-385.2171936035156, -370.248779296875, -355.2803649902344, -340.31195068359375, -325.343505859375, -310.3751220703125, -295.40667724609375, -280.4382629394531, -265.4698486328125, -250.50143432617188, -235.53302001953125, -220.56459045410156, -205.59617614746094, -190.6277618408203, -175.65933227539062, -160.69091796875, -145.72250366210938, -130.75408935546875, -115.7856674194336, -100.81724548339844, -85.84883117675781, -70.88041687011719, -55.91199493408203, -40.943572998046875, -25.97515869140625, -11.00674057006836, 3.9616775512695312, 18.930095672607422, 33.89851379394531, 48.86692810058594, 63.835350036621094, 78.80377197265625, 93.772216796875, 108.74063110351562, 123.70905303955078, 138.67747497558594, 153.64588928222656, 168.6143035888672, 183.58273315429688, 198.5511474609375, 213.51956176757812, 228.48797607421875, 243.45639038085938, 258.4248046875, 273.39324951171875, 288.36163330078125, 303.330078125, 318.2984924316406, 333.26690673828125, 348.2353210449219, 363.2037353515625, 378.1721496582031, 393.14056396484375, 408.1090087890625, 423.0774230957031, 438.04583740234375, 453.0142517089844, 467.982666015625, 482.9510803222656, 497.91949462890625, 512.887939453125, 527.8563232421875, 542.8247680664062, 557.793212890625, 572.7615966796875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 7.0, 12.0, 13.0, 21.0, 20.0, 44.0, 62.0, 94.0, 115.0, 201.0, 325.0, 566.0, 1011.0, 1893.0, 4480.0, 11677.0, 41517.0, 246043.0, 1612746.0, 1894500.0, 304687.0, 51154.0, 13424.0, 4863.0, 2183.0, 1091.0, 596.0, 347.0, 181.0, 128.0, 88.0, 55.0, 38.0, 23.0, 17.0, 13.0, 10.0, 10.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.46875, -34.32666015625, -33.1845703125, -32.04248046875, -30.900390625, -29.75830078125, -28.6162109375, -27.47412109375, -26.33203125, -25.18994140625, -24.0478515625, -22.90576171875, -21.763671875, -20.62158203125, -19.4794921875, -18.33740234375, -17.1953125, -16.05322265625, -14.9111328125, -13.76904296875, -12.626953125, -11.48486328125, -10.3427734375, -9.20068359375, -8.05859375, -6.91650390625, -5.7744140625, -4.63232421875, -3.490234375, -2.34814453125, -1.2060546875, -0.06396484375, 1.078125, 2.22021484375, 3.3623046875, 4.50439453125, 5.646484375, 6.78857421875, 7.9306640625, 9.07275390625, 10.21484375, 11.35693359375, 12.4990234375, 13.64111328125, 14.783203125, 15.92529296875, 17.0673828125, 18.20947265625, 19.3515625, 20.49365234375, 21.6357421875, 22.77783203125, 23.919921875, 25.06201171875, 26.2041015625, 27.34619140625, 28.48828125, 29.63037109375, 30.7724609375, 31.91455078125, 33.056640625, 34.19873046875, 35.3408203125, 36.48291015625, 37.625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 13.0, 13.0, 13.0, 16.0, 21.0, 18.0, 24.0, 30.0, 39.0, 31.0, 36.0, 36.0, 32.0, 39.0, 36.0, 56.0, 46.0, 40.0, 39.0, 34.0, 37.0, 29.0, 29.0, 37.0, 37.0, 30.0, 26.0, 22.0, 19.0, 19.0, 18.0, 14.0, 6.0, 8.0, 7.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-29.125, -28.280517578125, -27.43603515625, -26.591552734375, -25.7470703125, -24.902587890625, -24.05810546875, -23.213623046875, -22.369140625, -21.524658203125, -20.68017578125, -19.835693359375, -18.9912109375, -18.146728515625, -17.30224609375, -16.457763671875, -15.61328125, -14.768798828125, -13.92431640625, -13.079833984375, -12.2353515625, -11.390869140625, -10.54638671875, -9.701904296875, -8.857421875, -8.012939453125, -7.16845703125, -6.323974609375, -5.4794921875, -4.635009765625, -3.79052734375, -2.946044921875, -2.1015625, -1.257080078125, -0.41259765625, 0.431884765625, 1.2763671875, 2.120849609375, 2.96533203125, 3.809814453125, 4.654296875, 5.498779296875, 6.34326171875, 7.187744140625, 8.0322265625, 8.876708984375, 9.72119140625, 10.565673828125, 11.41015625, 12.254638671875, 13.09912109375, 13.943603515625, 14.7880859375, 15.632568359375, 16.47705078125, 17.321533203125, 18.166015625, 19.010498046875, 19.85498046875, 20.699462890625, 21.5439453125, 22.388427734375, 23.23291015625, 24.077392578125, 24.921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 6.0, 15.0, 4.0, 14.0, 34.0, 54.0, 114.0, 223.0, 686.0, 2782.0, 18936.0, 1000528.0, 3133028.0, 32324.0, 4065.0, 884.0, 288.0, 116.0, 65.0, 33.0, 16.0, 13.0, 7.0, 7.0, 5.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-125.1875, -121.5166015625, -117.845703125, -114.1748046875, -110.50390625, -106.8330078125, -103.162109375, -99.4912109375, -95.8203125, -92.1494140625, -88.478515625, -84.8076171875, -81.13671875, -77.4658203125, -73.794921875, -70.1240234375, -66.453125, -62.7822265625, -59.111328125, -55.4404296875, -51.76953125, -48.0986328125, -44.427734375, -40.7568359375, -37.0859375, -33.4150390625, -29.744140625, -26.0732421875, -22.40234375, -18.7314453125, -15.060546875, -11.3896484375, -7.71875, -4.0478515625, -0.376953125, 3.2939453125, 6.96484375, 10.6357421875, 14.306640625, 17.9775390625, 21.6484375, 25.3193359375, 28.990234375, 32.6611328125, 36.33203125, 40.0029296875, 43.673828125, 47.3447265625, 51.015625, 54.6865234375, 58.357421875, 62.0283203125, 65.69921875, 69.3701171875, 73.041015625, 76.7119140625, 80.3828125, 84.0537109375, 87.724609375, 91.3955078125, 95.06640625, 98.7373046875, 102.408203125, 106.0791015625, 109.75]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 7.0, 12.0, 10.0, 15.0, 32.0, 31.0, 49.0, 86.0, 125.0, 222.0, 439.0, 726.0, 867.0, 568.0, 344.0, 173.0, 108.0, 89.0, 56.0, 30.0, 21.0, 12.0, 11.0, 5.0, 10.0, 3.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.0625, -73.90771484375, -71.7529296875, -69.59814453125, -67.443359375, -65.28857421875, -63.1337890625, -60.97900390625, -58.82421875, -56.66943359375, -54.5146484375, -52.35986328125, -50.205078125, -48.05029296875, -45.8955078125, -43.74072265625, -41.5859375, -39.43115234375, -37.2763671875, -35.12158203125, -32.966796875, -30.81201171875, -28.6572265625, -26.50244140625, -24.34765625, -22.19287109375, -20.0380859375, -17.88330078125, -15.728515625, -13.57373046875, -11.4189453125, -9.26416015625, -7.109375, -4.95458984375, -2.7998046875, -0.64501953125, 1.509765625, 3.66455078125, 5.8193359375, 7.97412109375, 10.12890625, 12.28369140625, 14.4384765625, 16.59326171875, 18.748046875, 20.90283203125, 23.0576171875, 25.21240234375, 27.3671875, 29.52197265625, 31.6767578125, 33.83154296875, 35.986328125, 38.14111328125, 40.2958984375, 42.45068359375, 44.60546875, 46.76025390625, 48.9150390625, 51.06982421875, 53.224609375, 55.37939453125, 57.5341796875, 59.68896484375, 61.84375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 2.0, 6.0, 13.0, 14.0, 38.0, 61.0, 103.0, 153.0, 166.0, 161.0, 107.0, 62.0, 33.0, 33.0, 18.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-315.57257080078125, -301.3780517578125, -287.18353271484375, -272.989013671875, -258.79449462890625, -244.5999755859375, -230.40545654296875, -216.2109375, -202.01641845703125, -187.8218994140625, -173.62738037109375, -159.432861328125, -145.23834228515625, -131.0438232421875, -116.84931182861328, -102.65479278564453, -88.46028137207031, -74.26576232910156, -60.07124328613281, -45.87672805786133, -31.682209014892578, -17.487693786621094, -3.2931747436523438, 10.901344299316406, 25.095863342285156, 39.290382385253906, 53.484901428222656, 67.67941284179688, 81.87393188476562, 96.06845092773438, 110.26296997070312, 124.45748901367188, 138.65200805664062, 152.84652709960938, 167.04104614257812, 181.23556518554688, 195.43008422851562, 209.62460327148438, 223.81912231445312, 238.01364135742188, 252.20816040039062, 266.4026794433594, 280.5971984863281, 294.7917175292969, 308.9862365722656, 323.1807556152344, 337.3752746582031, 351.5697937011719, 365.7642822265625, 379.95880126953125, 394.1533203125, 408.34783935546875, 422.5423583984375, 436.73687744140625, 450.931396484375, 465.12591552734375, 479.3204345703125, 493.51495361328125, 507.70947265625, 521.9039916992188, 536.0985107421875, 550.2930297851562, 564.487548828125, 578.6820678710938, 592.8765869140625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 12.0, 8.0, 19.0, 20.0, 17.0, 15.0, 25.0, 29.0, 36.0, 34.0, 34.0, 49.0, 48.0, 35.0, 36.0, 54.0, 44.0, 40.0, 52.0, 44.0, 43.0, 38.0, 35.0, 37.0, 30.0, 20.0, 17.0, 21.0, 15.0, 16.0, 5.0, 7.0, 14.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 0.0, 5.0, 0.0, 1.0], "bins": [-270.1198425292969, -262.09344482421875, -254.0670166015625, -246.04061889648438, -238.0142059326172, -229.98779296875, -221.96139526367188, -213.9349822998047, -205.9085693359375, -197.8821563720703, -189.85574340820312, -181.829345703125, -173.8029327392578, -165.77651977539062, -157.7501220703125, -149.7237091064453, -141.69729614257812, -133.67088317871094, -125.64447784423828, -117.61807250976562, -109.59165954589844, -101.56524658203125, -93.5388412475586, -85.51243591308594, -77.48602294921875, -69.45960998535156, -61.433204650878906, -53.406795501708984, -45.38038635253906, -37.35397720336914, -29.32756805419922, -21.301158905029297, -13.274765014648438, -5.248355865478516, 2.7780532836914062, 10.804462432861328, 18.83087158203125, 26.857280731201172, 34.883689880371094, 42.910099029541016, 50.93650817871094, 58.96291732788086, 66.98932647705078, 75.01573181152344, 83.04214477539062, 91.06855773925781, 99.09496307373047, 107.12136840820312, 115.14778137207031, 123.1741943359375, 131.20059204101562, 139.2270050048828, 147.25341796875, 155.2798309326172, 163.30624389648438, 171.3326416015625, 179.3590545654297, 187.38546752929688, 195.411865234375, 203.4382781982422, 211.46469116210938, 219.49110412597656, 227.51751708984375, 235.54391479492188, 243.57032775878906]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 18.0, 9.0, 17.0, 22.0, 44.0, 64.0, 73.0, 125.0, 175.0, 300.0, 493.0, 793.0, 1390.0, 2346.0, 4004.0, 7496.0, 13546.0, 24998.0, 47046.0, 90583.0, 167179.0, 245365.0, 200039.0, 113741.0, 59354.0, 31225.0, 16839.0, 9039.0, 5128.0, 2885.0, 1595.0, 1023.0, 575.0, 356.0, 219.0, 160.0, 93.0, 55.0, 47.0, 21.0, 27.0, 13.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.40625, -34.32275390625, -33.2392578125, -32.15576171875, -31.072265625, -29.98876953125, -28.9052734375, -27.82177734375, -26.73828125, -25.65478515625, -24.5712890625, -23.48779296875, -22.404296875, -21.32080078125, -20.2373046875, -19.15380859375, -18.0703125, -16.98681640625, -15.9033203125, -14.81982421875, -13.736328125, -12.65283203125, -11.5693359375, -10.48583984375, -9.40234375, -8.31884765625, -7.2353515625, -6.15185546875, -5.068359375, -3.98486328125, -2.9013671875, -1.81787109375, -0.734375, 0.34912109375, 1.4326171875, 2.51611328125, 3.599609375, 4.68310546875, 5.7666015625, 6.85009765625, 7.93359375, 9.01708984375, 10.1005859375, 11.18408203125, 12.267578125, 13.35107421875, 14.4345703125, 15.51806640625, 16.6015625, 17.68505859375, 18.7685546875, 19.85205078125, 20.935546875, 22.01904296875, 23.1025390625, 24.18603515625, 25.26953125, 26.35302734375, 27.4365234375, 28.52001953125, 29.603515625, 30.68701171875, 31.7705078125, 32.85400390625, 33.9375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 6.0, 4.0, 2.0, 2.0, 9.0, 15.0, 14.0, 15.0, 17.0, 21.0, 30.0, 27.0, 30.0, 37.0, 40.0, 38.0, 36.0, 53.0, 52.0, 51.0, 41.0, 30.0, 38.0, 30.0, 36.0, 37.0, 41.0, 32.0, 25.0, 35.0, 23.0, 20.0, 18.0, 9.0, 17.0, 15.0, 12.0, 7.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-29.3125, -28.408203125, -27.50390625, -26.599609375, -25.6953125, -24.791015625, -23.88671875, -22.982421875, -22.078125, -21.173828125, -20.26953125, -19.365234375, -18.4609375, -17.556640625, -16.65234375, -15.748046875, -14.84375, -13.939453125, -13.03515625, -12.130859375, -11.2265625, -10.322265625, -9.41796875, -8.513671875, -7.609375, -6.705078125, -5.80078125, -4.896484375, -3.9921875, -3.087890625, -2.18359375, -1.279296875, -0.375, 0.529296875, 1.43359375, 2.337890625, 3.2421875, 4.146484375, 5.05078125, 5.955078125, 6.859375, 7.763671875, 8.66796875, 9.572265625, 10.4765625, 11.380859375, 12.28515625, 13.189453125, 14.09375, 14.998046875, 15.90234375, 16.806640625, 17.7109375, 18.615234375, 19.51953125, 20.423828125, 21.328125, 22.232421875, 23.13671875, 24.041015625, 24.9453125, 25.849609375, 26.75390625, 27.658203125, 28.5625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 8.0, 20.0, 19.0, 26.0, 27.0, 45.0, 66.0, 88.0, 117.0, 181.0, 317.0, 535.0, 955.0, 2111.0, 6353.0, 26294.0, 156161.0, 695460.0, 127743.0, 22383.0, 5574.0, 1856.0, 849.0, 474.0, 290.0, 181.0, 129.0, 79.0, 58.0, 29.0, 37.0, 24.0, 19.0, 12.0, 9.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-93.25, -90.4619140625, -87.673828125, -84.8857421875, -82.09765625, -79.3095703125, -76.521484375, -73.7333984375, -70.9453125, -68.1572265625, -65.369140625, -62.5810546875, -59.79296875, -57.0048828125, -54.216796875, -51.4287109375, -48.640625, -45.8525390625, -43.064453125, -40.2763671875, -37.48828125, -34.7001953125, -31.912109375, -29.1240234375, -26.3359375, -23.5478515625, -20.759765625, -17.9716796875, -15.18359375, -12.3955078125, -9.607421875, -6.8193359375, -4.03125, -1.2431640625, 1.544921875, 4.3330078125, 7.12109375, 9.9091796875, 12.697265625, 15.4853515625, 18.2734375, 21.0615234375, 23.849609375, 26.6376953125, 29.42578125, 32.2138671875, 35.001953125, 37.7900390625, 40.578125, 43.3662109375, 46.154296875, 48.9423828125, 51.73046875, 54.5185546875, 57.306640625, 60.0947265625, 62.8828125, 65.6708984375, 68.458984375, 71.2470703125, 74.03515625, 76.8232421875, 79.611328125, 82.3994140625, 85.1875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 3.0, 0.0, 4.0, 6.0, 8.0, 6.0, 7.0, 10.0, 11.0, 19.0, 24.0, 34.0, 28.0, 27.0, 28.0, 39.0, 54.0, 51.0, 42.0, 50.0, 38.0, 55.0, 52.0, 41.0, 38.0, 36.0, 39.0, 40.0, 49.0, 28.0, 29.0, 26.0, 12.0, 14.0, 9.0, 8.0, 10.0, 3.0, 1.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-103.375, -99.8125, -96.25, -92.6875, -89.125, -85.5625, -82.0, -78.4375, -74.875, -71.3125, -67.75, -64.1875, -60.625, -57.0625, -53.5, -49.9375, -46.375, -42.8125, -39.25, -35.6875, -32.125, -28.5625, -25.0, -21.4375, -17.875, -14.3125, -10.75, -7.1875, -3.625, -0.0625, 3.5, 7.0625, 10.625, 14.1875, 17.75, 21.3125, 24.875, 28.4375, 32.0, 35.5625, 39.125, 42.6875, 46.25, 49.8125, 53.375, 56.9375, 60.5, 64.0625, 67.625, 71.1875, 74.75, 78.3125, 81.875, 85.4375, 89.0, 92.5625, 96.125, 99.6875, 103.25, 106.8125, 110.375, 113.9375, 117.5, 121.0625, 124.625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 19.0, 20.0, 34.0, 47.0, 72.0, 109.0, 184.0, 368.0, 841.0, 2191.0, 8156.0, 42385.0, 605884.0, 339899.0, 37465.0, 7184.0, 2050.0, 781.0, 347.0, 186.0, 109.0, 54.0, 36.0, 25.0, 21.0, 11.0, 6.0, 11.0, 7.0, 5.0, 8.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-34.3125, -33.30224609375, -32.2919921875, -31.28173828125, -30.271484375, -29.26123046875, -28.2509765625, -27.24072265625, -26.23046875, -25.22021484375, -24.2099609375, -23.19970703125, -22.189453125, -21.17919921875, -20.1689453125, -19.15869140625, -18.1484375, -17.13818359375, -16.1279296875, -15.11767578125, -14.107421875, -13.09716796875, -12.0869140625, -11.07666015625, -10.06640625, -9.05615234375, -8.0458984375, -7.03564453125, -6.025390625, -5.01513671875, -4.0048828125, -2.99462890625, -1.984375, -0.97412109375, 0.0361328125, 1.04638671875, 2.056640625, 3.06689453125, 4.0771484375, 5.08740234375, 6.09765625, 7.10791015625, 8.1181640625, 9.12841796875, 10.138671875, 11.14892578125, 12.1591796875, 13.16943359375, 14.1796875, 15.18994140625, 16.2001953125, 17.21044921875, 18.220703125, 19.23095703125, 20.2412109375, 21.25146484375, 22.26171875, 23.27197265625, 24.2822265625, 25.29248046875, 26.302734375, 27.31298828125, 28.3232421875, 29.33349609375, 30.34375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 11.0, 6.0, 12.0, 8.0, 23.0, 24.0, 29.0, 31.0, 43.0, 45.0, 75.0, 94.0, 90.0, 85.0, 96.0, 53.0, 48.0, 42.0, 32.0, 35.0, 18.0, 15.0, 10.0, 15.0, 9.0, 5.0, 4.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0065765380859375, -0.0063707828521728516, -0.006165027618408203, -0.005959272384643555, -0.005753517150878906, -0.005547761917114258, -0.005342006683349609, -0.005136251449584961, -0.0049304962158203125, -0.004724740982055664, -0.004518985748291016, -0.004313230514526367, -0.004107475280761719, -0.0039017200469970703, -0.003695964813232422, -0.0034902095794677734, -0.003284454345703125, -0.0030786991119384766, -0.002872943878173828, -0.0026671886444091797, -0.0024614334106445312, -0.002255678176879883, -0.0020499229431152344, -0.001844167709350586, -0.0016384124755859375, -0.001432657241821289, -0.0012269020080566406, -0.0010211467742919922, -0.0008153915405273438, -0.0006096363067626953, -0.0004038810729980469, -0.00019812583923339844, 7.62939453125e-06, 0.00021338462829589844, 0.0004191398620605469, 0.0006248950958251953, 0.0008306503295898438, 0.0010364055633544922, 0.0012421607971191406, 0.001447916030883789, 0.0016536712646484375, 0.001859426498413086, 0.0020651817321777344, 0.002270936965942383, 0.0024766921997070312, 0.0026824474334716797, 0.002888202667236328, 0.0030939579010009766, 0.003299713134765625, 0.0035054683685302734, 0.003711223602294922, 0.00391697883605957, 0.004122734069824219, 0.004328489303588867, 0.004534244537353516, 0.004739999771118164, 0.0049457550048828125, 0.005151510238647461, 0.005357265472412109, 0.005563020706176758, 0.005768775939941406, 0.005974531173706055, 0.006180286407470703, 0.0063860416412353516, 0.006591796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 10.0, 5.0, 11.0, 20.0, 40.0, 79.0, 171.0, 439.0, 1527.0, 9466.0, 276549.0, 743524.0, 13882.0, 1889.0, 533.0, 209.0, 93.0, 43.0, 20.0, 11.0, 9.0, 2.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-58.96875, -57.00830078125, -55.0478515625, -53.08740234375, -51.126953125, -49.16650390625, -47.2060546875, -45.24560546875, -43.28515625, -41.32470703125, -39.3642578125, -37.40380859375, -35.443359375, -33.48291015625, -31.5224609375, -29.56201171875, -27.6015625, -25.64111328125, -23.6806640625, -21.72021484375, -19.759765625, -17.79931640625, -15.8388671875, -13.87841796875, -11.91796875, -9.95751953125, -7.9970703125, -6.03662109375, -4.076171875, -2.11572265625, -0.1552734375, 1.80517578125, 3.765625, 5.72607421875, 7.6865234375, 9.64697265625, 11.607421875, 13.56787109375, 15.5283203125, 17.48876953125, 19.44921875, 21.40966796875, 23.3701171875, 25.33056640625, 27.291015625, 29.25146484375, 31.2119140625, 33.17236328125, 35.1328125, 37.09326171875, 39.0537109375, 41.01416015625, 42.974609375, 44.93505859375, 46.8955078125, 48.85595703125, 50.81640625, 52.77685546875, 54.7373046875, 56.69775390625, 58.658203125, 60.61865234375, 62.5791015625, 64.53955078125, 66.5]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 12.0, 14.0, 21.0, 33.0, 31.0, 58.0, 84.0, 115.0, 130.0, 140.0, 102.0, 71.0, 55.0, 46.0, 28.0, 14.0, 10.0, 7.0, 6.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5625, -36.30517578125, -35.0478515625, -33.79052734375, -32.533203125, -31.27587890625, -30.0185546875, -28.76123046875, -27.50390625, -26.24658203125, -24.9892578125, -23.73193359375, -22.474609375, -21.21728515625, -19.9599609375, -18.70263671875, -17.4453125, -16.18798828125, -14.9306640625, -13.67333984375, -12.416015625, -11.15869140625, -9.9013671875, -8.64404296875, -7.38671875, -6.12939453125, -4.8720703125, -3.61474609375, -2.357421875, -1.10009765625, 0.1572265625, 1.41455078125, 2.671875, 3.92919921875, 5.1865234375, 6.44384765625, 7.701171875, 8.95849609375, 10.2158203125, 11.47314453125, 12.73046875, 13.98779296875, 15.2451171875, 16.50244140625, 17.759765625, 19.01708984375, 20.2744140625, 21.53173828125, 22.7890625, 24.04638671875, 25.3037109375, 26.56103515625, 27.818359375, 29.07568359375, 30.3330078125, 31.59033203125, 32.84765625, 34.10498046875, 35.3623046875, 36.61962890625, 37.876953125, 39.13427734375, 40.3916015625, 41.64892578125, 42.90625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 8.0, 29.0, 54.0, 166.0, 441.0, 201.0, 70.0, 18.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1886.7208251953125, -1848.696044921875, -1810.671142578125, -1772.646240234375, -1734.6214599609375, -1696.5966796875, -1658.57177734375, -1620.546875, -1582.5220947265625, -1544.497314453125, -1506.472412109375, -1468.447509765625, -1430.4227294921875, -1392.39794921875, -1354.373046875, -1316.34814453125, -1278.3233642578125, -1240.298583984375, -1202.273681640625, -1164.248779296875, -1126.2239990234375, -1088.19921875, -1050.17431640625, -1012.1494750976562, -974.1246337890625, -936.0997924804688, -898.074951171875, -860.0501098632812, -822.0252685546875, -784.0004272460938, -745.9755859375, -707.9507446289062, -669.9259033203125, -631.9010620117188, -593.876220703125, -555.8513793945312, -517.8265380859375, -479.80169677734375, -441.77685546875, -403.75201416015625, -365.7271728515625, -327.70233154296875, -289.677490234375, -251.65264892578125, -213.6278076171875, -175.60296630859375, -137.578125, -99.55328369140625, -61.5284423828125, -23.50360107421875, 14.521240234375, 52.54608154296875, 90.5709228515625, 128.59576416015625, 166.62060546875, 204.64544677734375, 242.6702880859375, 280.69512939453125, 318.719970703125, 356.74481201171875, 394.7696533203125, 432.79449462890625, 470.8193359375, 508.84417724609375, 546.8690185546875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 8.0, 8.0, 8.0, 9.0, 6.0, 15.0, 14.0, 17.0, 14.0, 20.0, 18.0, 19.0, 24.0, 22.0, 33.0, 39.0, 40.0, 59.0, 90.0, 93.0, 69.0, 52.0, 28.0, 44.0, 41.0, 25.0, 24.0, 14.0, 22.0, 19.0, 13.0, 18.0, 13.0, 9.0, 14.0, 9.0, 4.0, 3.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-344.2588195800781, -332.486328125, -320.7138366699219, -308.94134521484375, -297.1688537597656, -285.3963623046875, -273.62384033203125, -261.85137939453125, -250.07887268066406, -238.30638122558594, -226.5338897705078, -214.76138305664062, -202.9888916015625, -191.21640014648438, -179.44390869140625, -167.67141723632812, -155.89892578125, -144.12643432617188, -132.35394287109375, -120.5814437866211, -108.80895233154297, -97.03646087646484, -85.26396179199219, -73.49147033691406, -61.71897888183594, -49.94648742675781, -38.17399215698242, -26.40149688720703, -14.629005432128906, -2.8565139770507812, 8.915985107421875, 20.6884765625, 32.460968017578125, 44.23345947265625, 56.00595474243164, 67.77845001220703, 79.55094146728516, 91.32343292236328, 103.09593200683594, 114.86842346191406, 126.64091491699219, 138.4134063720703, 150.18589782714844, 161.95840454101562, 173.73089599609375, 185.50338745117188, 197.27587890625, 209.04837036132812, 220.82086181640625, 232.59335327148438, 244.3658447265625, 256.1383361816406, 267.91082763671875, 279.6833190917969, 291.455810546875, 303.22833251953125, 315.00079345703125, 326.7732849121094, 338.5457763671875, 350.3182678222656, 362.09075927734375, 373.8632507324219, 385.6357421875, 397.40826416015625, 409.1807556152344]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 8.0, 7.0, 11.0, 21.0, 19.0, 33.0, 34.0, 66.0, 80.0, 118.0, 221.0, 337.0, 566.0, 1052.0, 1908.0, 4217.0, 10408.0, 33501.0, 154284.0, 827020.0, 2207410.0, 764296.0, 138993.0, 31228.0, 10052.0, 3948.0, 1929.0, 1033.0, 532.0, 316.0, 231.0, 140.0, 80.0, 58.0, 45.0, 21.0, 18.0, 5.0, 7.0, 8.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.4375, -31.373046875, -30.30859375, -29.244140625, -28.1796875, -27.115234375, -26.05078125, -24.986328125, -23.921875, -22.857421875, -21.79296875, -20.728515625, -19.6640625, -18.599609375, -17.53515625, -16.470703125, -15.40625, -14.341796875, -13.27734375, -12.212890625, -11.1484375, -10.083984375, -9.01953125, -7.955078125, -6.890625, -5.826171875, -4.76171875, -3.697265625, -2.6328125, -1.568359375, -0.50390625, 0.560546875, 1.625, 2.689453125, 3.75390625, 4.818359375, 5.8828125, 6.947265625, 8.01171875, 9.076171875, 10.140625, 11.205078125, 12.26953125, 13.333984375, 14.3984375, 15.462890625, 16.52734375, 17.591796875, 18.65625, 19.720703125, 20.78515625, 21.849609375, 22.9140625, 23.978515625, 25.04296875, 26.107421875, 27.171875, 28.236328125, 29.30078125, 30.365234375, 31.4296875, 32.494140625, 33.55859375, 34.623046875, 35.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 3.0, 8.0, 6.0, 12.0, 13.0, 10.0, 20.0, 16.0, 26.0, 24.0, 27.0, 34.0, 47.0, 31.0, 38.0, 34.0, 49.0, 46.0, 34.0, 45.0, 54.0, 34.0, 35.0, 41.0, 32.0, 31.0, 27.0, 34.0, 26.0, 25.0, 19.0, 22.0, 16.0, 15.0, 13.0, 16.0, 8.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.484375, -28.6025390625, -27.720703125, -26.8388671875, -25.95703125, -25.0751953125, -24.193359375, -23.3115234375, -22.4296875, -21.5478515625, -20.666015625, -19.7841796875, -18.90234375, -18.0205078125, -17.138671875, -16.2568359375, -15.375, -14.4931640625, -13.611328125, -12.7294921875, -11.84765625, -10.9658203125, -10.083984375, -9.2021484375, -8.3203125, -7.4384765625, -6.556640625, -5.6748046875, -4.79296875, -3.9111328125, -3.029296875, -2.1474609375, -1.265625, -0.3837890625, 0.498046875, 1.3798828125, 2.26171875, 3.1435546875, 4.025390625, 4.9072265625, 5.7890625, 6.6708984375, 7.552734375, 8.4345703125, 9.31640625, 10.1982421875, 11.080078125, 11.9619140625, 12.84375, 13.7255859375, 14.607421875, 15.4892578125, 16.37109375, 17.2529296875, 18.134765625, 19.0166015625, 19.8984375, 20.7802734375, 21.662109375, 22.5439453125, 23.42578125, 24.3076171875, 25.189453125, 26.0712890625, 26.953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 8.0, 12.0, 10.0, 16.0, 26.0, 34.0, 38.0, 56.0, 128.0, 267.0, 733.0, 2375.0, 12514.0, 148224.0, 3790388.0, 219758.0, 15423.0, 2831.0, 781.0, 301.0, 118.0, 68.0, 36.0, 26.0, 20.0, 20.0, 14.0, 14.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.0, -89.173828125, -86.34765625, -83.521484375, -80.6953125, -77.869140625, -75.04296875, -72.216796875, -69.390625, -66.564453125, -63.73828125, -60.912109375, -58.0859375, -55.259765625, -52.43359375, -49.607421875, -46.78125, -43.955078125, -41.12890625, -38.302734375, -35.4765625, -32.650390625, -29.82421875, -26.998046875, -24.171875, -21.345703125, -18.51953125, -15.693359375, -12.8671875, -10.041015625, -7.21484375, -4.388671875, -1.5625, 1.263671875, 4.08984375, 6.916015625, 9.7421875, 12.568359375, 15.39453125, 18.220703125, 21.046875, 23.873046875, 26.69921875, 29.525390625, 32.3515625, 35.177734375, 38.00390625, 40.830078125, 43.65625, 46.482421875, 49.30859375, 52.134765625, 54.9609375, 57.787109375, 60.61328125, 63.439453125, 66.265625, 69.091796875, 71.91796875, 74.744140625, 77.5703125, 80.396484375, 83.22265625, 86.048828125, 88.875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 10.0, 7.0, 8.0, 12.0, 17.0, 23.0, 40.0, 67.0, 97.0, 154.0, 291.0, 461.0, 727.0, 819.0, 553.0, 316.0, 174.0, 97.0, 59.0, 45.0, 26.0, 14.0, 10.0, 14.0, 9.0, 8.0, 11.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.2587890625, -63.017578125, -60.7763671875, -58.53515625, -56.2939453125, -54.052734375, -51.8115234375, -49.5703125, -47.3291015625, -45.087890625, -42.8466796875, -40.60546875, -38.3642578125, -36.123046875, -33.8818359375, -31.640625, -29.3994140625, -27.158203125, -24.9169921875, -22.67578125, -20.4345703125, -18.193359375, -15.9521484375, -13.7109375, -11.4697265625, -9.228515625, -6.9873046875, -4.74609375, -2.5048828125, -0.263671875, 1.9775390625, 4.21875, 6.4599609375, 8.701171875, 10.9423828125, 13.18359375, 15.4248046875, 17.666015625, 19.9072265625, 22.1484375, 24.3896484375, 26.630859375, 28.8720703125, 31.11328125, 33.3544921875, 35.595703125, 37.8369140625, 40.078125, 42.3193359375, 44.560546875, 46.8017578125, 49.04296875, 51.2841796875, 53.525390625, 55.7666015625, 58.0078125, 60.2490234375, 62.490234375, 64.7314453125, 66.97265625, 69.2138671875, 71.455078125, 73.6962890625, 75.9375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 12.0, 23.0, 43.0, 66.0, 136.0, 183.0, 217.0, 142.0, 82.0, 37.0, 18.0, 10.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-706.7999877929688, -688.296875, -669.7937622070312, -651.2906494140625, -632.78759765625, -614.2844848632812, -595.7813720703125, -577.2782592773438, -558.775146484375, -540.2720336914062, -521.7689208984375, -503.2658386230469, -484.7627258300781, -466.2596130371094, -447.75653076171875, -429.25341796875, -410.75030517578125, -392.2471923828125, -373.74407958984375, -355.2409973144531, -336.7378845214844, -318.2347717285156, -299.731689453125, -281.22857666015625, -262.7254638671875, -244.22235107421875, -225.71925354003906, -207.21615600585938, -188.71304321289062, -170.20993041992188, -151.7068328857422, -133.2037353515625, -114.70062255859375, -96.19751739501953, -77.69441223144531, -59.191307067871094, -40.688201904296875, -22.185096740722656, -3.6819915771484375, 14.82110595703125, 33.32421875, 51.82732391357422, 70.33042907714844, 88.83353424072266, 107.33663940429688, 125.8397445678711, 144.3428497314453, 162.845947265625, 181.34906005859375, 199.8521728515625, 218.3552703857422, 236.85836791992188, 255.36148071289062, 273.8645935058594, 292.36767578125, 310.87078857421875, 329.3739013671875, 347.87701416015625, 366.380126953125, 384.8832092285156, 403.3863220214844, 421.8894348144531, 440.39251708984375, 458.8956298828125, 477.39874267578125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 11.0, 10.0, 14.0, 10.0, 14.0, 14.0, 19.0, 31.0, 41.0, 34.0, 58.0, 56.0, 72.0, 61.0, 71.0, 67.0, 66.0, 72.0, 51.0, 47.0, 32.0, 24.0, 15.0, 25.0, 19.0, 12.0, 14.0, 9.0, 3.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-348.3399963378906, -337.9934997558594, -327.6470031738281, -317.30047607421875, -306.9539794921875, -296.60748291015625, -286.260986328125, -275.91448974609375, -265.5679626464844, -255.22146606445312, -244.8749542236328, -234.52845764160156, -224.18194580078125, -213.83544921875, -203.48895263671875, -193.14244079589844, -182.7959442138672, -172.44944763183594, -162.10293579101562, -151.75643920898438, -141.40992736816406, -131.0634307861328, -120.71692657470703, -110.37042236328125, -100.02391815185547, -89.67741394042969, -79.3309097290039, -68.98440551757812, -58.63790512084961, -48.29140090942383, -37.94490051269531, -27.59839630126953, -17.25189208984375, -6.905388832092285, 3.4411144256591797, 13.787616729736328, 24.13412094116211, 34.48062515258789, 44.827125549316406, 55.17362976074219, 65.52013397216797, 75.86663818359375, 86.21314239501953, 96.55964660644531, 106.90614318847656, 117.25265502929688, 127.59915161132812, 137.94564819335938, 148.2921600341797, 158.63865661621094, 168.98516845703125, 179.3316650390625, 189.6781768798828, 200.02467346191406, 210.37118530273438, 220.71768188476562, 231.06417846679688, 241.41067504882812, 251.75718688964844, 262.10369873046875, 272.4501953125, 282.79669189453125, 293.1431884765625, 303.48968505859375, 313.8362121582031]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 12.0, 14.0, 21.0, 35.0, 51.0, 64.0, 94.0, 146.0, 191.0, 308.0, 459.0, 650.0, 1018.0, 1486.0, 2419.0, 3920.0, 6444.0, 10997.0, 19400.0, 36079.0, 69144.0, 138790.0, 249180.0, 237253.0, 128242.0, 63871.0, 33268.0, 18149.0, 10282.0, 6081.0, 3761.0, 2318.0, 1509.0, 927.0, 641.0, 420.0, 267.0, 187.0, 125.0, 97.0, 65.0, 51.0, 37.0, 27.0, 12.0, 21.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-40.96875, -39.72509765625, -38.4814453125, -37.23779296875, -35.994140625, -34.75048828125, -33.5068359375, -32.26318359375, -31.01953125, -29.77587890625, -28.5322265625, -27.28857421875, -26.044921875, -24.80126953125, -23.5576171875, -22.31396484375, -21.0703125, -19.82666015625, -18.5830078125, -17.33935546875, -16.095703125, -14.85205078125, -13.6083984375, -12.36474609375, -11.12109375, -9.87744140625, -8.6337890625, -7.39013671875, -6.146484375, -4.90283203125, -3.6591796875, -2.41552734375, -1.171875, 0.07177734375, 1.3154296875, 2.55908203125, 3.802734375, 5.04638671875, 6.2900390625, 7.53369140625, 8.77734375, 10.02099609375, 11.2646484375, 12.50830078125, 13.751953125, 14.99560546875, 16.2392578125, 17.48291015625, 18.7265625, 19.97021484375, 21.2138671875, 22.45751953125, 23.701171875, 24.94482421875, 26.1884765625, 27.43212890625, 28.67578125, 29.91943359375, 31.1630859375, 32.40673828125, 33.650390625, 34.89404296875, 36.1376953125, 37.38134765625, 38.625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 4.0, 12.0, 6.0, 15.0, 13.0, 14.0, 18.0, 14.0, 22.0, 19.0, 34.0, 40.0, 27.0, 38.0, 28.0, 39.0, 44.0, 32.0, 34.0, 35.0, 51.0, 38.0, 46.0, 42.0, 39.0, 21.0, 34.0, 34.0, 23.0, 31.0, 22.0, 26.0, 15.0, 14.0, 11.0, 10.0, 13.0, 10.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-28.859375, -27.97265625, -27.0859375, -26.19921875, -25.3125, -24.42578125, -23.5390625, -22.65234375, -21.765625, -20.87890625, -19.9921875, -19.10546875, -18.21875, -17.33203125, -16.4453125, -15.55859375, -14.671875, -13.78515625, -12.8984375, -12.01171875, -11.125, -10.23828125, -9.3515625, -8.46484375, -7.578125, -6.69140625, -5.8046875, -4.91796875, -4.03125, -3.14453125, -2.2578125, -1.37109375, -0.484375, 0.40234375, 1.2890625, 2.17578125, 3.0625, 3.94921875, 4.8359375, 5.72265625, 6.609375, 7.49609375, 8.3828125, 9.26953125, 10.15625, 11.04296875, 11.9296875, 12.81640625, 13.703125, 14.58984375, 15.4765625, 16.36328125, 17.25, 18.13671875, 19.0234375, 19.91015625, 20.796875, 21.68359375, 22.5703125, 23.45703125, 24.34375, 25.23046875, 26.1171875, 27.00390625, 27.890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 10.0, 9.0, 10.0, 21.0, 37.0, 40.0, 83.0, 113.0, 179.0, 267.0, 407.0, 707.0, 1419.0, 3433.0, 13682.0, 108450.0, 810064.0, 90961.0, 12273.0, 3177.0, 1323.0, 640.0, 439.0, 254.0, 163.0, 98.0, 78.0, 60.0, 47.0, 23.0, 25.0, 8.0, 7.0, 13.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-134.125, -130.544921875, -126.96484375, -123.384765625, -119.8046875, -116.224609375, -112.64453125, -109.064453125, -105.484375, -101.904296875, -98.32421875, -94.744140625, -91.1640625, -87.583984375, -84.00390625, -80.423828125, -76.84375, -73.263671875, -69.68359375, -66.103515625, -62.5234375, -58.943359375, -55.36328125, -51.783203125, -48.203125, -44.623046875, -41.04296875, -37.462890625, -33.8828125, -30.302734375, -26.72265625, -23.142578125, -19.5625, -15.982421875, -12.40234375, -8.822265625, -5.2421875, -1.662109375, 1.91796875, 5.498046875, 9.078125, 12.658203125, 16.23828125, 19.818359375, 23.3984375, 26.978515625, 30.55859375, 34.138671875, 37.71875, 41.298828125, 44.87890625, 48.458984375, 52.0390625, 55.619140625, 59.19921875, 62.779296875, 66.359375, 69.939453125, 73.51953125, 77.099609375, 80.6796875, 84.259765625, 87.83984375, 91.419921875, 95.0]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 7.0, 7.0, 11.0, 15.0, 16.0, 18.0, 21.0, 25.0, 37.0, 35.0, 49.0, 54.0, 56.0, 46.0, 62.0, 48.0, 57.0, 58.0, 49.0, 47.0, 44.0, 34.0, 20.0, 29.0, 23.0, 29.0, 17.0, 18.0, 12.0, 6.0, 7.0, 9.0, 6.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-125.6875, -121.8515625, -118.015625, -114.1796875, -110.34375, -106.5078125, -102.671875, -98.8359375, -95.0, -91.1640625, -87.328125, -83.4921875, -79.65625, -75.8203125, -71.984375, -68.1484375, -64.3125, -60.4765625, -56.640625, -52.8046875, -48.96875, -45.1328125, -41.296875, -37.4609375, -33.625, -29.7890625, -25.953125, -22.1171875, -18.28125, -14.4453125, -10.609375, -6.7734375, -2.9375, 0.8984375, 4.734375, 8.5703125, 12.40625, 16.2421875, 20.078125, 23.9140625, 27.75, 31.5859375, 35.421875, 39.2578125, 43.09375, 46.9296875, 50.765625, 54.6015625, 58.4375, 62.2734375, 66.109375, 69.9453125, 73.78125, 77.6171875, 81.453125, 85.2890625, 89.125, 92.9609375, 96.796875, 100.6328125, 104.46875, 108.3046875, 112.140625, 115.9765625, 119.8125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 12.0, 8.0, 14.0, 23.0, 23.0, 45.0, 68.0, 88.0, 149.0, 235.0, 368.0, 770.0, 1434.0, 3938.0, 12931.0, 53762.0, 348561.0, 550317.0, 55122.0, 13273.0, 4076.0, 1572.0, 735.0, 403.0, 225.0, 113.0, 94.0, 56.0, 46.0, 23.0, 12.0, 21.0, 9.0, 8.0, 3.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.7626953125, -17.150390625, -16.5380859375, -15.92578125, -15.3134765625, -14.701171875, -14.0888671875, -13.4765625, -12.8642578125, -12.251953125, -11.6396484375, -11.02734375, -10.4150390625, -9.802734375, -9.1904296875, -8.578125, -7.9658203125, -7.353515625, -6.7412109375, -6.12890625, -5.5166015625, -4.904296875, -4.2919921875, -3.6796875, -3.0673828125, -2.455078125, -1.8427734375, -1.23046875, -0.6181640625, -0.005859375, 0.6064453125, 1.21875, 1.8310546875, 2.443359375, 3.0556640625, 3.66796875, 4.2802734375, 4.892578125, 5.5048828125, 6.1171875, 6.7294921875, 7.341796875, 7.9541015625, 8.56640625, 9.1787109375, 9.791015625, 10.4033203125, 11.015625, 11.6279296875, 12.240234375, 12.8525390625, 13.46484375, 14.0771484375, 14.689453125, 15.3017578125, 15.9140625, 16.5263671875, 17.138671875, 17.7509765625, 18.36328125, 18.9755859375, 19.587890625, 20.2001953125, 20.8125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 7.0, 5.0, 6.0, 6.0, 9.0, 9.0, 7.0, 9.0, 18.0, 23.0, 23.0, 33.0, 33.0, 59.0, 67.0, 61.0, 72.0, 98.0, 86.0, 68.0, 73.0, 46.0, 31.0, 30.0, 26.0, 13.0, 16.0, 12.0, 13.0, 9.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0052642822265625, -0.005080282688140869, -0.004896283149719238, -0.004712283611297607, -0.0045282840728759766, -0.004344284534454346, -0.004160284996032715, -0.003976285457611084, -0.003792285919189453, -0.0036082863807678223, -0.0034242868423461914, -0.0032402873039245605, -0.0030562877655029297, -0.002872288227081299, -0.002688288688659668, -0.002504289150238037, -0.0023202896118164062, -0.0021362900733947754, -0.0019522905349731445, -0.0017682909965515137, -0.0015842914581298828, -0.001400291919708252, -0.001216292381286621, -0.0010322928428649902, -0.0008482933044433594, -0.0006642937660217285, -0.00048029422760009766, -0.0002962946891784668, -0.00011229515075683594, 7.170438766479492e-05, 0.0002557039260864258, 0.00043970346450805664, 0.0006237030029296875, 0.0008077025413513184, 0.0009917020797729492, 0.00117570161819458, 0.001359701156616211, 0.0015437006950378418, 0.0017277002334594727, 0.0019116997718811035, 0.0020956993103027344, 0.0022796988487243652, 0.002463698387145996, 0.002647697925567627, 0.002831697463989258, 0.0030156970024108887, 0.0031996965408325195, 0.0033836960792541504, 0.0035676956176757812, 0.003751695156097412, 0.003935694694519043, 0.004119694232940674, 0.004303693771362305, 0.0044876933097839355, 0.004671692848205566, 0.004855692386627197, 0.005039691925048828, 0.005223691463470459, 0.00540769100189209, 0.005591690540313721, 0.0057756900787353516, 0.005959689617156982, 0.006143689155578613, 0.006327688694000244, 0.006511688232421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 14.0, 16.0, 27.0, 39.0, 56.0, 88.0, 142.0, 256.0, 387.0, 672.0, 1368.0, 3308.0, 9764.0, 41513.0, 236781.0, 656969.0, 73540.0, 15363.0, 4531.0, 1695.0, 829.0, 413.0, 244.0, 177.0, 112.0, 67.0, 52.0, 42.0, 25.0, 12.0, 8.0, 5.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.3046875, -14.7198486328125, -14.135009765625, -13.5501708984375, -12.96533203125, -12.3804931640625, -11.795654296875, -11.2108154296875, -10.6259765625, -10.0411376953125, -9.456298828125, -8.8714599609375, -8.28662109375, -7.7017822265625, -7.116943359375, -6.5321044921875, -5.947265625, -5.3624267578125, -4.777587890625, -4.1927490234375, -3.60791015625, -3.0230712890625, -2.438232421875, -1.8533935546875, -1.2685546875, -0.6837158203125, -0.098876953125, 0.4859619140625, 1.07080078125, 1.6556396484375, 2.240478515625, 2.8253173828125, 3.41015625, 3.9949951171875, 4.579833984375, 5.1646728515625, 5.74951171875, 6.3343505859375, 6.919189453125, 7.5040283203125, 8.0888671875, 8.6737060546875, 9.258544921875, 9.8433837890625, 10.42822265625, 11.0130615234375, 11.597900390625, 12.1827392578125, 12.767578125, 13.3524169921875, 13.937255859375, 14.5220947265625, 15.10693359375, 15.6917724609375, 16.276611328125, 16.8614501953125, 17.4462890625, 18.0311279296875, 18.615966796875, 19.2008056640625, 19.78564453125, 20.3704833984375, 20.955322265625, 21.5401611328125, 22.125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 12.0, 12.0, 12.0, 21.0, 13.0, 25.0, 20.0, 31.0, 37.0, 44.0, 28.0, 42.0, 40.0, 63.0, 58.0, 57.0, 61.0, 57.0, 60.0, 40.0, 51.0, 33.0, 18.0, 24.0, 27.0, 17.0, 19.0, 10.0, 5.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.1484375, -11.7091064453125, -11.269775390625, -10.8304443359375, -10.39111328125, -9.9517822265625, -9.512451171875, -9.0731201171875, -8.6337890625, -8.1944580078125, -7.755126953125, -7.3157958984375, -6.87646484375, -6.4371337890625, -5.997802734375, -5.5584716796875, -5.119140625, -4.6798095703125, -4.240478515625, -3.8011474609375, -3.36181640625, -2.9224853515625, -2.483154296875, -2.0438232421875, -1.6044921875, -1.1651611328125, -0.725830078125, -0.2864990234375, 0.15283203125, 0.5921630859375, 1.031494140625, 1.4708251953125, 1.91015625, 2.3494873046875, 2.788818359375, 3.2281494140625, 3.66748046875, 4.1068115234375, 4.546142578125, 4.9854736328125, 5.4248046875, 5.8641357421875, 6.303466796875, 6.7427978515625, 7.18212890625, 7.6214599609375, 8.060791015625, 8.5001220703125, 8.939453125, 9.3787841796875, 9.818115234375, 10.2574462890625, 10.69677734375, 11.1361083984375, 11.575439453125, 12.0147705078125, 12.4541015625, 12.8934326171875, 13.332763671875, 13.7720947265625, 14.21142578125, 14.6507568359375, 15.090087890625, 15.5294189453125, 15.96875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 10.0, 15.0, 28.0, 40.0, 114.0, 242.0, 323.0, 103.0, 62.0, 27.0, 20.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-905.3668212890625, -882.2041625976562, -859.04150390625, -835.8788452148438, -812.7161865234375, -789.553466796875, -766.390869140625, -743.2281494140625, -720.0654907226562, -696.90283203125, -673.7401733398438, -650.5775146484375, -627.4148559570312, -604.252197265625, -581.0894775390625, -557.9268188476562, -534.76416015625, -511.60150146484375, -488.4388427734375, -465.27618408203125, -442.1134948730469, -418.9508361816406, -395.7881774902344, -372.62548828125, -349.462890625, -326.30023193359375, -303.1375732421875, -279.97491455078125, -256.8122253417969, -233.64956665039062, -210.48690795898438, -187.32423400878906, -164.16156005859375, -140.9989013671875, -117.83622741699219, -94.67356872558594, -71.51090240478516, -48.348236083984375, -25.185577392578125, -2.0229034423828125, 21.139755249023438, 44.30242156982422, 67.465087890625, 90.62774658203125, 113.79041290283203, 136.9530792236328, 160.11573791503906, 183.27841186523438, 206.44107055664062, 229.60372924804688, 252.7664031982422, 275.9290771484375, 299.09173583984375, 322.25439453125, 345.41705322265625, 368.5797119140625, 391.74237060546875, 414.905029296875, 438.06768798828125, 461.2303466796875, 484.3930358886719, 507.5556945800781, 530.7183837890625, 553.8810424804688, 577.043701171875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 8.0, 8.0, 4.0, 15.0, 12.0, 10.0, 18.0, 17.0, 16.0, 19.0, 27.0, 25.0, 33.0, 27.0, 32.0, 55.0, 97.0, 142.0, 82.0, 53.0, 37.0, 25.0, 35.0, 26.0, 25.0, 18.0, 15.0, 15.0, 13.0, 12.0, 11.0, 9.0, 5.0, 11.0, 6.0, 3.0, 4.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-438.62176513671875, -426.1958923339844, -413.77001953125, -401.3441162109375, -388.9182434082031, -376.49237060546875, -364.0664978027344, -351.640625, -339.2147216796875, -326.7888488769531, -314.36297607421875, -301.93707275390625, -289.5111999511719, -277.0853271484375, -264.6594543457031, -252.23358154296875, -239.80770874023438, -227.3818359375, -214.95594787597656, -202.5300750732422, -190.10418701171875, -177.67831420898438, -165.25244140625, -152.82656860351562, -140.4006805419922, -127.97480010986328, -115.54891967773438, -103.123046875, -90.6971664428711, -78.27128601074219, -65.84541320800781, -53.419532775878906, -40.99365234375, -28.567773818969727, -16.141895294189453, -3.7160186767578125, 8.709861755371094, 21.1357421875, 33.561614990234375, 45.98749542236328, 58.41337585449219, 70.8392562866211, 83.26513671875, 95.69100952148438, 108.11688995361328, 120.54277038574219, 132.96864318847656, 145.39453125, 157.82040405273438, 170.24627685546875, 182.6721649169922, 195.09803771972656, 207.52392578125, 219.94979858398438, 232.37567138671875, 244.80154418945312, 257.2274169921875, 269.6532897949219, 282.07916259765625, 294.50506591796875, 306.9309387207031, 319.3568115234375, 331.7826843261719, 344.20855712890625, 356.63446044921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 12.0, 11.0, 17.0, 38.0, 44.0, 70.0, 113.0, 190.0, 274.0, 522.0, 955.0, 1836.0, 4210.0, 11292.0, 43516.0, 282403.0, 1684330.0, 1772236.0, 322487.0, 48783.0, 12329.0, 4542.0, 1901.0, 938.0, 498.0, 280.0, 148.0, 111.0, 55.0, 52.0, 15.0, 15.0, 17.0, 12.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-66.0625, -64.2783203125, -62.494140625, -60.7099609375, -58.92578125, -57.1416015625, -55.357421875, -53.5732421875, -51.7890625, -50.0048828125, -48.220703125, -46.4365234375, -44.65234375, -42.8681640625, -41.083984375, -39.2998046875, -37.515625, -35.7314453125, -33.947265625, -32.1630859375, -30.37890625, -28.5947265625, -26.810546875, -25.0263671875, -23.2421875, -21.4580078125, -19.673828125, -17.8896484375, -16.10546875, -14.3212890625, -12.537109375, -10.7529296875, -8.96875, -7.1845703125, -5.400390625, -3.6162109375, -1.83203125, -0.0478515625, 1.736328125, 3.5205078125, 5.3046875, 7.0888671875, 8.873046875, 10.6572265625, 12.44140625, 14.2255859375, 16.009765625, 17.7939453125, 19.578125, 21.3623046875, 23.146484375, 24.9306640625, 26.71484375, 28.4990234375, 30.283203125, 32.0673828125, 33.8515625, 35.6357421875, 37.419921875, 39.2041015625, 40.98828125, 42.7724609375, 44.556640625, 46.3408203125, 48.125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 6.0, 4.0, 8.0, 6.0, 11.0, 5.0, 18.0, 17.0, 23.0, 13.0, 34.0, 29.0, 27.0, 29.0, 27.0, 45.0, 40.0, 54.0, 45.0, 37.0, 47.0, 42.0, 47.0, 49.0, 36.0, 42.0, 42.0, 26.0, 23.0, 28.0, 19.0, 23.0, 20.0, 16.0, 7.0, 9.0, 11.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-27.59375, -26.73046875, -25.8671875, -25.00390625, -24.140625, -23.27734375, -22.4140625, -21.55078125, -20.6875, -19.82421875, -18.9609375, -18.09765625, -17.234375, -16.37109375, -15.5078125, -14.64453125, -13.78125, -12.91796875, -12.0546875, -11.19140625, -10.328125, -9.46484375, -8.6015625, -7.73828125, -6.875, -6.01171875, -5.1484375, -4.28515625, -3.421875, -2.55859375, -1.6953125, -0.83203125, 0.03125, 0.89453125, 1.7578125, 2.62109375, 3.484375, 4.34765625, 5.2109375, 6.07421875, 6.9375, 7.80078125, 8.6640625, 9.52734375, 10.390625, 11.25390625, 12.1171875, 12.98046875, 13.84375, 14.70703125, 15.5703125, 16.43359375, 17.296875, 18.16015625, 19.0234375, 19.88671875, 20.75, 21.61328125, 22.4765625, 23.33984375, 24.203125, 25.06640625, 25.9296875, 26.79296875, 27.65625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 8.0, 23.0, 22.0, 39.0, 62.0, 99.0, 212.0, 419.0, 939.0, 3338.0, 33059.0, 4017689.0, 129693.0, 5920.0, 1459.0, 619.0, 289.0, 142.0, 76.0, 52.0, 45.0, 15.0, 12.0, 12.0, 4.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.625, -155.55859375, -149.4921875, -143.42578125, -137.359375, -131.29296875, -125.2265625, -119.16015625, -113.09375, -107.02734375, -100.9609375, -94.89453125, -88.828125, -82.76171875, -76.6953125, -70.62890625, -64.5625, -58.49609375, -52.4296875, -46.36328125, -40.296875, -34.23046875, -28.1640625, -22.09765625, -16.03125, -9.96484375, -3.8984375, 2.16796875, 8.234375, 14.30078125, 20.3671875, 26.43359375, 32.5, 38.56640625, 44.6328125, 50.69921875, 56.765625, 62.83203125, 68.8984375, 74.96484375, 81.03125, 87.09765625, 93.1640625, 99.23046875, 105.296875, 111.36328125, 117.4296875, 123.49609375, 129.5625, 135.62890625, 141.6953125, 147.76171875, 153.828125, 159.89453125, 165.9609375, 172.02734375, 178.09375, 184.16015625, 190.2265625, 196.29296875, 202.359375, 208.42578125, 214.4921875, 220.55859375, 226.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 9.0, 16.0, 19.0, 32.0, 36.0, 64.0, 99.0, 147.0, 177.0, 326.0, 413.0, 547.0, 590.0, 457.0, 306.0, 235.0, 172.0, 126.0, 82.0, 60.0, 38.0, 31.0, 17.0, 15.0, 4.0, 13.0, 7.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-87.9375, -85.1064453125, -82.275390625, -79.4443359375, -76.61328125, -73.7822265625, -70.951171875, -68.1201171875, -65.2890625, -62.4580078125, -59.626953125, -56.7958984375, -53.96484375, -51.1337890625, -48.302734375, -45.4716796875, -42.640625, -39.8095703125, -36.978515625, -34.1474609375, -31.31640625, -28.4853515625, -25.654296875, -22.8232421875, -19.9921875, -17.1611328125, -14.330078125, -11.4990234375, -8.66796875, -5.8369140625, -3.005859375, -0.1748046875, 2.65625, 5.4873046875, 8.318359375, 11.1494140625, 13.98046875, 16.8115234375, 19.642578125, 22.4736328125, 25.3046875, 28.1357421875, 30.966796875, 33.7978515625, 36.62890625, 39.4599609375, 42.291015625, 45.1220703125, 47.953125, 50.7841796875, 53.615234375, 56.4462890625, 59.27734375, 62.1083984375, 64.939453125, 67.7705078125, 70.6015625, 73.4326171875, 76.263671875, 79.0947265625, 81.92578125, 84.7568359375, 87.587890625, 90.4189453125, 93.25]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 6.0, 22.0, 65.0, 159.0, 292.0, 199.0, 116.0, 62.0, 30.0, 8.0, 12.0, 10.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-779.4631958007812, -732.6862182617188, -685.9091796875, -639.1322021484375, -592.355224609375, -545.5782470703125, -498.80120849609375, -452.02423095703125, -405.2472229003906, -358.47021484375, -311.6932373046875, -264.9162292480469, -218.1392364501953, -171.36224365234375, -124.58523559570312, -77.80825805664062, -31.03125, 15.745746612548828, 62.522743225097656, 109.29974365234375, 156.0767364501953, 202.85372924804688, 249.6307373046875, 296.40771484375, 343.1847229003906, 389.96173095703125, 436.73870849609375, 483.5157165527344, 530.292724609375, 577.0697021484375, 623.8466796875, 670.6236572265625, 717.4007568359375, 764.177734375, 810.9547729492188, 857.7317504882812, 904.5087280273438, 951.2857666015625, 998.062744140625, 1044.8397216796875, 1091.61669921875, 1138.3936767578125, 1185.170654296875, 1231.94775390625, 1278.7247314453125, 1325.501708984375, 1372.2786865234375, 1419.0556640625, 1465.832763671875, 1512.6097412109375, 1559.38671875, 1606.163818359375, 1652.9407958984375, 1699.7177734375, 1746.4947509765625, 1793.271728515625, 1840.0487060546875, 1886.82568359375, 1933.6026611328125, 1980.379638671875, 2027.15673828125, 2073.93359375, 2120.710693359375, 2167.48779296875, 2214.2646484375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 4.0, 5.0, 7.0, 8.0, 11.0, 10.0, 9.0, 8.0, 14.0, 18.0, 20.0, 16.0, 20.0, 33.0, 37.0, 46.0, 42.0, 35.0, 53.0, 33.0, 47.0, 53.0, 48.0, 53.0, 45.0, 38.0, 40.0, 39.0, 23.0, 24.0, 25.0, 23.0, 16.0, 17.0, 18.0, 17.0, 12.0, 6.0, 7.0, 4.0, 8.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-583.745849609375, -567.8884887695312, -552.0311279296875, -536.1737670898438, -520.31640625, -504.45904541015625, -488.6017150878906, -472.7443542480469, -456.8869934082031, -441.0296325683594, -425.1722717285156, -409.3149108886719, -393.45758056640625, -377.6002197265625, -361.74285888671875, -345.885498046875, -330.02813720703125, -314.1707763671875, -298.31341552734375, -282.4560546875, -266.59869384765625, -250.74134826660156, -234.88400268554688, -219.02664184570312, -203.16928100585938, -187.31192016601562, -171.45455932617188, -155.5972137451172, -139.73985290527344, -123.88249206542969, -108.02513885498047, -92.16778564453125, -76.31045532226562, -60.45309829711914, -44.595741271972656, -28.738384246826172, -12.881027221679688, 2.9763336181640625, 18.83368682861328, 34.6910400390625, 50.54840087890625, 66.40576171875, 82.26311492919922, 98.12046813964844, 113.97782897949219, 129.83518981933594, 145.69253540039062, 161.54989624023438, 177.40725708007812, 193.26461791992188, 209.12197875976562, 224.9793243408203, 240.83668518066406, 256.69403076171875, 272.5513916015625, 288.40875244140625, 304.26611328125, 320.12347412109375, 335.9808349609375, 351.83819580078125, 367.695556640625, 383.55291748046875, 399.4102478027344, 415.2676086425781, 431.1249694824219]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 20.0, 19.0, 51.0, 64.0, 101.0, 161.0, 318.0, 645.0, 1237.0, 2856.0, 7363.0, 21242.0, 75541.0, 482871.0, 362025.0, 63963.0, 18477.0, 6542.0, 2581.0, 1160.0, 579.0, 293.0, 158.0, 120.0, 63.0, 38.0, 12.0, 12.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.875, -74.7939453125, -72.712890625, -70.6318359375, -68.55078125, -66.4697265625, -64.388671875, -62.3076171875, -60.2265625, -58.1455078125, -56.064453125, -53.9833984375, -51.90234375, -49.8212890625, -47.740234375, -45.6591796875, -43.578125, -41.4970703125, -39.416015625, -37.3349609375, -35.25390625, -33.1728515625, -31.091796875, -29.0107421875, -26.9296875, -24.8486328125, -22.767578125, -20.6865234375, -18.60546875, -16.5244140625, -14.443359375, -12.3623046875, -10.28125, -8.2001953125, -6.119140625, -4.0380859375, -1.95703125, 0.1240234375, 2.205078125, 4.2861328125, 6.3671875, 8.4482421875, 10.529296875, 12.6103515625, 14.69140625, 16.7724609375, 18.853515625, 20.9345703125, 23.015625, 25.0966796875, 27.177734375, 29.2587890625, 31.33984375, 33.4208984375, 35.501953125, 37.5830078125, 39.6640625, 41.7451171875, 43.826171875, 45.9072265625, 47.98828125, 50.0693359375, 52.150390625, 54.2314453125, 56.3125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 8.0, 8.0, 6.0, 6.0, 10.0, 12.0, 15.0, 21.0, 19.0, 31.0, 23.0, 29.0, 41.0, 46.0, 42.0, 36.0, 45.0, 46.0, 46.0, 43.0, 49.0, 43.0, 32.0, 50.0, 42.0, 31.0, 42.0, 30.0, 20.0, 16.0, 27.0, 15.0, 17.0, 9.0, 12.0, 2.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.90625, -31.84912109375, -30.7919921875, -29.73486328125, -28.677734375, -27.62060546875, -26.5634765625, -25.50634765625, -24.44921875, -23.39208984375, -22.3349609375, -21.27783203125, -20.220703125, -19.16357421875, -18.1064453125, -17.04931640625, -15.9921875, -14.93505859375, -13.8779296875, -12.82080078125, -11.763671875, -10.70654296875, -9.6494140625, -8.59228515625, -7.53515625, -6.47802734375, -5.4208984375, -4.36376953125, -3.306640625, -2.24951171875, -1.1923828125, -0.13525390625, 0.921875, 1.97900390625, 3.0361328125, 4.09326171875, 5.150390625, 6.20751953125, 7.2646484375, 8.32177734375, 9.37890625, 10.43603515625, 11.4931640625, 12.55029296875, 13.607421875, 14.66455078125, 15.7216796875, 16.77880859375, 17.8359375, 18.89306640625, 19.9501953125, 21.00732421875, 22.064453125, 23.12158203125, 24.1787109375, 25.23583984375, 26.29296875, 27.35009765625, 28.4072265625, 29.46435546875, 30.521484375, 31.57861328125, 32.6357421875, 33.69287109375, 34.75]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 7.0, 14.0, 16.0, 26.0, 35.0, 41.0, 81.0, 107.0, 207.0, 346.0, 723.0, 1812.0, 6828.0, 50853.0, 921615.0, 55009.0, 7112.0, 1904.0, 817.0, 389.0, 201.0, 127.0, 80.0, 61.0, 39.0, 25.0, 17.0, 14.0, 16.0, 10.0, 5.0, 5.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.3125, -106.1455078125, -102.978515625, -99.8115234375, -96.64453125, -93.4775390625, -90.310546875, -87.1435546875, -83.9765625, -80.8095703125, -77.642578125, -74.4755859375, -71.30859375, -68.1416015625, -64.974609375, -61.8076171875, -58.640625, -55.4736328125, -52.306640625, -49.1396484375, -45.97265625, -42.8056640625, -39.638671875, -36.4716796875, -33.3046875, -30.1376953125, -26.970703125, -23.8037109375, -20.63671875, -17.4697265625, -14.302734375, -11.1357421875, -7.96875, -4.8017578125, -1.634765625, 1.5322265625, 4.69921875, 7.8662109375, 11.033203125, 14.2001953125, 17.3671875, 20.5341796875, 23.701171875, 26.8681640625, 30.03515625, 33.2021484375, 36.369140625, 39.5361328125, 42.703125, 45.8701171875, 49.037109375, 52.2041015625, 55.37109375, 58.5380859375, 61.705078125, 64.8720703125, 68.0390625, 71.2060546875, 74.373046875, 77.5400390625, 80.70703125, 83.8740234375, 87.041015625, 90.2080078125, 93.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 9.0, 7.0, 5.0, 12.0, 13.0, 15.0, 21.0, 23.0, 29.0, 31.0, 58.0, 72.0, 69.0, 84.0, 91.0, 77.0, 66.0, 51.0, 48.0, 27.0, 28.0, 24.0, 26.0, 21.0, 20.0, 12.0, 10.0, 8.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-154.125, -149.39453125, -144.6640625, -139.93359375, -135.203125, -130.47265625, -125.7421875, -121.01171875, -116.28125, -111.55078125, -106.8203125, -102.08984375, -97.359375, -92.62890625, -87.8984375, -83.16796875, -78.4375, -73.70703125, -68.9765625, -64.24609375, -59.515625, -54.78515625, -50.0546875, -45.32421875, -40.59375, -35.86328125, -31.1328125, -26.40234375, -21.671875, -16.94140625, -12.2109375, -7.48046875, -2.75, 1.98046875, 6.7109375, 11.44140625, 16.171875, 20.90234375, 25.6328125, 30.36328125, 35.09375, 39.82421875, 44.5546875, 49.28515625, 54.015625, 58.74609375, 63.4765625, 68.20703125, 72.9375, 77.66796875, 82.3984375, 87.12890625, 91.859375, 96.58984375, 101.3203125, 106.05078125, 110.78125, 115.51171875, 120.2421875, 124.97265625, 129.703125, 134.43359375, 139.1640625, 143.89453125, 148.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 7.0, 12.0, 10.0, 13.0, 22.0, 46.0, 51.0, 84.0, 143.0, 297.0, 705.0, 2086.0, 8282.0, 57609.0, 919292.0, 49219.0, 7477.0, 1941.0, 577.0, 285.0, 133.0, 85.0, 56.0, 43.0, 29.0, 9.0, 14.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.983154296875, -20.29443359375, -19.605712890625, -18.9169921875, -18.228271484375, -17.53955078125, -16.850830078125, -16.162109375, -15.473388671875, -14.78466796875, -14.095947265625, -13.4072265625, -12.718505859375, -12.02978515625, -11.341064453125, -10.65234375, -9.963623046875, -9.27490234375, -8.586181640625, -7.8974609375, -7.208740234375, -6.52001953125, -5.831298828125, -5.142578125, -4.453857421875, -3.76513671875, -3.076416015625, -2.3876953125, -1.698974609375, -1.01025390625, -0.321533203125, 0.3671875, 1.055908203125, 1.74462890625, 2.433349609375, 3.1220703125, 3.810791015625, 4.49951171875, 5.188232421875, 5.876953125, 6.565673828125, 7.25439453125, 7.943115234375, 8.6318359375, 9.320556640625, 10.00927734375, 10.697998046875, 11.38671875, 12.075439453125, 12.76416015625, 13.452880859375, 14.1416015625, 14.830322265625, 15.51904296875, 16.207763671875, 16.896484375, 17.585205078125, 18.27392578125, 18.962646484375, 19.6513671875, 20.340087890625, 21.02880859375, 21.717529296875, 22.40625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 18.0, 13.0, 24.0, 34.0, 46.0, 79.0, 121.0, 143.0, 143.0, 100.0, 69.0, 50.0, 31.0, 29.0, 24.0, 12.0, 13.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0073089599609375, -0.007094025611877441, -0.006879091262817383, -0.006664156913757324, -0.006449222564697266, -0.006234288215637207, -0.0060193538665771484, -0.00580441951751709, -0.005589485168457031, -0.005374550819396973, -0.005159616470336914, -0.0049446821212768555, -0.004729747772216797, -0.004514813423156738, -0.00429987907409668, -0.004084944725036621, -0.0038700103759765625, -0.003655076026916504, -0.0034401416778564453, -0.0032252073287963867, -0.003010272979736328, -0.0027953386306762695, -0.002580404281616211, -0.0023654699325561523, -0.0021505355834960938, -0.0019356012344360352, -0.0017206668853759766, -0.001505732536315918, -0.0012907981872558594, -0.0010758638381958008, -0.0008609294891357422, -0.0006459951400756836, -0.000431060791015625, -0.0002161264419555664, -1.1920928955078125e-06, 0.00021374225616455078, 0.0004286766052246094, 0.000643610954284668, 0.0008585453033447266, 0.0010734796524047852, 0.0012884140014648438, 0.0015033483505249023, 0.001718282699584961, 0.0019332170486450195, 0.002148151397705078, 0.0023630857467651367, 0.0025780200958251953, 0.002792954444885254, 0.0030078887939453125, 0.003222823143005371, 0.0034377574920654297, 0.0036526918411254883, 0.003867626190185547, 0.0040825605392456055, 0.004297494888305664, 0.004512429237365723, 0.004727363586425781, 0.00494229793548584, 0.0051572322845458984, 0.005372166633605957, 0.005587100982666016, 0.005802035331726074, 0.006016969680786133, 0.006231904029846191, 0.00644683837890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 6.0, 3.0, 7.0, 7.0, 8.0, 12.0, 19.0, 23.0, 45.0, 62.0, 127.0, 267.0, 745.0, 2278.0, 11290.0, 153448.0, 853086.0, 21672.0, 3635.0, 1014.0, 373.0, 175.0, 106.0, 44.0, 34.0, 20.0, 11.0, 12.0, 14.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.1875, -21.556396484375, -20.92529296875, -20.294189453125, -19.6630859375, -19.031982421875, -18.40087890625, -17.769775390625, -17.138671875, -16.507568359375, -15.87646484375, -15.245361328125, -14.6142578125, -13.983154296875, -13.35205078125, -12.720947265625, -12.08984375, -11.458740234375, -10.82763671875, -10.196533203125, -9.5654296875, -8.934326171875, -8.30322265625, -7.672119140625, -7.041015625, -6.409912109375, -5.77880859375, -5.147705078125, -4.5166015625, -3.885498046875, -3.25439453125, -2.623291015625, -1.9921875, -1.361083984375, -0.72998046875, -0.098876953125, 0.5322265625, 1.163330078125, 1.79443359375, 2.425537109375, 3.056640625, 3.687744140625, 4.31884765625, 4.949951171875, 5.5810546875, 6.212158203125, 6.84326171875, 7.474365234375, 8.10546875, 8.736572265625, 9.36767578125, 9.998779296875, 10.6298828125, 11.260986328125, 11.89208984375, 12.523193359375, 13.154296875, 13.785400390625, 14.41650390625, 15.047607421875, 15.6787109375, 16.309814453125, 16.94091796875, 17.572021484375, 18.203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 5.0, 7.0, 4.0, 4.0, 7.0, 10.0, 11.0, 12.0, 24.0, 25.0, 30.0, 40.0, 45.0, 56.0, 81.0, 97.0, 108.0, 78.0, 86.0, 63.0, 45.0, 25.0, 28.0, 26.0, 13.0, 15.0, 11.0, 10.0, 8.0, 4.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.484375, -11.0751953125, -10.666015625, -10.2568359375, -9.84765625, -9.4384765625, -9.029296875, -8.6201171875, -8.2109375, -7.8017578125, -7.392578125, -6.9833984375, -6.57421875, -6.1650390625, -5.755859375, -5.3466796875, -4.9375, -4.5283203125, -4.119140625, -3.7099609375, -3.30078125, -2.8916015625, -2.482421875, -2.0732421875, -1.6640625, -1.2548828125, -0.845703125, -0.4365234375, -0.02734375, 0.3818359375, 0.791015625, 1.2001953125, 1.609375, 2.0185546875, 2.427734375, 2.8369140625, 3.24609375, 3.6552734375, 4.064453125, 4.4736328125, 4.8828125, 5.2919921875, 5.701171875, 6.1103515625, 6.51953125, 6.9287109375, 7.337890625, 7.7470703125, 8.15625, 8.5654296875, 8.974609375, 9.3837890625, 9.79296875, 10.2021484375, 10.611328125, 11.0205078125, 11.4296875, 11.8388671875, 12.248046875, 12.6572265625, 13.06640625, 13.4755859375, 13.884765625, 14.2939453125, 14.703125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 17.0, 26.0, 61.0, 122.0, 550.0, 104.0, 64.0, 27.0, 15.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-958.3433837890625, -932.1453857421875, -905.9473266601562, -879.7493286132812, -853.55126953125, -827.353271484375, -801.1552734375, -774.957275390625, -748.7592163085938, -722.5612182617188, -696.3631591796875, -670.1651611328125, -643.9671630859375, -617.7691040039062, -591.5711059570312, -565.373046875, -539.175048828125, -512.97705078125, -486.77899169921875, -460.58099365234375, -434.3829650878906, -408.1849365234375, -381.9869384765625, -355.7889099121094, -329.59088134765625, -303.3928527832031, -277.19482421875, -250.996826171875, -224.79879760742188, -198.60076904296875, -172.4027557373047, -146.20474243164062, -120.0067138671875, -93.8086929321289, -67.61067199707031, -41.41265106201172, -15.214630126953125, 10.9833984375, 37.18141174316406, 63.379425048828125, 89.57745361328125, 115.77547454833984, 141.97349548339844, 168.1715087890625, 194.36953735351562, 220.56756591796875, 246.7655792236328, 272.9635925292969, 299.16162109375, 325.3596496582031, 351.55767822265625, 377.75567626953125, 403.9537048339844, 430.1517333984375, 456.3497314453125, 482.5477600097656, 508.74578857421875, 534.9437866210938, 561.141845703125, 587.33984375, 613.537841796875, 639.7359008789062, 665.9338989257812, 692.1319580078125, 718.3299560546875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 5.0, 5.0, 11.0, 5.0, 13.0, 19.0, 11.0, 19.0, 24.0, 25.0, 15.0, 22.0, 26.0, 35.0, 54.0, 274.0, 163.0, 42.0, 26.0, 20.0, 26.0, 25.0, 16.0, 7.0, 15.0, 15.0, 12.0, 6.0, 9.0, 7.0, 9.0, 5.0, 3.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-336.88006591796875, -325.17572021484375, -313.4714050292969, -301.7670593261719, -290.062744140625, -278.3583984375, -266.654052734375, -254.94973754882812, -243.2454071044922, -231.54107666015625, -219.8367462158203, -208.13241577148438, -196.42807006835938, -184.7237548828125, -173.0194091796875, -161.31507873535156, -149.61074829101562, -137.9064178466797, -126.20208740234375, -114.49774932861328, -102.79341888427734, -91.0890884399414, -79.38475036621094, -67.680419921875, -55.97608947753906, -44.271759033203125, -32.56742477416992, -20.86309051513672, -9.158760070800781, 2.5455703735351562, 14.249908447265625, 25.954238891601562, 37.658599853515625, 49.36293029785156, 61.067264556884766, 72.77159881591797, 84.4759292602539, 96.18025970458984, 107.88459777832031, 119.58892822265625, 131.2932586669922, 142.99758911132812, 154.70191955566406, 166.40625, 178.110595703125, 189.81491088867188, 201.51925659179688, 213.2235870361328, 224.92791748046875, 236.6322479248047, 248.33657836914062, 260.0409240722656, 271.7452392578125, 283.4495849609375, 295.1539306640625, 306.8582458496094, 318.56256103515625, 330.26690673828125, 341.9712219238281, 353.6755676269531, 365.3798828125, 377.084228515625, 388.78857421875, 400.4928894042969, 412.1972351074219]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 7.0, 11.0, 5.0, 10.0, 8.0, 10.0, 9.0, 15.0, 22.0, 25.0, 31.0, 39.0, 26.0, 35.0, 78.0, 195.0, 146.0, 52.0, 44.0, 27.0, 23.0, 32.0, 28.0, 18.0, 16.0, 13.0, 8.0, 9.0, 11.0, 10.0, 3.0, 12.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-36.0625, -35.059326171875, -34.05615234375, -33.052978515625, -32.0498046875, -31.046630859375, -30.04345703125, -29.040283203125, -28.037109375, -27.033935546875, -26.03076171875, -25.027587890625, -24.0244140625, -23.021240234375, -22.01806640625, -21.014892578125, -20.01171875, -19.008544921875, -18.00537109375, -17.002197265625, -15.9990234375, -14.995849609375, -13.99267578125, -12.989501953125, -11.986328125, -10.983154296875, -9.97998046875, -8.976806640625, -7.9736328125, -6.970458984375, -5.96728515625, -4.964111328125, -3.9609375, -2.957763671875, -1.95458984375, -0.951416015625, 0.0517578125, 1.054931640625, 2.05810546875, 3.061279296875, 4.064453125, 5.067626953125, 6.07080078125, 7.073974609375, 8.0771484375, 9.080322265625, 10.08349609375, 11.086669921875, 12.08984375, 13.093017578125, 14.09619140625, 15.099365234375, 16.1025390625, 17.105712890625, 18.10888671875, 19.112060546875, 20.115234375, 21.118408203125, 22.12158203125, 23.124755859375, 24.1279296875, 25.131103515625, 26.13427734375, 27.137451171875, 28.140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 7.0, 3.0, 1.0, 2.0, 8.0, 16.0, 16.0, 42.0, 36.0, 45.0, 90.0, 261.0, 862.0, 4537.0, 8298987.0, 79373.0, 3230.0, 627.0, 176.0, 90.0, 55.0, 30.0, 22.0, 14.0, 10.0, 3.0, 5.0, 5.0, 5.0, 2.0, 2.0, 8.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-454.3185729980469, -440.08111572265625, -425.8436584472656, -411.606201171875, -397.3687438964844, -383.13128662109375, -368.893798828125, -354.6563720703125, -340.41888427734375, -326.1814270019531, -311.9439697265625, -297.7065124511719, -283.46905517578125, -269.2315979003906, -254.99412536621094, -240.7566680908203, -226.51922607421875, -212.28176879882812, -198.0443115234375, -183.80685424804688, -169.56939697265625, -155.33193969726562, -141.09446716308594, -126.85700988769531, -112.61955261230469, -98.38209533691406, -84.14463806152344, -69.90717315673828, -55.669715881347656, -41.43225860595703, -27.194793701171875, -12.95733642578125, 1.280120849609375, 15.517580032348633, 29.75503921508789, 43.99250030517578, 58.229957580566406, 72.46741485595703, 86.70487976074219, 100.94233703613281, 115.17979431152344, 129.41725158691406, 143.6547088623047, 157.89218139648438, 172.129638671875, 186.36709594726562, 200.60455322265625, 214.84201049804688, 229.0794677734375, 243.31692504882812, 257.55438232421875, 271.7918395996094, 286.029296875, 300.2667541503906, 314.50421142578125, 328.74169921875, 342.9791259765625, 357.2165832519531, 371.45404052734375, 385.6914978027344, 399.928955078125, 414.1664123535156, 428.40386962890625, 442.641357421875, 456.8788146972656]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 6.0, 1.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 6.0, 2.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-155.1586151123047, -147.841552734375, -140.52447509765625, -133.20741271972656, -125.89035034179688, -118.57328033447266, -111.25621032714844, -103.93914794921875, -96.62207794189453, -89.30500793457031, -81.98794555664062, -74.6708755493164, -67.35380554199219, -60.0367431640625, -52.71967315673828, -45.40260696411133, -38.085540771484375, -30.768474578857422, -23.451406478881836, -16.13433837890625, -8.817272186279297, -1.5002059936523438, 5.816864013671875, 13.133930206298828, 20.45099639892578, 27.768062591552734, 35.08512878417969, 42.402198791503906, 49.71926498413086, 57.03633117675781, 64.35340118408203, 71.67047119140625, 78.987548828125, 86.30461883544922, 93.6216812133789, 100.93875122070312, 108.25581359863281, 115.57288360595703, 122.88995361328125, 130.20701599121094, 137.52407836914062, 144.8411407470703, 152.15821838378906, 159.47528076171875, 166.79234313964844, 174.10940551757812, 181.42648315429688, 188.74354553222656, 196.0606231689453, 203.377685546875, 210.69476318359375, 218.01182556152344, 225.32888793945312, 232.64596557617188, 239.96302795410156, 247.28009033203125, 254.59716796875, 261.91424560546875, 269.2312927246094, 276.5483703613281, 283.8654479980469, 291.1824951171875, 298.49957275390625, 305.816650390625, 313.1336975097656]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 10.0, 12.0, 23.0, 29.0, 38.0, 57.0, 64.0, 117.0, 163.0, 334.0, 714.0, 1649.0, 4337.0, 13760.0, 50224.0, 187431.0, 190102.0, 52120.0, 14777.0, 4812.0, 1727.0, 742.0, 390.0, 201.0, 145.0, 74.0, 60.0, 46.0, 27.0, 16.0, 14.0, 14.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-349.5, -340.3046875, -331.109375, -321.9140625, -312.71875, -303.5234375, -294.328125, -285.1328125, -275.9375, -266.7421875, -257.546875, -248.3515625, -239.15625, -229.9609375, -220.765625, -211.5703125, -202.375, -193.1796875, -183.984375, -174.7890625, -165.59375, -156.3984375, -147.203125, -138.0078125, -128.8125, -119.6171875, -110.421875, -101.2265625, -92.03125, -82.8359375, -73.640625, -64.4453125, -55.25, -46.0546875, -36.859375, -27.6640625, -18.46875, -9.2734375, -0.078125, 9.1171875, 18.3125, 27.5078125, 36.703125, 45.8984375, 55.09375, 64.2890625, 73.484375, 82.6796875, 91.875, 101.0703125, 110.265625, 119.4609375, 128.65625, 137.8515625, 147.046875, 156.2421875, 165.4375, 174.6328125, 183.828125, 193.0234375, 202.21875, 211.4140625, 220.609375, 229.8046875, 239.0]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 7.0, 9.0, 6.0, 9.0, 15.0, 19.0, 22.0, 22.0, 37.0, 37.0, 36.0, 45.0, 62.0, 50.0, 69.0, 70.0, 74.0, 52.0, 64.0, 39.0, 49.0, 39.0, 20.0, 22.0, 29.0, 24.0, 16.0, 16.0, 8.0, 10.0, 8.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.09375, -33.861328125, -32.62890625, -31.396484375, -30.1640625, -28.931640625, -27.69921875, -26.466796875, -25.234375, -24.001953125, -22.76953125, -21.537109375, -20.3046875, -19.072265625, -17.83984375, -16.607421875, -15.375, -14.142578125, -12.91015625, -11.677734375, -10.4453125, -9.212890625, -7.98046875, -6.748046875, -5.515625, -4.283203125, -3.05078125, -1.818359375, -0.5859375, 0.646484375, 1.87890625, 3.111328125, 4.34375, 5.576171875, 6.80859375, 8.041015625, 9.2734375, 10.505859375, 11.73828125, 12.970703125, 14.203125, 15.435546875, 16.66796875, 17.900390625, 19.1328125, 20.365234375, 21.59765625, 22.830078125, 24.0625, 25.294921875, 26.52734375, 27.759765625, 28.9921875, 30.224609375, 31.45703125, 32.689453125, 33.921875, 35.154296875, 36.38671875, 37.619140625, 38.8515625, 40.083984375, 41.31640625, 42.548828125, 43.78125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 11.0, 12.0, 59.0, 127.0, 137.0, 74.0, 22.0, 8.0, 12.0, 5.0, 7.0, 3.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-462.75238037109375, -447.48675537109375, -432.22113037109375, -416.9554748535156, -401.6898498535156, -386.4242248535156, -371.1585693359375, -355.8929443359375, -340.6273193359375, -325.3616943359375, -310.0960693359375, -294.8304138183594, -279.5647888183594, -264.2991638183594, -249.0335235595703, -233.76788330078125, -218.50225830078125, -203.23663330078125, -187.9709930419922, -172.70535278320312, -157.43972778320312, -142.17410278320312, -126.90846252441406, -111.64282989501953, -96.377197265625, -81.11156463623047, -65.84593200683594, -50.580299377441406, -35.314666748046875, -20.049034118652344, -4.7834014892578125, 10.482231140136719, 25.74786376953125, 41.01349639892578, 56.27912902832031, 71.54476165771484, 86.81039428710938, 102.0760269165039, 117.34165954589844, 132.6072998046875, 147.8729248046875, 163.1385498046875, 178.40419006347656, 193.66983032226562, 208.93545532226562, 224.20108032226562, 239.4667205810547, 254.73236083984375, 269.99798583984375, 285.26361083984375, 300.52923583984375, 315.7948913574219, 331.0605163574219, 346.3261413574219, 361.591796875, 376.857421875, 392.123046875, 407.388671875, 422.654296875, 437.9199523925781, 453.1855773925781, 468.4512023925781, 483.71685791015625, 498.98248291015625, 514.2481079101562]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 5.0, 5.0, 5.0, 10.0, 10.0, 6.0, 16.0, 32.0, 82.0, 120.0, 100.0, 34.0, 16.0, 14.0, 4.0, 7.0, 3.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.38954162597656, -212.75387573242188, -204.1182098388672, -195.4825439453125, -186.84686279296875, -178.21121215820312, -169.57553100585938, -160.9398651123047, -152.30419921875, -143.6685333251953, -135.03286743164062, -126.3971939086914, -117.76152801513672, -109.12586212158203, -100.49018859863281, -91.85452270507812, -83.21885681152344, -74.58319091796875, -65.94752502441406, -57.311851501464844, -48.676185607910156, -40.04051971435547, -31.404850006103516, -22.769180297851562, -14.133514404296875, -5.497846603393555, 3.1378211975097656, 11.773488998413086, 20.409156799316406, 29.044822692871094, 37.68049240112305, 46.316162109375, 54.95184326171875, 63.58750915527344, 72.22317504882812, 80.85884857177734, 89.49451446533203, 98.13018035888672, 106.76585388183594, 115.40151977539062, 124.03718566894531, 132.6728515625, 141.3085174560547, 149.94418334960938, 158.57986450195312, 167.21551513671875, 175.8511962890625, 184.4868621826172, 193.12252807617188, 201.75819396972656, 210.39385986328125, 219.02952575683594, 227.66519165039062, 236.30087280273438, 244.93653869628906, 253.57220458984375, 262.2078857421875, 270.84356689453125, 279.4792175292969, 288.1148986816406, 296.75054931640625, 305.38623046875, 314.0218811035156, 322.6575622558594, 331.293212890625]}, "eval/loss": 6.7275872230529785, "eval/wer": 1.4950096235887056, "eval/runtime": 1512.5692, "eval/samples_per_second": 1.747, "eval/steps_per_second": 0.437} \ No newline at end of file +{"train/loss": 6.4331, "train/learning_rate": 2.2647779629448096e-05, "train/epoch": 0.84, "train/global_step": 3000, "_runtime": 12512, "_timestamp": 1646226791, "_step": 3004, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 19.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 30396.0, 61.0, 10.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4632.0, -4527.953125, -4423.90625, -4319.859375, -4215.8125, -4111.765625, -4007.71875, -3903.671875, -3799.625, -3695.578125, -3591.53125, -3487.484375, -3383.4375, -3279.390625, -3175.34375, -3071.296875, -2967.25, -2863.203125, -2759.15625, -2655.109375, -2551.0625, -2447.015625, -2342.96875, -2238.921875, -2134.875, -2030.828125, -1926.78125, -1822.734375, -1718.6875, -1614.640625, -1510.59375, -1406.546875, -1302.5, -1198.453125, -1094.40625, -990.359375, -886.3125, -782.265625, -678.21875, -574.171875, -470.125, -366.078125, -262.03125, -157.984375, -53.9375, 50.109375, 154.15625, 258.203125, 362.25, 466.296875, 570.34375, 674.390625, 778.4375, 882.484375, 986.53125, 1090.578125, 1194.625, 1298.671875, 1402.71875, 1506.765625, 1610.8125, 1714.859375, 1818.90625, 1922.953125, 2027.0]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 10.0, 4.0, 7.0, 17.0, 18.0, 56.0, 76.0, 106.0, 185.0, 162.0, 120.0, 101.0, 48.0, 30.0, 18.0, 7.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2122.14208984375, -2072.442626953125, -2022.7432861328125, -1973.0438232421875, -1923.344482421875, -1873.64501953125, -1823.945556640625, -1774.2462158203125, -1724.546875, -1674.847412109375, -1625.1480712890625, -1575.4486083984375, -1525.749267578125, -1476.0498046875, -1426.350341796875, -1376.6510009765625, -1326.9515380859375, -1277.2520751953125, -1227.552734375, -1177.853271484375, -1128.1539306640625, -1078.4544677734375, -1028.755126953125, -979.0556640625, -929.3562622070312, -879.6568603515625, -829.9574584960938, -780.258056640625, -730.55859375, -680.8592529296875, -631.1597900390625, -581.4603881835938, -531.7608642578125, -482.06146240234375, -432.362060546875, -382.6626281738281, -332.9632263183594, -283.2638244628906, -233.56439208984375, -183.864990234375, -134.16558837890625, -84.46617889404297, -34.76676940917969, 14.932647705078125, 64.63204956054688, 114.33145141601562, 164.0308837890625, 213.73028564453125, 263.4296875, 313.12908935546875, 362.8284912109375, 412.5279235839844, 462.2273254394531, 511.9267272949219, 561.6261596679688, 611.3255615234375, 661.0249633789062, 710.724365234375, 760.4237670898438, 810.1231689453125, 859.8226318359375, 909.52197265625, 959.221435546875, 1008.9208374023438, 1058.6202392578125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 11.0, 6.0, 12.0, 16.0, 11.0, 14.0, 21.0, 25.0, 23.0, 16.0, 32.0, 31.0, 32.0, 43.0, 41.0, 33.0, 33.0, 51.0, 34.0, 37.0, 45.0, 51.0, 39.0, 35.0, 35.0, 29.0, 36.0, 26.0, 30.0, 19.0, 15.0, 19.0, 17.0, 15.0, 9.0, 12.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-624.51416015625, -602.9755249023438, -581.4368896484375, -559.8982543945312, -538.359619140625, -516.821044921875, -495.28240966796875, -473.7437744140625, -452.20513916015625, -430.66650390625, -409.12786865234375, -387.5892639160156, -366.0506286621094, -344.5119934082031, -322.973388671875, -301.43475341796875, -279.8961181640625, -258.35748291015625, -236.81886291503906, -215.28024291992188, -193.74160766601562, -172.20297241210938, -150.6643524169922, -129.125732421875, -107.58709716796875, -86.04846954345703, -64.50984191894531, -42.971214294433594, -21.432586669921875, 0.10604095458984375, 21.644668579101562, 43.18328857421875, 64.721923828125, 86.26055145263672, 107.79917907714844, 129.33779907226562, 150.87643432617188, 172.41506958007812, 193.9536895751953, 215.4923095703125, 237.03094482421875, 258.569580078125, 280.10821533203125, 301.6468200683594, 323.1854553222656, 344.7240905761719, 366.2626953125, 387.80133056640625, 409.3399658203125, 430.87860107421875, 452.417236328125, 473.9558410644531, 495.4944763183594, 517.0330810546875, 538.5717163085938, 560.1103515625, 581.6489868164062, 603.1876220703125, 624.7262573242188, 646.264892578125, 667.803466796875, 689.3421020507812, 710.8807373046875, 732.4193725585938, 753.9580078125]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 8.0, 11.0, 21.0, 25.0, 35.0, 56.0, 80.0, 116.0, 158.0, 218.0, 354.0, 471.0, 636.0, 992.0, 1481.0, 2059.0, 3250.0, 4707.0, 7369.0, 11341.0, 18799.0, 31169.0, 55873.0, 119648.0, 428467.0, 188229.0, 72085.0, 38592.0, 22704.0, 13722.0, 8789.0, 5686.0, 3700.0, 2464.0, 1653.0, 1068.0, 764.0, 512.0, 388.0, 265.0, 170.0, 133.0, 79.0, 59.0, 37.0, 34.0, 18.0, 11.0, 13.0, 12.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-1773.0, -1718.765625, -1664.53125, -1610.296875, -1556.0625, -1501.828125, -1447.59375, -1393.359375, -1339.125, -1284.890625, -1230.65625, -1176.421875, -1122.1875, -1067.953125, -1013.71875, -959.484375, -905.25, -851.015625, -796.78125, -742.546875, -688.3125, -634.078125, -579.84375, -525.609375, -471.375, -417.140625, -362.90625, -308.671875, -254.4375, -200.203125, -145.96875, -91.734375, -37.5, 16.734375, 70.96875, 125.203125, 179.4375, 233.671875, 287.90625, 342.140625, 396.375, 450.609375, 504.84375, 559.078125, 613.3125, 667.546875, 721.78125, 776.015625, 830.25, 884.484375, 938.71875, 992.953125, 1047.1875, 1101.421875, 1155.65625, 1209.890625, 1264.125, 1318.359375, 1372.59375, 1426.828125, 1481.0625, 1535.296875, 1589.53125, 1643.765625, 1698.0]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 9.0, 4.0, 18.0, 13.0, 13.0, 13.0, 12.0, 20.0, 21.0, 26.0, 38.0, 33.0, 49.0, 63.0, 109.0, 151.0, 126.0, 65.0, 32.0, 26.0, 24.0, 17.0, 22.0, 14.0, 18.0, 7.0, 8.0, 14.0, 4.0, 6.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-654.0, -633.921875, -613.84375, -593.765625, -573.6875, -553.609375, -533.53125, -513.453125, -493.375, -473.296875, -453.21875, -433.140625, -413.0625, -392.984375, -372.90625, -352.828125, -332.75, -312.671875, -292.59375, -272.515625, -252.4375, -232.359375, -212.28125, -192.203125, -172.125, -152.046875, -131.96875, -111.890625, -91.8125, -71.734375, -51.65625, -31.578125, -11.5, 8.578125, 28.65625, 48.734375, 68.8125, 88.890625, 108.96875, 129.046875, 149.125, 169.203125, 189.28125, 209.359375, 229.4375, 249.515625, 269.59375, 289.671875, 309.75, 329.828125, 349.90625, 369.984375, 390.0625, 410.140625, 430.21875, 450.296875, 470.375, 490.453125, 510.53125, 530.609375, 550.6875, 570.765625, 590.84375, 610.921875, 631.0]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 6.0, 5.0, 13.0, 21.0, 29.0, 31.0, 31.0, 50.0, 57.0, 85.0, 77.0, 109.0, 76.0, 87.0, 55.0, 55.0, 36.0, 34.0, 20.0, 22.0, 14.0, 13.0, 9.0, 13.0, 6.0, 7.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-420.38818359375, -407.6455383300781, -394.90289306640625, -382.1602478027344, -369.4176025390625, -356.6749572753906, -343.93231201171875, -331.18963623046875, -318.447021484375, -305.7043762207031, -292.96173095703125, -280.2190856933594, -267.4764404296875, -254.73379516601562, -241.9911346435547, -229.2484893798828, -216.50582885742188, -203.76318359375, -191.02053833007812, -178.27789306640625, -165.53524780273438, -152.7926025390625, -140.04994201660156, -127.30729675292969, -114.56465148925781, -101.82200622558594, -89.07936096191406, -76.33670806884766, -63.59406280517578, -50.851417541503906, -38.1087646484375, -25.366119384765625, -12.62347412109375, 0.11917304992675781, 12.861820220947266, 25.604469299316406, 38.34711456298828, 51.089759826660156, 63.83241271972656, 76.57505798339844, 89.31770324707031, 102.06034851074219, 114.80299377441406, 127.54564666748047, 140.28829956054688, 153.03094482421875, 165.77359008789062, 178.5162353515625, 191.25888061523438, 204.00152587890625, 216.74417114257812, 229.48681640625, 242.22946166992188, 254.97210693359375, 267.71478271484375, 280.4573974609375, 293.2000732421875, 305.9427185058594, 318.68536376953125, 331.4280090332031, 344.170654296875, 356.9132995605469, 369.65594482421875, 382.39862060546875, 395.1412353515625]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 6.0, 8.0, 4.0, 13.0, 21.0, 15.0, 27.0, 26.0, 22.0, 35.0, 31.0, 39.0, 20.0, 33.0, 38.0, 30.0, 48.0, 41.0, 42.0, 35.0, 36.0, 39.0, 39.0, 38.0, 33.0, 30.0, 17.0, 37.0, 19.0, 17.0, 23.0, 27.0, 18.0, 8.0, 16.0, 8.0, 3.0, 9.0, 8.0, 5.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-286.638916015625, -277.99169921875, -269.3444519042969, -260.6972351074219, -252.0500030517578, -243.40277099609375, -234.75555419921875, -226.1083221435547, -217.46109008789062, -208.81385803222656, -200.1666259765625, -191.5194091796875, -182.87217712402344, -174.22494506835938, -165.57772827148438, -156.9304962158203, -148.28326416015625, -139.6360321044922, -130.98880004882812, -122.34158325195312, -113.69435119628906, -105.047119140625, -96.39989471435547, -87.75267028808594, -79.10543823242188, -70.45820617675781, -61.81098175048828, -53.163753509521484, -44.51652526855469, -35.86929702758789, -27.222068786621094, -18.574840545654297, -9.9276123046875, -1.2803840637207031, 7.366844177246094, 16.01407241821289, 24.661300659179688, 33.308528900146484, 41.95575714111328, 50.60298538208008, 59.250213623046875, 67.89744567871094, 76.54467010498047, 85.19189453125, 93.83912658691406, 102.48635864257812, 111.13358306884766, 119.78080749511719, 128.42803955078125, 137.0752716064453, 145.72250366210938, 154.36972045898438, 163.01695251464844, 171.6641845703125, 180.3114013671875, 188.95863342285156, 197.60586547851562, 206.2530975341797, 214.90032958984375, 223.54754638671875, 232.1947784423828, 240.84201049804688, 249.48922729492188, 258.136474609375, 266.78369140625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 14.0, 17.0, 22.0, 44.0, 66.0, 86.0, 158.0, 201.0, 350.0, 507.0, 699.0, 1127.0, 1719.0, 2659.0, 4404.0, 7190.0, 12280.0, 22238.0, 41837.0, 85378.0, 211375.0, 1265027.0, 1972747.0, 331615.0, 111230.0, 53185.0, 28344.0, 15908.0, 9148.0, 5366.0, 3282.0, 2111.0, 1321.0, 876.0, 574.0, 378.0, 257.0, 175.0, 106.0, 92.0, 60.0, 27.0, 23.0, 26.0, 11.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-422.25, -409.12109375, -395.9921875, -382.86328125, -369.734375, -356.60546875, -343.4765625, -330.34765625, -317.21875, -304.08984375, -290.9609375, -277.83203125, -264.703125, -251.57421875, -238.4453125, -225.31640625, -212.1875, -199.05859375, -185.9296875, -172.80078125, -159.671875, -146.54296875, -133.4140625, -120.28515625, -107.15625, -94.02734375, -80.8984375, -67.76953125, -54.640625, -41.51171875, -28.3828125, -15.25390625, -2.125, 11.00390625, 24.1328125, 37.26171875, 50.390625, 63.51953125, 76.6484375, 89.77734375, 102.90625, 116.03515625, 129.1640625, 142.29296875, 155.421875, 168.55078125, 181.6796875, 194.80859375, 207.9375, 221.06640625, 234.1953125, 247.32421875, 260.453125, 273.58203125, 286.7109375, 299.83984375, 312.96875, 326.09765625, 339.2265625, 352.35546875, 365.484375, 378.61328125, 391.7421875, 404.87109375, 418.0]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 13.0, 20.0, 17.0, 28.0, 20.0, 15.0, 24.0, 36.0, 24.0, 37.0, 30.0, 38.0, 42.0, 33.0, 48.0, 32.0, 40.0, 41.0, 38.0, 27.0, 33.0, 41.0, 32.0, 40.0, 13.0, 35.0, 24.0, 23.0, 23.0, 17.0, 20.0, 5.0, 10.0, 14.0, 7.0, 6.0, 7.0, 3.0, 5.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-143.0, -138.802734375, -134.60546875, -130.408203125, -126.2109375, -122.013671875, -117.81640625, -113.619140625, -109.421875, -105.224609375, -101.02734375, -96.830078125, -92.6328125, -88.435546875, -84.23828125, -80.041015625, -75.84375, -71.646484375, -67.44921875, -63.251953125, -59.0546875, -54.857421875, -50.66015625, -46.462890625, -42.265625, -38.068359375, -33.87109375, -29.673828125, -25.4765625, -21.279296875, -17.08203125, -12.884765625, -8.6875, -4.490234375, -0.29296875, 3.904296875, 8.1015625, 12.298828125, 16.49609375, 20.693359375, 24.890625, 29.087890625, 33.28515625, 37.482421875, 41.6796875, 45.876953125, 50.07421875, 54.271484375, 58.46875, 62.666015625, 66.86328125, 71.060546875, 75.2578125, 79.455078125, 83.65234375, 87.849609375, 92.046875, 96.244140625, 100.44140625, 104.638671875, 108.8359375, 113.033203125, 117.23046875, 121.427734375, 125.625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 5.0, 8.0, 14.0, 18.0, 31.0, 34.0, 65.0, 68.0, 127.0, 231.0, 309.0, 427.0, 712.0, 1076.0, 1652.0, 2622.0, 4289.0, 7256.0, 12045.0, 21729.0, 40284.0, 77446.0, 164186.0, 397852.0, 1412728.0, 1338837.0, 384071.0, 159529.0, 76100.0, 39117.0, 21140.0, 12168.0, 6893.0, 4211.0, 2632.0, 1573.0, 984.0, 680.0, 384.0, 256.0, 158.0, 85.0, 79.0, 59.0, 40.0, 30.0, 17.0, 13.0, 8.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-273.25, -264.96484375, -256.6796875, -248.39453125, -240.109375, -231.82421875, -223.5390625, -215.25390625, -206.96875, -198.68359375, -190.3984375, -182.11328125, -173.828125, -165.54296875, -157.2578125, -148.97265625, -140.6875, -132.40234375, -124.1171875, -115.83203125, -107.546875, -99.26171875, -90.9765625, -82.69140625, -74.40625, -66.12109375, -57.8359375, -49.55078125, -41.265625, -32.98046875, -24.6953125, -16.41015625, -8.125, 0.16015625, 8.4453125, 16.73046875, 25.015625, 33.30078125, 41.5859375, 49.87109375, 58.15625, 66.44140625, 74.7265625, 83.01171875, 91.296875, 99.58203125, 107.8671875, 116.15234375, 124.4375, 132.72265625, 141.0078125, 149.29296875, 157.578125, 165.86328125, 174.1484375, 182.43359375, 190.71875, 199.00390625, 207.2890625, 215.57421875, 223.859375, 232.14453125, 240.4296875, 248.71484375, 257.0]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 8.0, 8.0, 12.0, 13.0, 24.0, 21.0, 34.0, 40.0, 36.0, 60.0, 75.0, 76.0, 128.0, 165.0, 194.0, 244.0, 377.0, 525.0, 552.0, 357.0, 253.0, 209.0, 134.0, 104.0, 92.0, 73.0, 41.0, 46.0, 26.0, 37.0, 21.0, 11.0, 7.0, 20.0, 6.0, 10.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-92.5, -89.7783203125, -87.056640625, -84.3349609375, -81.61328125, -78.8916015625, -76.169921875, -73.4482421875, -70.7265625, -68.0048828125, -65.283203125, -62.5615234375, -59.83984375, -57.1181640625, -54.396484375, -51.6748046875, -48.953125, -46.2314453125, -43.509765625, -40.7880859375, -38.06640625, -35.3447265625, -32.623046875, -29.9013671875, -27.1796875, -24.4580078125, -21.736328125, -19.0146484375, -16.29296875, -13.5712890625, -10.849609375, -8.1279296875, -5.40625, -2.6845703125, 0.037109375, 2.7587890625, 5.48046875, 8.2021484375, 10.923828125, 13.6455078125, 16.3671875, 19.0888671875, 21.810546875, 24.5322265625, 27.25390625, 29.9755859375, 32.697265625, 35.4189453125, 38.140625, 40.8623046875, 43.583984375, 46.3056640625, 49.02734375, 51.7490234375, 54.470703125, 57.1923828125, 59.9140625, 62.6357421875, 65.357421875, 68.0791015625, 70.80078125, 73.5224609375, 76.244140625, 78.9658203125, 81.6875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 3.0, 10.0, 11.0, 18.0, 33.0, 32.0, 39.0, 49.0, 75.0, 71.0, 96.0, 98.0, 91.0, 86.0, 68.0, 56.0, 36.0, 38.0, 21.0, 14.0, 15.0, 5.0, 11.0, 5.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-291.8419189453125, -283.3953552246094, -274.9488220214844, -266.50225830078125, -258.05572509765625, -249.60916137695312, -241.16259765625, -232.71604919433594, -224.26950073242188, -215.8229522705078, -207.37640380859375, -198.92984008789062, -190.48329162597656, -182.0367431640625, -173.59017944335938, -165.1436309814453, -156.69708251953125, -148.2505340576172, -139.80398559570312, -131.357421875, -122.91087341308594, -114.46432495117188, -106.01776885986328, -97.57121276855469, -89.12466430664062, -80.67811584472656, -72.23155975341797, -63.78500747680664, -55.33845520019531, -46.891902923583984, -38.445350646972656, -29.998798370361328, -21.552230834960938, -13.10567855834961, -4.659126281738281, 3.787425994873047, 12.233978271484375, 20.680530548095703, 29.12708282470703, 37.57363510131836, 46.02018737792969, 54.466739654541016, 62.913291931152344, 71.35984802246094, 79.806396484375, 88.25294494628906, 96.69950103759766, 105.14605712890625, 113.59260559082031, 122.03915405273438, 130.4857177734375, 138.93226623535156, 147.37881469726562, 155.8253631591797, 164.27191162109375, 172.71847534179688, 181.16502380371094, 189.611572265625, 198.05813598632812, 206.5046844482422, 214.95123291015625, 223.3977813720703, 231.84432983398438, 240.2908935546875, 248.73744201660156]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 3.0, 3.0, 6.0, 17.0, 13.0, 18.0, 21.0, 17.0, 18.0, 18.0, 26.0, 29.0, 38.0, 25.0, 39.0, 37.0, 41.0, 33.0, 44.0, 39.0, 36.0, 30.0, 35.0, 44.0, 33.0, 38.0, 42.0, 25.0, 27.0, 18.0, 21.0, 26.0, 19.0, 16.0, 15.0, 10.0, 15.0, 13.0, 10.0, 5.0, 5.0, 5.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-172.21194458007812, -167.1827850341797, -162.15362548828125, -157.12448120117188, -152.09532165527344, -147.066162109375, -142.03700256347656, -137.00784301757812, -131.97869873046875, -126.94953918457031, -121.9203872680664, -116.89122772216797, -111.86207580566406, -106.83291625976562, -101.80375671386719, -96.77459716796875, -91.74543762207031, -86.71627807617188, -81.68712615966797, -76.65796661376953, -71.62881469726562, -66.59965515136719, -61.57049560546875, -56.54133987426758, -51.512184143066406, -46.483028411865234, -41.45387268066406, -36.424713134765625, -31.395557403564453, -26.36640167236328, -21.337244033813477, -16.308086395263672, -11.278915405273438, -6.249758720397949, -1.220602035522461, 3.8085546493530273, 8.837711334228516, 13.866867065429688, 18.896024703979492, 23.925182342529297, 28.95433807373047, 33.98349380493164, 39.01264953613281, 44.04180908203125, 49.07096481323242, 54.100120544433594, 59.12928009033203, 64.15843200683594, 69.18759155273438, 74.21675109863281, 79.24590301513672, 84.27506256103516, 89.30421447753906, 94.3333740234375, 99.36253356933594, 104.39169311523438, 109.42084503173828, 114.45000457763672, 119.47915649414062, 124.50831604003906, 129.5374755859375, 134.56661987304688, 139.5957794189453, 144.62493896484375, 149.6540985107422]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 12.0, 14.0, 21.0, 24.0, 42.0, 75.0, 129.0, 182.0, 283.0, 490.0, 713.0, 1233.0, 2112.0, 3446.0, 5930.0, 10295.0, 18581.0, 34939.0, 67290.0, 138655.0, 281288.0, 241556.0, 116213.0, 57394.0, 29473.0, 16094.0, 9133.0, 5180.0, 2956.0, 1831.0, 1116.0, 657.0, 449.0, 273.0, 158.0, 123.0, 76.0, 41.0, 34.0, 14.0, 13.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-222.0, -215.447265625, -208.89453125, -202.341796875, -195.7890625, -189.236328125, -182.68359375, -176.130859375, -169.578125, -163.025390625, -156.47265625, -149.919921875, -143.3671875, -136.814453125, -130.26171875, -123.708984375, -117.15625, -110.603515625, -104.05078125, -97.498046875, -90.9453125, -84.392578125, -77.83984375, -71.287109375, -64.734375, -58.181640625, -51.62890625, -45.076171875, -38.5234375, -31.970703125, -25.41796875, -18.865234375, -12.3125, -5.759765625, 0.79296875, 7.345703125, 13.8984375, 20.451171875, 27.00390625, 33.556640625, 40.109375, 46.662109375, 53.21484375, 59.767578125, 66.3203125, 72.873046875, 79.42578125, 85.978515625, 92.53125, 99.083984375, 105.63671875, 112.189453125, 118.7421875, 125.294921875, 131.84765625, 138.400390625, 144.953125, 151.505859375, 158.05859375, 164.611328125, 171.1640625, 177.716796875, 184.26953125, 190.822265625, 197.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 10.0, 12.0, 19.0, 15.0, 16.0, 17.0, 25.0, 28.0, 22.0, 42.0, 44.0, 23.0, 32.0, 36.0, 31.0, 34.0, 45.0, 43.0, 34.0, 40.0, 43.0, 37.0, 28.0, 34.0, 33.0, 26.0, 30.0, 22.0, 21.0, 18.0, 20.0, 15.0, 21.0, 12.0, 6.0, 10.0, 4.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.625, -139.9609375, -135.296875, -130.6328125, -125.96875, -121.3046875, -116.640625, -111.9765625, -107.3125, -102.6484375, -97.984375, -93.3203125, -88.65625, -83.9921875, -79.328125, -74.6640625, -70.0, -65.3359375, -60.671875, -56.0078125, -51.34375, -46.6796875, -42.015625, -37.3515625, -32.6875, -28.0234375, -23.359375, -18.6953125, -14.03125, -9.3671875, -4.703125, -0.0390625, 4.625, 9.2890625, 13.953125, 18.6171875, 23.28125, 27.9453125, 32.609375, 37.2734375, 41.9375, 46.6015625, 51.265625, 55.9296875, 60.59375, 65.2578125, 69.921875, 74.5859375, 79.25, 83.9140625, 88.578125, 93.2421875, 97.90625, 102.5703125, 107.234375, 111.8984375, 116.5625, 121.2265625, 125.890625, 130.5546875, 135.21875, 139.8828125, 144.546875, 149.2109375, 153.875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 4.0, 9.0, 22.0, 27.0, 27.0, 52.0, 74.0, 116.0, 142.0, 250.0, 374.0, 512.0, 915.0, 1419.0, 2331.0, 4192.0, 7628.0, 13766.0, 27316.0, 62695.0, 210408.0, 495813.0, 127649.0, 46028.0, 21229.0, 11011.0, 6065.0, 3300.0, 1960.0, 1175.0, 711.0, 425.0, 279.0, 180.0, 133.0, 97.0, 68.0, 44.0, 22.0, 25.0, 16.0, 14.0, 14.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-179.25, -174.02734375, -168.8046875, -163.58203125, -158.359375, -153.13671875, -147.9140625, -142.69140625, -137.46875, -132.24609375, -127.0234375, -121.80078125, -116.578125, -111.35546875, -106.1328125, -100.91015625, -95.6875, -90.46484375, -85.2421875, -80.01953125, -74.796875, -69.57421875, -64.3515625, -59.12890625, -53.90625, -48.68359375, -43.4609375, -38.23828125, -33.015625, -27.79296875, -22.5703125, -17.34765625, -12.125, -6.90234375, -1.6796875, 3.54296875, 8.765625, 13.98828125, 19.2109375, 24.43359375, 29.65625, 34.87890625, 40.1015625, 45.32421875, 50.546875, 55.76953125, 60.9921875, 66.21484375, 71.4375, 76.66015625, 81.8828125, 87.10546875, 92.328125, 97.55078125, 102.7734375, 107.99609375, 113.21875, 118.44140625, 123.6640625, 128.88671875, 134.109375, 139.33203125, 144.5546875, 149.77734375, 155.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 10.0, 5.0, 7.0, 8.0, 16.0, 16.0, 18.0, 13.0, 21.0, 16.0, 20.0, 26.0, 22.0, 34.0, 18.0, 33.0, 35.0, 30.0, 37.0, 34.0, 28.0, 26.0, 34.0, 32.0, 33.0, 30.0, 31.0, 38.0, 33.0, 27.0, 37.0, 26.0, 33.0, 25.0, 16.0, 18.0, 12.0, 12.0, 18.0, 17.0, 7.0, 12.0, 9.0, 4.0, 9.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-119.4375, -115.4423828125, -111.447265625, -107.4521484375, -103.45703125, -99.4619140625, -95.466796875, -91.4716796875, -87.4765625, -83.4814453125, -79.486328125, -75.4912109375, -71.49609375, -67.5009765625, -63.505859375, -59.5107421875, -55.515625, -51.5205078125, -47.525390625, -43.5302734375, -39.53515625, -35.5400390625, -31.544921875, -27.5498046875, -23.5546875, -19.5595703125, -15.564453125, -11.5693359375, -7.57421875, -3.5791015625, 0.416015625, 4.4111328125, 8.40625, 12.4013671875, 16.396484375, 20.3916015625, 24.38671875, 28.3818359375, 32.376953125, 36.3720703125, 40.3671875, 44.3623046875, 48.357421875, 52.3525390625, 56.34765625, 60.3427734375, 64.337890625, 68.3330078125, 72.328125, 76.3232421875, 80.318359375, 84.3134765625, 88.30859375, 92.3037109375, 96.298828125, 100.2939453125, 104.2890625, 108.2841796875, 112.279296875, 116.2744140625, 120.26953125, 124.2646484375, 128.259765625, 132.2548828125, 136.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 16.0, 15.0, 13.0, 34.0, 51.0, 37.0, 74.0, 102.0, 133.0, 222.0, 292.0, 508.0, 705.0, 1110.0, 1724.0, 3109.0, 6350.0, 15837.0, 63854.0, 758871.0, 151230.0, 25426.0, 8622.0, 4037.0, 2183.0, 1299.0, 855.0, 574.0, 375.0, 290.0, 178.0, 126.0, 84.0, 61.0, 32.0, 29.0, 12.0, 13.0, 14.0, 12.0, 9.0, 1.0, 1.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-276.0, -267.29296875, -258.5859375, -249.87890625, -241.171875, -232.46484375, -223.7578125, -215.05078125, -206.34375, -197.63671875, -188.9296875, -180.22265625, -171.515625, -162.80859375, -154.1015625, -145.39453125, -136.6875, -127.98046875, -119.2734375, -110.56640625, -101.859375, -93.15234375, -84.4453125, -75.73828125, -67.03125, -58.32421875, -49.6171875, -40.91015625, -32.203125, -23.49609375, -14.7890625, -6.08203125, 2.625, 11.33203125, 20.0390625, 28.74609375, 37.453125, 46.16015625, 54.8671875, 63.57421875, 72.28125, 80.98828125, 89.6953125, 98.40234375, 107.109375, 115.81640625, 124.5234375, 133.23046875, 141.9375, 150.64453125, 159.3515625, 168.05859375, 176.765625, 185.47265625, 194.1796875, 202.88671875, 211.59375, 220.30078125, 229.0078125, 237.71484375, 246.421875, 255.12890625, 263.8359375, 272.54296875, 281.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 16.0, 13.0, 19.0, 20.0, 42.0, 71.0, 90.0, 106.0, 145.0, 148.0, 111.0, 71.0, 54.0, 41.0, 22.0, 13.0, 5.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.0193326473236084, -0.018859386444091797, -0.018386125564575195, -0.017912864685058594, -0.017439603805541992, -0.01696634292602539, -0.01649308204650879, -0.016019821166992188, -0.015546560287475586, -0.015073299407958984, -0.014600038528442383, -0.014126777648925781, -0.01365351676940918, -0.013180255889892578, -0.012706995010375977, -0.012233734130859375, -0.011760473251342773, -0.011287212371826172, -0.01081395149230957, -0.010340690612792969, -0.009867429733276367, -0.009394168853759766, -0.008920907974243164, -0.008447647094726562, -0.007974386215209961, -0.007501125335693359, -0.007027864456176758, -0.006554603576660156, -0.006081342697143555, -0.005608081817626953, -0.0051348209381103516, -0.00466156005859375, -0.0041882991790771484, -0.003715038299560547, -0.0032417774200439453, -0.0027685165405273438, -0.002295255661010742, -0.0018219947814941406, -0.001348733901977539, -0.0008754730224609375, -0.00040221214294433594, 7.104873657226562e-05, 0.0005443096160888672, 0.0010175704956054688, 0.0014908313751220703, 0.001964092254638672, 0.0024373531341552734, 0.002910614013671875, 0.0033838748931884766, 0.003857135772705078, 0.00433039665222168, 0.004803657531738281, 0.005276918411254883, 0.005750179290771484, 0.006223440170288086, 0.0066967010498046875, 0.007169961929321289, 0.007643222808837891, 0.008116483688354492, 0.008589744567871094, 0.009063005447387695, 0.009536266326904297, 0.010009527206420898, 0.0104827880859375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 17.0, 17.0, 21.0, 32.0, 38.0, 45.0, 82.0, 107.0, 154.0, 201.0, 329.0, 466.0, 838.0, 1599.0, 2947.0, 5950.0, 12867.0, 38022.0, 313260.0, 587986.0, 53003.0, 15629.0, 7002.0, 3414.0, 1797.0, 1029.0, 568.0, 355.0, 236.0, 161.0, 86.0, 86.0, 61.0, 32.0, 32.0, 28.0, 8.0, 11.0, 10.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.25, -311.546875, -300.84375, -290.140625, -279.4375, -268.734375, -258.03125, -247.328125, -236.625, -225.921875, -215.21875, -204.515625, -193.8125, -183.109375, -172.40625, -161.703125, -151.0, -140.296875, -129.59375, -118.890625, -108.1875, -97.484375, -86.78125, -76.078125, -65.375, -54.671875, -43.96875, -33.265625, -22.5625, -11.859375, -1.15625, 9.546875, 20.25, 30.953125, 41.65625, 52.359375, 63.0625, 73.765625, 84.46875, 95.171875, 105.875, 116.578125, 127.28125, 137.984375, 148.6875, 159.390625, 170.09375, 180.796875, 191.5, 202.203125, 212.90625, 223.609375, 234.3125, 245.015625, 255.71875, 266.421875, 277.125, 287.828125, 298.53125, 309.234375, 319.9375, 330.640625, 341.34375, 352.046875, 362.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 5.0, 7.0, 6.0, 8.0, 12.0, 15.0, 13.0, 49.0, 115.0, 260.0, 245.0, 115.0, 52.0, 26.0, 17.0, 12.0, 9.0, 7.0, 7.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.25, -108.39453125, -105.5390625, -102.68359375, -99.828125, -96.97265625, -94.1171875, -91.26171875, -88.40625, -85.55078125, -82.6953125, -79.83984375, -76.984375, -74.12890625, -71.2734375, -68.41796875, -65.5625, -62.70703125, -59.8515625, -56.99609375, -54.140625, -51.28515625, -48.4296875, -45.57421875, -42.71875, -39.86328125, -37.0078125, -34.15234375, -31.296875, -28.44140625, -25.5859375, -22.73046875, -19.875, -17.01953125, -14.1640625, -11.30859375, -8.453125, -5.59765625, -2.7421875, 0.11328125, 2.96875, 5.82421875, 8.6796875, 11.53515625, 14.390625, 17.24609375, 20.1015625, 22.95703125, 25.8125, 28.66796875, 31.5234375, 34.37890625, 37.234375, 40.08984375, 42.9453125, 45.80078125, 48.65625, 51.51171875, 54.3671875, 57.22265625, 60.078125, 62.93359375, 65.7890625, 68.64453125, 71.5]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 10.0, 12.0, 18.0, 21.0, 28.0, 25.0, 34.0, 51.0, 62.0, 81.0, 98.0, 100.0, 98.0, 74.0, 54.0, 38.0, 35.0, 35.0, 30.0, 26.0, 18.0, 10.0, 12.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-258.6842346191406, -251.5355224609375, -244.3867950439453, -237.2380828857422, -230.08935546875, -222.94064331054688, -215.79193115234375, -208.64320373535156, -201.49447631835938, -194.34576416015625, -187.19703674316406, -180.04832458496094, -172.89959716796875, -165.75088500976562, -158.6021728515625, -151.4534454345703, -144.3047332763672, -137.15602111816406, -130.00729370117188, -122.85858154296875, -115.70985412597656, -108.56114196777344, -101.41242218017578, -94.26370239257812, -87.11498260498047, -79.96626281738281, -72.81754302978516, -65.6688232421875, -58.52010726928711, -51.37138748168945, -44.22267150878906, -37.073951721191406, -29.925216674804688, -22.77649688720703, -15.627779006958008, -8.479061126708984, -1.3303413391113281, 5.818378448486328, 12.967094421386719, 20.115814208984375, 27.26453399658203, 34.41325378417969, 41.561973571777344, 48.710689544677734, 55.85940933227539, 63.00812911987305, 70.15684509277344, 77.3055648803711, 84.45428466796875, 91.6030044555664, 98.75172424316406, 105.90043640136719, 113.04916381835938, 120.1978759765625, 127.34659576416016, 134.4953155517578, 141.64404296875, 148.79275512695312, 155.9414825439453, 163.09019470214844, 170.23892211914062, 177.38763427734375, 184.53634643554688, 191.68507385253906, 198.8337860107422]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 8.0, 7.0, 7.0, 13.0, 11.0, 9.0, 18.0, 17.0, 19.0, 20.0, 31.0, 33.0, 28.0, 32.0, 22.0, 29.0, 33.0, 35.0, 44.0, 39.0, 52.0, 52.0, 38.0, 39.0, 35.0, 32.0, 39.0, 28.0, 25.0, 25.0, 21.0, 28.0, 15.0, 21.0, 14.0, 11.0, 13.0, 8.0, 7.0, 8.0, 11.0, 7.0, 0.0, 0.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-153.67152404785156, -149.09848022460938, -144.52545166015625, -139.95240783691406, -135.37936401367188, -130.80633544921875, -126.23329162597656, -121.6602554321289, -117.08721923828125, -112.5141830444336, -107.9411392211914, -103.36810302734375, -98.7950668334961, -94.22203063964844, -89.64898681640625, -85.0759506225586, -80.5029067993164, -75.92987060546875, -71.35682678222656, -66.7837905883789, -62.21075439453125, -57.63771438598633, -53.064674377441406, -48.49163818359375, -43.91859817504883, -39.345558166503906, -34.77252197265625, -30.199481964111328, -25.62644386291504, -21.05340576171875, -16.480365753173828, -11.907329559326172, -7.33428955078125, -2.7612509727478027, 1.8117876052856445, 6.38482666015625, 10.957864761352539, 15.530902862548828, 20.10394287109375, 24.676979064941406, 29.250019073486328, 33.82305908203125, 38.396095275878906, 42.96913528442383, 47.54217529296875, 52.115211486816406, 56.68825149536133, 61.261287689208984, 65.8343276977539, 70.40736389160156, 74.98040771484375, 79.5534439086914, 84.12648010253906, 88.69952392578125, 93.2725601196289, 97.84559631347656, 102.41864013671875, 106.9916763305664, 111.5647201538086, 116.13775634765625, 120.7107925415039, 125.28382873535156, 129.85687255859375, 134.42990112304688, 139.00294494628906]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 3.0, 5.0, 12.0, 9.0, 22.0, 23.0, 45.0, 52.0, 85.0, 135.0, 185.0, 310.0, 550.0, 807.0, 1373.0, 2288.0, 3916.0, 6912.0, 12332.0, 21981.0, 40496.0, 79353.0, 164080.0, 282209.0, 212967.0, 103695.0, 51439.0, 27627.0, 15150.0, 8431.0, 4811.0, 2841.0, 1689.0, 988.0, 600.0, 394.0, 242.0, 138.0, 105.0, 85.0, 49.0, 29.0, 16.0, 18.0, 15.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-303.25, -293.03515625, -282.8203125, -272.60546875, -262.390625, -252.17578125, -241.9609375, -231.74609375, -221.53125, -211.31640625, -201.1015625, -190.88671875, -180.671875, -170.45703125, -160.2421875, -150.02734375, -139.8125, -129.59765625, -119.3828125, -109.16796875, -98.953125, -88.73828125, -78.5234375, -68.30859375, -58.09375, -47.87890625, -37.6640625, -27.44921875, -17.234375, -7.01953125, 3.1953125, 13.41015625, 23.625, 33.83984375, 44.0546875, 54.26953125, 64.484375, 74.69921875, 84.9140625, 95.12890625, 105.34375, 115.55859375, 125.7734375, 135.98828125, 146.203125, 156.41796875, 166.6328125, 176.84765625, 187.0625, 197.27734375, 207.4921875, 217.70703125, 227.921875, 238.13671875, 248.3515625, 258.56640625, 268.78125, 278.99609375, 289.2109375, 299.42578125, 309.640625, 319.85546875, 330.0703125, 340.28515625, 350.5]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 6.0, 11.0, 6.0, 15.0, 14.0, 23.0, 21.0, 23.0, 36.0, 27.0, 37.0, 25.0, 33.0, 30.0, 34.0, 48.0, 41.0, 42.0, 50.0, 31.0, 43.0, 44.0, 45.0, 37.0, 31.0, 29.0, 25.0, 27.0, 21.0, 14.0, 16.0, 18.0, 20.0, 12.0, 13.0, 15.0, 5.0, 3.0, 5.0, 1.0, 4.0, 5.0, 0.0, 6.0, 3.0, 2.0, 2.0], "bins": [-113.375, -110.189453125, -107.00390625, -103.818359375, -100.6328125, -97.447265625, -94.26171875, -91.076171875, -87.890625, -84.705078125, -81.51953125, -78.333984375, -75.1484375, -71.962890625, -68.77734375, -65.591796875, -62.40625, -59.220703125, -56.03515625, -52.849609375, -49.6640625, -46.478515625, -43.29296875, -40.107421875, -36.921875, -33.736328125, -30.55078125, -27.365234375, -24.1796875, -20.994140625, -17.80859375, -14.623046875, -11.4375, -8.251953125, -5.06640625, -1.880859375, 1.3046875, 4.490234375, 7.67578125, 10.861328125, 14.046875, 17.232421875, 20.41796875, 23.603515625, 26.7890625, 29.974609375, 33.16015625, 36.345703125, 39.53125, 42.716796875, 45.90234375, 49.087890625, 52.2734375, 55.458984375, 58.64453125, 61.830078125, 65.015625, 68.201171875, 71.38671875, 74.572265625, 77.7578125, 80.943359375, 84.12890625, 87.314453125, 90.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 4.0, 12.0, 13.0, 11.0, 17.0, 30.0, 37.0, 73.0, 92.0, 170.0, 215.0, 331.0, 549.0, 829.0, 1178.0, 1873.0, 2668.0, 4412.0, 6628.0, 10561.0, 16969.0, 26970.0, 44351.0, 75369.0, 130890.0, 211123.0, 204620.0, 124344.0, 71445.0, 42280.0, 26109.0, 15841.0, 10157.0, 6286.0, 4168.0, 2668.0, 1769.0, 1131.0, 782.0, 513.0, 361.0, 221.0, 165.0, 124.0, 68.0, 40.0, 28.0, 27.0, 17.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-211.875, -205.244140625, -198.61328125, -191.982421875, -185.3515625, -178.720703125, -172.08984375, -165.458984375, -158.828125, -152.197265625, -145.56640625, -138.935546875, -132.3046875, -125.673828125, -119.04296875, -112.412109375, -105.78125, -99.150390625, -92.51953125, -85.888671875, -79.2578125, -72.626953125, -65.99609375, -59.365234375, -52.734375, -46.103515625, -39.47265625, -32.841796875, -26.2109375, -19.580078125, -12.94921875, -6.318359375, 0.3125, 6.943359375, 13.57421875, 20.205078125, 26.8359375, 33.466796875, 40.09765625, 46.728515625, 53.359375, 59.990234375, 66.62109375, 73.251953125, 79.8828125, 86.513671875, 93.14453125, 99.775390625, 106.40625, 113.037109375, 119.66796875, 126.298828125, 132.9296875, 139.560546875, 146.19140625, 152.822265625, 159.453125, 166.083984375, 172.71484375, 179.345703125, 185.9765625, 192.607421875, 199.23828125, 205.869140625, 212.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 4.0, 9.0, 11.0, 5.0, 11.0, 8.0, 18.0, 18.0, 16.0, 18.0, 33.0, 31.0, 31.0, 31.0, 33.0, 23.0, 34.0, 34.0, 43.0, 43.0, 46.0, 41.0, 41.0, 33.0, 38.0, 35.0, 41.0, 40.0, 37.0, 29.0, 29.0, 18.0, 29.0, 18.0, 10.0, 10.0, 15.0, 10.0, 6.0, 4.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -63.9541015625, -61.470703125, -58.9873046875, -56.50390625, -54.0205078125, -51.537109375, -49.0537109375, -46.5703125, -44.0869140625, -41.603515625, -39.1201171875, -36.63671875, -34.1533203125, -31.669921875, -29.1865234375, -26.703125, -24.2197265625, -21.736328125, -19.2529296875, -16.76953125, -14.2861328125, -11.802734375, -9.3193359375, -6.8359375, -4.3525390625, -1.869140625, 0.6142578125, 3.09765625, 5.5810546875, 8.064453125, 10.5478515625, 13.03125, 15.5146484375, 17.998046875, 20.4814453125, 22.96484375, 25.4482421875, 27.931640625, 30.4150390625, 32.8984375, 35.3818359375, 37.865234375, 40.3486328125, 42.83203125, 45.3154296875, 47.798828125, 50.2822265625, 52.765625, 55.2490234375, 57.732421875, 60.2158203125, 62.69921875, 65.1826171875, 67.666015625, 70.1494140625, 72.6328125, 75.1162109375, 77.599609375, 80.0830078125, 82.56640625, 85.0498046875, 87.533203125, 90.0166015625, 92.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 5.0, 13.0, 13.0, 17.0, 20.0, 32.0, 33.0, 44.0, 62.0, 85.0, 104.0, 149.0, 202.0, 282.0, 429.0, 584.0, 825.0, 1323.0, 2047.0, 3605.0, 6665.0, 13751.0, 31118.0, 86917.0, 420840.0, 344732.0, 77394.0, 28900.0, 12526.0, 6329.0, 3453.0, 2036.0, 1272.0, 815.0, 525.0, 362.0, 251.0, 223.0, 137.0, 95.0, 91.0, 65.0, 43.0, 40.0, 26.0, 19.0, 12.0, 10.0, 12.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 3.0], "bins": [-221.125, -214.4140625, -207.703125, -200.9921875, -194.28125, -187.5703125, -180.859375, -174.1484375, -167.4375, -160.7265625, -154.015625, -147.3046875, -140.59375, -133.8828125, -127.171875, -120.4609375, -113.75, -107.0390625, -100.328125, -93.6171875, -86.90625, -80.1953125, -73.484375, -66.7734375, -60.0625, -53.3515625, -46.640625, -39.9296875, -33.21875, -26.5078125, -19.796875, -13.0859375, -6.375, 0.3359375, 7.046875, 13.7578125, 20.46875, 27.1796875, 33.890625, 40.6015625, 47.3125, 54.0234375, 60.734375, 67.4453125, 74.15625, 80.8671875, 87.578125, 94.2890625, 101.0, 107.7109375, 114.421875, 121.1328125, 127.84375, 134.5546875, 141.265625, 147.9765625, 154.6875, 161.3984375, 168.109375, 174.8203125, 181.53125, 188.2421875, 194.953125, 201.6640625, 208.375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 14.0, 27.0, 48.0, 55.0, 96.0, 168.0, 194.0, 132.0, 107.0, 45.0, 31.0, 23.0, 15.0, 7.0, 4.0, 7.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0145263671875, -0.013927459716796875, -0.01332855224609375, -0.012729644775390625, -0.0121307373046875, -0.011531829833984375, -0.01093292236328125, -0.010334014892578125, -0.009735107421875, -0.009136199951171875, -0.00853729248046875, -0.007938385009765625, -0.0073394775390625, -0.006740570068359375, -0.00614166259765625, -0.005542755126953125, -0.00494384765625, -0.004344940185546875, -0.00374603271484375, -0.003147125244140625, -0.0025482177734375, -0.001949310302734375, -0.00135040283203125, -0.000751495361328125, -0.000152587890625, 0.000446319580078125, 0.00104522705078125, 0.001644134521484375, 0.0022430419921875, 0.002841949462890625, 0.00344085693359375, 0.004039764404296875, 0.004638671875, 0.005237579345703125, 0.00583648681640625, 0.006435394287109375, 0.0070343017578125, 0.007633209228515625, 0.00823211669921875, 0.008831024169921875, 0.009429931640625, 0.010028839111328125, 0.01062774658203125, 0.011226654052734375, 0.0118255615234375, 0.012424468994140625, 0.01302337646484375, 0.013622283935546875, 0.01422119140625, 0.014820098876953125, 0.01541900634765625, 0.016017913818359375, 0.0166168212890625, 0.017215728759765625, 0.01781463623046875, 0.018413543701171875, 0.019012451171875, 0.019611358642578125, 0.02021026611328125, 0.020809173583984375, 0.0214080810546875, 0.022006988525390625, 0.02260589599609375, 0.023204803466796875, 0.0238037109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 15.0, 10.0, 18.0, 31.0, 32.0, 49.0, 74.0, 92.0, 159.0, 218.0, 282.0, 459.0, 729.0, 1054.0, 1697.0, 2779.0, 5504.0, 14353.0, 63841.0, 635279.0, 266988.0, 34463.0, 9606.0, 4233.0, 2337.0, 1402.0, 929.0, 598.0, 401.0, 274.0, 196.0, 120.0, 107.0, 65.0, 39.0, 27.0, 24.0, 10.0, 10.0, 13.0, 9.0, 9.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-334.25, -323.74609375, -313.2421875, -302.73828125, -292.234375, -281.73046875, -271.2265625, -260.72265625, -250.21875, -239.71484375, -229.2109375, -218.70703125, -208.203125, -197.69921875, -187.1953125, -176.69140625, -166.1875, -155.68359375, -145.1796875, -134.67578125, -124.171875, -113.66796875, -103.1640625, -92.66015625, -82.15625, -71.65234375, -61.1484375, -50.64453125, -40.140625, -29.63671875, -19.1328125, -8.62890625, 1.875, 12.37890625, 22.8828125, 33.38671875, 43.890625, 54.39453125, 64.8984375, 75.40234375, 85.90625, 96.41015625, 106.9140625, 117.41796875, 127.921875, 138.42578125, 148.9296875, 159.43359375, 169.9375, 180.44140625, 190.9453125, 201.44921875, 211.953125, 222.45703125, 232.9609375, 243.46484375, 253.96875, 264.47265625, 274.9765625, 285.48046875, 295.984375, 306.48828125, 316.9921875, 327.49609375, 338.0]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 5.0, 19.0, 20.0, 41.0, 74.0, 132.0, 155.0, 190.0, 136.0, 86.0, 71.0, 31.0, 11.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.75, -84.0625, -81.375, -78.6875, -76.0, -73.3125, -70.625, -67.9375, -65.25, -62.5625, -59.875, -57.1875, -54.5, -51.8125, -49.125, -46.4375, -43.75, -41.0625, -38.375, -35.6875, -33.0, -30.3125, -27.625, -24.9375, -22.25, -19.5625, -16.875, -14.1875, -11.5, -8.8125, -6.125, -3.4375, -0.75, 1.9375, 4.625, 7.3125, 10.0, 12.6875, 15.375, 18.0625, 20.75, 23.4375, 26.125, 28.8125, 31.5, 34.1875, 36.875, 39.5625, 42.25, 44.9375, 47.625, 50.3125, 53.0, 55.6875, 58.375, 61.0625, 63.75, 66.4375, 69.125, 71.8125, 74.5, 77.1875, 79.875, 82.5625, 85.25]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 14.0, 17.0, 15.0, 35.0, 36.0, 44.0, 54.0, 67.0, 82.0, 98.0, 73.0, 76.0, 52.0, 66.0, 49.0, 31.0, 32.0, 25.0, 19.0, 22.0, 14.0, 10.0, 6.0, 6.0, 3.0, 4.0, 5.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.383544921875, -124.29437255859375, -119.20520782470703, -114.11603546142578, -109.02687072753906, -103.93769836425781, -98.84852600097656, -93.75935363769531, -88.6701889038086, -83.58101654052734, -78.49185180664062, -73.40267944335938, -68.31350708007812, -63.224342346191406, -58.135169982910156, -53.04600143432617, -47.95683288574219, -42.8676643371582, -37.77849578857422, -32.68932342529297, -27.600154876708984, -22.510986328125, -17.421815872192383, -12.332645416259766, -7.243476867675781, -2.1543073654174805, 2.9348621368408203, 8.024031639099121, 13.113201141357422, 18.202369689941406, 23.291540145874023, 28.38071060180664, 33.46986389160156, 38.55903244018555, 43.64820098876953, 48.73737335205078, 53.826541900634766, 58.91571044921875, 64.0048828125, 69.09405517578125, 74.18321990966797, 79.27239227294922, 84.36155700683594, 89.45072937011719, 94.53990173339844, 99.62906646728516, 104.7182388305664, 109.80740356445312, 114.89657592773438, 119.98574829101562, 125.07491302490234, 130.16407775878906, 135.2532501220703, 140.34242248535156, 145.4315948486328, 150.52076721191406, 155.60992431640625, 160.6990966796875, 165.78826904296875, 170.87742614746094, 175.9665985107422, 181.05577087402344, 186.1449432373047, 191.23411560058594, 196.3232879638672]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 8.0, 12.0, 11.0, 11.0, 12.0, 18.0, 19.0, 24.0, 27.0, 30.0, 24.0, 29.0, 40.0, 39.0, 40.0, 37.0, 36.0, 35.0, 41.0, 35.0, 41.0, 35.0, 36.0, 34.0, 37.0, 31.0, 28.0, 31.0, 26.0, 24.0, 17.0, 17.0, 17.0, 14.0, 15.0, 12.0, 7.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.5198974609375, -108.95657348632812, -105.39324951171875, -101.82992553710938, -98.2666015625, -94.70327758789062, -91.13995361328125, -87.5766372680664, -84.01331329345703, -80.44998931884766, -76.88666534423828, -73.3233413696289, -69.76001739501953, -66.19670104980469, -62.63337326049805, -59.07005310058594, -55.5067253112793, -51.94340133666992, -48.38007736206055, -44.81675720214844, -41.25343322753906, -37.69010925292969, -34.12678527832031, -30.56346321105957, -27.000139236450195, -23.43681526184082, -19.873493194580078, -16.310169219970703, -12.746846199035645, -9.183523178100586, -5.620199203491211, -2.0568771362304688, 1.5064468383789062, 5.069769859313965, 8.633092880249023, 12.196416854858398, 15.759739875793457, 19.323062896728516, 22.88638687133789, 26.449708938598633, 30.013032913208008, 33.57635498046875, 37.139678955078125, 40.7030029296875, 44.266326904296875, 47.82965087890625, 51.392974853515625, 54.956295013427734, 58.51961898803711, 62.082942962646484, 65.6462631225586, 69.20958709716797, 72.77291107177734, 76.33623504638672, 79.8995590209961, 83.46288299560547, 87.02620697021484, 90.58953094482422, 94.1528549194336, 97.71617889404297, 101.27950286865234, 104.84281921386719, 108.40614318847656, 111.96946716308594, 115.53279113769531]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 8.0, 7.0, 22.0, 39.0, 38.0, 73.0, 121.0, 177.0, 279.0, 456.0, 711.0, 1202.0, 1782.0, 2971.0, 4811.0, 8122.0, 13066.0, 22408.0, 37737.0, 66550.0, 124517.0, 268654.0, 992597.0, 1711674.0, 525545.0, 187313.0, 94518.0, 52291.0, 30158.0, 17909.0, 10854.0, 6661.0, 4051.0, 2664.0, 1605.0, 992.0, 627.0, 373.0, 259.0, 167.0, 96.0, 53.0, 48.0, 22.0, 21.0, 14.0, 9.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.75, -148.16015625, -143.5703125, -138.98046875, -134.390625, -129.80078125, -125.2109375, -120.62109375, -116.03125, -111.44140625, -106.8515625, -102.26171875, -97.671875, -93.08203125, -88.4921875, -83.90234375, -79.3125, -74.72265625, -70.1328125, -65.54296875, -60.953125, -56.36328125, -51.7734375, -47.18359375, -42.59375, -38.00390625, -33.4140625, -28.82421875, -24.234375, -19.64453125, -15.0546875, -10.46484375, -5.875, -1.28515625, 3.3046875, 7.89453125, 12.484375, 17.07421875, 21.6640625, 26.25390625, 30.84375, 35.43359375, 40.0234375, 44.61328125, 49.203125, 53.79296875, 58.3828125, 62.97265625, 67.5625, 72.15234375, 76.7421875, 81.33203125, 85.921875, 90.51171875, 95.1015625, 99.69140625, 104.28125, 108.87109375, 113.4609375, 118.05078125, 122.640625, 127.23046875, 131.8203125, 136.41015625, 141.0]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 0.0, 2.0, 7.0, 4.0, 4.0, 8.0, 9.0, 11.0, 10.0, 9.0, 18.0, 17.0, 25.0, 27.0, 29.0, 36.0, 31.0, 45.0, 38.0, 45.0, 46.0, 44.0, 52.0, 48.0, 40.0, 37.0, 27.0, 49.0, 44.0, 26.0, 33.0, 31.0, 21.0, 27.0, 24.0, 19.0, 17.0, 10.0, 7.0, 11.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.15625, -59.16943359375, -57.1826171875, -55.19580078125, -53.208984375, -51.22216796875, -49.2353515625, -47.24853515625, -45.26171875, -43.27490234375, -41.2880859375, -39.30126953125, -37.314453125, -35.32763671875, -33.3408203125, -31.35400390625, -29.3671875, -27.38037109375, -25.3935546875, -23.40673828125, -21.419921875, -19.43310546875, -17.4462890625, -15.45947265625, -13.47265625, -11.48583984375, -9.4990234375, -7.51220703125, -5.525390625, -3.53857421875, -1.5517578125, 0.43505859375, 2.421875, 4.40869140625, 6.3955078125, 8.38232421875, 10.369140625, 12.35595703125, 14.3427734375, 16.32958984375, 18.31640625, 20.30322265625, 22.2900390625, 24.27685546875, 26.263671875, 28.25048828125, 30.2373046875, 32.22412109375, 34.2109375, 36.19775390625, 38.1845703125, 40.17138671875, 42.158203125, 44.14501953125, 46.1318359375, 48.11865234375, 50.10546875, 52.09228515625, 54.0791015625, 56.06591796875, 58.052734375, 60.03955078125, 62.0263671875, 64.01318359375, 66.0]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 8.0, 8.0, 12.0, 13.0, 20.0, 38.0, 47.0, 49.0, 103.0, 119.0, 205.0, 284.0, 429.0, 655.0, 986.0, 1497.0, 2265.0, 3517.0, 5695.0, 9188.0, 15269.0, 26827.0, 47743.0, 90588.0, 183202.0, 417671.0, 1168668.0, 1330605.0, 464260.0, 202430.0, 99315.0, 51573.0, 28557.0, 16290.0, 9916.0, 5879.0, 3739.0, 2230.0, 1519.0, 946.0, 630.0, 389.0, 281.0, 202.0, 108.0, 98.0, 80.0, 51.0, 23.0, 16.0, 14.0, 13.0, 10.0, 7.0, 0.0, 2.0, 0.0, 4.0], "bins": [-118.9375, -115.33984375, -111.7421875, -108.14453125, -104.546875, -100.94921875, -97.3515625, -93.75390625, -90.15625, -86.55859375, -82.9609375, -79.36328125, -75.765625, -72.16796875, -68.5703125, -64.97265625, -61.375, -57.77734375, -54.1796875, -50.58203125, -46.984375, -43.38671875, -39.7890625, -36.19140625, -32.59375, -28.99609375, -25.3984375, -21.80078125, -18.203125, -14.60546875, -11.0078125, -7.41015625, -3.8125, -0.21484375, 3.3828125, 6.98046875, 10.578125, 14.17578125, 17.7734375, 21.37109375, 24.96875, 28.56640625, 32.1640625, 35.76171875, 39.359375, 42.95703125, 46.5546875, 50.15234375, 53.75, 57.34765625, 60.9453125, 64.54296875, 68.140625, 71.73828125, 75.3359375, 78.93359375, 82.53125, 86.12890625, 89.7265625, 93.32421875, 96.921875, 100.51953125, 104.1171875, 107.71484375, 111.3125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 1.0, 5.0, 6.0, 9.0, 13.0, 12.0, 22.0, 34.0, 30.0, 46.0, 50.0, 68.0, 79.0, 107.0, 120.0, 152.0, 162.0, 196.0, 231.0, 287.0, 397.0, 414.0, 331.0, 273.0, 205.0, 162.0, 148.0, 107.0, 84.0, 65.0, 52.0, 34.0, 41.0, 25.0, 20.0, 19.0, 10.0, 13.0, 8.0, 15.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.265625, -29.109130859375, -27.95263671875, -26.796142578125, -25.6396484375, -24.483154296875, -23.32666015625, -22.170166015625, -21.013671875, -19.857177734375, -18.70068359375, -17.544189453125, -16.3876953125, -15.231201171875, -14.07470703125, -12.918212890625, -11.76171875, -10.605224609375, -9.44873046875, -8.292236328125, -7.1357421875, -5.979248046875, -4.82275390625, -3.666259765625, -2.509765625, -1.353271484375, -0.19677734375, 0.959716796875, 2.1162109375, 3.272705078125, 4.42919921875, 5.585693359375, 6.7421875, 7.898681640625, 9.05517578125, 10.211669921875, 11.3681640625, 12.524658203125, 13.68115234375, 14.837646484375, 15.994140625, 17.150634765625, 18.30712890625, 19.463623046875, 20.6201171875, 21.776611328125, 22.93310546875, 24.089599609375, 25.24609375, 26.402587890625, 27.55908203125, 28.715576171875, 29.8720703125, 31.028564453125, 32.18505859375, 33.341552734375, 34.498046875, 35.654541015625, 36.81103515625, 37.967529296875, 39.1240234375, 40.280517578125, 41.43701171875, 42.593505859375, 43.75]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 11.0, 8.0, 6.0, 5.0, 8.0, 19.0, 19.0, 34.0, 39.0, 48.0, 63.0, 91.0, 106.0, 94.0, 94.0, 76.0, 71.0, 43.0, 48.0, 20.0, 22.0, 18.0, 13.0, 10.0, 11.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.8041000366211, -122.79422760009766, -118.78435516357422, -114.77447509765625, -110.76460266113281, -106.75473022460938, -102.74485778808594, -98.7349853515625, -94.72511291503906, -90.71524047851562, -86.70536804199219, -82.69549560546875, -78.68561553955078, -74.67574310302734, -70.6658706665039, -66.65599822998047, -62.6461181640625, -58.63624572753906, -54.62636947631836, -50.61649703979492, -46.60662078857422, -42.59674835205078, -38.586875915527344, -34.577003479003906, -30.567127227783203, -26.557252883911133, -22.547378540039062, -18.537506103515625, -14.527631759643555, -10.517757415771484, -6.507884979248047, -2.4980106353759766, 1.5118560791015625, 5.521729946136475, 9.531603813171387, 13.54147720336914, 17.55135154724121, 21.56122589111328, 25.57109832763672, 29.58097267150879, 33.59084701538086, 37.6007194519043, 41.610595703125, 45.62046813964844, 49.630340576171875, 53.64021682739258, 57.650089263916016, 61.65996551513672, 65.66983795166016, 69.6797103881836, 73.68958282470703, 77.699462890625, 81.70933532714844, 85.71920776367188, 89.72908020019531, 93.73895263671875, 97.74882507324219, 101.75869750976562, 105.76856994628906, 109.7784423828125, 113.78832244873047, 117.7981948852539, 121.80806732177734, 125.81793975830078, 129.82781982421875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 6.0, 9.0, 6.0, 10.0, 7.0, 14.0, 18.0, 9.0, 13.0, 12.0, 24.0, 18.0, 26.0, 27.0, 30.0, 31.0, 38.0, 33.0, 29.0, 52.0, 38.0, 32.0, 39.0, 33.0, 35.0, 38.0, 32.0, 38.0, 28.0, 27.0, 26.0, 32.0, 25.0, 25.0, 16.0, 11.0, 20.0, 15.0, 21.0, 11.0, 6.0, 11.0, 7.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.47868347167969, -62.263492584228516, -60.048301696777344, -57.83311080932617, -55.617919921875, -53.40272903442383, -51.187538146972656, -48.972347259521484, -46.75715637207031, -44.54196548461914, -42.32677459716797, -40.1115837097168, -37.896392822265625, -35.68120193481445, -33.46601104736328, -31.25082015991211, -29.035629272460938, -26.820438385009766, -24.605247497558594, -22.390056610107422, -20.17486572265625, -17.959674835205078, -15.744483947753906, -13.529293060302734, -11.314102172851562, -9.09891128540039, -6.883720397949219, -4.668529510498047, -2.453338623046875, -0.23814773559570312, 1.9770431518554688, 4.192234039306641, 6.407417297363281, 8.622608184814453, 10.837799072265625, 13.052989959716797, 15.268180847167969, 17.48337173461914, 19.698562622070312, 21.913753509521484, 24.128944396972656, 26.344135284423828, 28.559326171875, 30.774517059326172, 32.989707946777344, 35.204898834228516, 37.42008972167969, 39.63528060913086, 41.85047149658203, 44.0656623840332, 46.280853271484375, 48.49604415893555, 50.71123504638672, 52.92642593383789, 55.14161682128906, 57.356807708740234, 59.571998596191406, 61.78718948364258, 64.00238037109375, 66.21757507324219, 68.4327621459961, 70.64794921875, 72.86314392089844, 75.07833862304688, 77.29352569580078]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 7.0, 13.0, 8.0, 19.0, 27.0, 48.0, 46.0, 65.0, 105.0, 169.0, 237.0, 312.0, 489.0, 766.0, 1211.0, 1975.0, 3302.0, 5761.0, 10481.0, 19776.0, 38904.0, 78300.0, 174271.0, 358461.0, 185096.0, 82127.0, 40038.0, 20472.0, 10982.0, 5888.0, 3460.0, 2029.0, 1285.0, 799.0, 543.0, 334.0, 230.0, 166.0, 100.0, 81.0, 45.0, 43.0, 32.0, 18.0, 11.0, 7.0, 4.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-91.875, -89.05078125, -86.2265625, -83.40234375, -80.578125, -77.75390625, -74.9296875, -72.10546875, -69.28125, -66.45703125, -63.6328125, -60.80859375, -57.984375, -55.16015625, -52.3359375, -49.51171875, -46.6875, -43.86328125, -41.0390625, -38.21484375, -35.390625, -32.56640625, -29.7421875, -26.91796875, -24.09375, -21.26953125, -18.4453125, -15.62109375, -12.796875, -9.97265625, -7.1484375, -4.32421875, -1.5, 1.32421875, 4.1484375, 6.97265625, 9.796875, 12.62109375, 15.4453125, 18.26953125, 21.09375, 23.91796875, 26.7421875, 29.56640625, 32.390625, 35.21484375, 38.0390625, 40.86328125, 43.6875, 46.51171875, 49.3359375, 52.16015625, 54.984375, 57.80859375, 60.6328125, 63.45703125, 66.28125, 69.10546875, 71.9296875, 74.75390625, 77.578125, 80.40234375, 83.2265625, 86.05078125, 88.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 3.0, 10.0, 8.0, 11.0, 15.0, 11.0, 11.0, 10.0, 21.0, 25.0, 24.0, 22.0, 31.0, 25.0, 29.0, 42.0, 32.0, 45.0, 41.0, 30.0, 40.0, 43.0, 40.0, 34.0, 40.0, 34.0, 37.0, 30.0, 27.0, 30.0, 26.0, 20.0, 24.0, 15.0, 23.0, 14.0, 11.0, 18.0, 10.0, 14.0, 3.0, 1.0, 2.0, 7.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.8125, -67.4892578125, -65.166015625, -62.8427734375, -60.51953125, -58.1962890625, -55.873046875, -53.5498046875, -51.2265625, -48.9033203125, -46.580078125, -44.2568359375, -41.93359375, -39.6103515625, -37.287109375, -34.9638671875, -32.640625, -30.3173828125, -27.994140625, -25.6708984375, -23.34765625, -21.0244140625, -18.701171875, -16.3779296875, -14.0546875, -11.7314453125, -9.408203125, -7.0849609375, -4.76171875, -2.4384765625, -0.115234375, 2.2080078125, 4.53125, 6.8544921875, 9.177734375, 11.5009765625, 13.82421875, 16.1474609375, 18.470703125, 20.7939453125, 23.1171875, 25.4404296875, 27.763671875, 30.0869140625, 32.41015625, 34.7333984375, 37.056640625, 39.3798828125, 41.703125, 44.0263671875, 46.349609375, 48.6728515625, 50.99609375, 53.3193359375, 55.642578125, 57.9658203125, 60.2890625, 62.6123046875, 64.935546875, 67.2587890625, 69.58203125, 71.9052734375, 74.228515625, 76.5517578125, 78.875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 16.0, 22.0, 33.0, 48.0, 72.0, 102.0, 131.0, 212.0, 302.0, 440.0, 698.0, 1153.0, 1783.0, 3119.0, 5369.0, 9141.0, 16962.0, 33294.0, 80744.0, 293931.0, 413697.0, 102399.0, 39929.0, 19483.0, 10490.0, 5886.0, 3456.0, 2054.0, 1232.0, 760.0, 502.0, 352.0, 214.0, 148.0, 106.0, 73.0, 52.0, 38.0, 33.0, 21.0, 19.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.875, -79.474609375, -77.07421875, -74.673828125, -72.2734375, -69.873046875, -67.47265625, -65.072265625, -62.671875, -60.271484375, -57.87109375, -55.470703125, -53.0703125, -50.669921875, -48.26953125, -45.869140625, -43.46875, -41.068359375, -38.66796875, -36.267578125, -33.8671875, -31.466796875, -29.06640625, -26.666015625, -24.265625, -21.865234375, -19.46484375, -17.064453125, -14.6640625, -12.263671875, -9.86328125, -7.462890625, -5.0625, -2.662109375, -0.26171875, 2.138671875, 4.5390625, 6.939453125, 9.33984375, 11.740234375, 14.140625, 16.541015625, 18.94140625, 21.341796875, 23.7421875, 26.142578125, 28.54296875, 30.943359375, 33.34375, 35.744140625, 38.14453125, 40.544921875, 42.9453125, 45.345703125, 47.74609375, 50.146484375, 52.546875, 54.947265625, 57.34765625, 59.748046875, 62.1484375, 64.548828125, 66.94921875, 69.349609375, 71.75]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 15.0, 11.0, 8.0, 6.0, 13.0, 24.0, 16.0, 15.0, 26.0, 29.0, 17.0, 35.0, 30.0, 27.0, 36.0, 31.0, 34.0, 37.0, 26.0, 21.0, 35.0, 48.0, 36.0, 37.0, 28.0, 16.0, 38.0, 37.0, 28.0, 34.0, 26.0, 25.0, 23.0, 17.0, 18.0, 12.0, 18.0, 8.0, 12.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0], "bins": [-79.5625, -77.2939453125, -75.025390625, -72.7568359375, -70.48828125, -68.2197265625, -65.951171875, -63.6826171875, -61.4140625, -59.1455078125, -56.876953125, -54.6083984375, -52.33984375, -50.0712890625, -47.802734375, -45.5341796875, -43.265625, -40.9970703125, -38.728515625, -36.4599609375, -34.19140625, -31.9228515625, -29.654296875, -27.3857421875, -25.1171875, -22.8486328125, -20.580078125, -18.3115234375, -16.04296875, -13.7744140625, -11.505859375, -9.2373046875, -6.96875, -4.7001953125, -2.431640625, -0.1630859375, 2.10546875, 4.3740234375, 6.642578125, 8.9111328125, 11.1796875, 13.4482421875, 15.716796875, 17.9853515625, 20.25390625, 22.5224609375, 24.791015625, 27.0595703125, 29.328125, 31.5966796875, 33.865234375, 36.1337890625, 38.40234375, 40.6708984375, 42.939453125, 45.2080078125, 47.4765625, 49.7451171875, 52.013671875, 54.2822265625, 56.55078125, 58.8193359375, 61.087890625, 63.3564453125, 65.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 7.0, 3.0, 13.0, 8.0, 16.0, 11.0, 27.0, 28.0, 36.0, 40.0, 45.0, 75.0, 96.0, 124.0, 158.0, 184.0, 258.0, 348.0, 402.0, 622.0, 876.0, 1246.0, 2033.0, 3495.0, 6394.0, 14896.0, 52594.0, 610118.0, 288587.0, 38759.0, 12327.0, 5516.0, 3057.0, 1842.0, 1174.0, 783.0, 563.0, 412.0, 318.0, 210.0, 199.0, 147.0, 108.0, 91.0, 84.0, 58.0, 40.0, 41.0, 23.0, 17.0, 16.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-148.75, -143.935546875, -139.12109375, -134.306640625, -129.4921875, -124.677734375, -119.86328125, -115.048828125, -110.234375, -105.419921875, -100.60546875, -95.791015625, -90.9765625, -86.162109375, -81.34765625, -76.533203125, -71.71875, -66.904296875, -62.08984375, -57.275390625, -52.4609375, -47.646484375, -42.83203125, -38.017578125, -33.203125, -28.388671875, -23.57421875, -18.759765625, -13.9453125, -9.130859375, -4.31640625, 0.498046875, 5.3125, 10.126953125, 14.94140625, 19.755859375, 24.5703125, 29.384765625, 34.19921875, 39.013671875, 43.828125, 48.642578125, 53.45703125, 58.271484375, 63.0859375, 67.900390625, 72.71484375, 77.529296875, 82.34375, 87.158203125, 91.97265625, 96.787109375, 101.6015625, 106.416015625, 111.23046875, 116.044921875, 120.859375, 125.673828125, 130.48828125, 135.302734375, 140.1171875, 144.931640625, 149.74609375, 154.560546875, 159.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 17.0, 16.0, 15.0, 32.0, 47.0, 43.0, 79.0, 79.0, 81.0, 113.0, 90.0, 79.0, 60.0, 51.0, 33.0, 35.0, 29.0, 11.0, 21.0, 16.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00653076171875, -0.00633549690246582, -0.006140232086181641, -0.005944967269897461, -0.005749702453613281, -0.0055544376373291016, -0.005359172821044922, -0.005163908004760742, -0.0049686431884765625, -0.004773378372192383, -0.004578113555908203, -0.0043828487396240234, -0.004187583923339844, -0.003992319107055664, -0.0037970542907714844, -0.0036017894744873047, -0.003406524658203125, -0.0032112598419189453, -0.0030159950256347656, -0.002820730209350586, -0.0026254653930664062, -0.0024302005767822266, -0.002234935760498047, -0.002039670944213867, -0.0018444061279296875, -0.0016491413116455078, -0.0014538764953613281, -0.0012586116790771484, -0.0010633468627929688, -0.0008680820465087891, -0.0006728172302246094, -0.0004775524139404297, -0.00028228759765625, -8.702278137207031e-05, 0.00010824203491210938, 0.00030350685119628906, 0.0004987716674804688, 0.0006940364837646484, 0.0008893013000488281, 0.0010845661163330078, 0.0012798309326171875, 0.0014750957489013672, 0.0016703605651855469, 0.0018656253814697266, 0.0020608901977539062, 0.002256155014038086, 0.0024514198303222656, 0.0026466846466064453, 0.002841949462890625, 0.0030372142791748047, 0.0032324790954589844, 0.003427743911743164, 0.0036230087280273438, 0.0038182735443115234, 0.004013538360595703, 0.004208803176879883, 0.0044040679931640625, 0.004599332809448242, 0.004794597625732422, 0.0049898624420166016, 0.005185127258300781, 0.005380392074584961, 0.005575656890869141, 0.00577092170715332, 0.0059661865234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 11.0, 7.0, 14.0, 11.0, 14.0, 25.0, 17.0, 37.0, 47.0, 66.0, 78.0, 126.0, 149.0, 196.0, 282.0, 337.0, 509.0, 682.0, 994.0, 1467.0, 2320.0, 4028.0, 8329.0, 22911.0, 84223.0, 496956.0, 325281.0, 63536.0, 18316.0, 7263.0, 3426.0, 2089.0, 1362.0, 918.0, 701.0, 472.0, 369.0, 256.0, 191.0, 146.0, 101.0, 79.0, 48.0, 44.0, 24.0, 25.0, 21.0, 21.0, 9.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-147.625, -142.84765625, -138.0703125, -133.29296875, -128.515625, -123.73828125, -118.9609375, -114.18359375, -109.40625, -104.62890625, -99.8515625, -95.07421875, -90.296875, -85.51953125, -80.7421875, -75.96484375, -71.1875, -66.41015625, -61.6328125, -56.85546875, -52.078125, -47.30078125, -42.5234375, -37.74609375, -32.96875, -28.19140625, -23.4140625, -18.63671875, -13.859375, -9.08203125, -4.3046875, 0.47265625, 5.25, 10.02734375, 14.8046875, 19.58203125, 24.359375, 29.13671875, 33.9140625, 38.69140625, 43.46875, 48.24609375, 53.0234375, 57.80078125, 62.578125, 67.35546875, 72.1328125, 76.91015625, 81.6875, 86.46484375, 91.2421875, 96.01953125, 100.796875, 105.57421875, 110.3515625, 115.12890625, 119.90625, 124.68359375, 129.4609375, 134.23828125, 139.015625, 143.79296875, 148.5703125, 153.34765625, 158.125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 6.0, 8.0, 9.0, 31.0, 48.0, 80.0, 121.0, 142.0, 155.0, 134.0, 87.0, 80.0, 39.0, 19.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.9375, -40.556640625, -39.17578125, -37.794921875, -36.4140625, -35.033203125, -33.65234375, -32.271484375, -30.890625, -29.509765625, -28.12890625, -26.748046875, -25.3671875, -23.986328125, -22.60546875, -21.224609375, -19.84375, -18.462890625, -17.08203125, -15.701171875, -14.3203125, -12.939453125, -11.55859375, -10.177734375, -8.796875, -7.416015625, -6.03515625, -4.654296875, -3.2734375, -1.892578125, -0.51171875, 0.869140625, 2.25, 3.630859375, 5.01171875, 6.392578125, 7.7734375, 9.154296875, 10.53515625, 11.916015625, 13.296875, 14.677734375, 16.05859375, 17.439453125, 18.8203125, 20.201171875, 21.58203125, 22.962890625, 24.34375, 25.724609375, 27.10546875, 28.486328125, 29.8671875, 31.248046875, 32.62890625, 34.009765625, 35.390625, 36.771484375, 38.15234375, 39.533203125, 40.9140625, 42.294921875, 43.67578125, 45.056640625, 46.4375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 12.0, 11.0, 10.0, 21.0, 20.0, 26.0, 49.0, 56.0, 57.0, 93.0, 117.0, 116.0, 75.0, 78.0, 52.0, 42.0, 36.0, 31.0, 12.0, 14.0, 19.0, 9.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.67796325683594, -123.4287338256836, -119.17950439453125, -114.93026733398438, -110.68103790283203, -106.43180847167969, -102.18257141113281, -97.93334197998047, -93.68411254882812, -89.43488311767578, -85.18565368652344, -80.93641662597656, -76.68718719482422, -72.43795776367188, -68.188720703125, -63.939491271972656, -59.69026184082031, -55.44103240966797, -51.19179916381836, -46.94256591796875, -42.693336486816406, -38.44410705566406, -34.19487380981445, -29.945642471313477, -25.6964111328125, -21.447179794311523, -17.197948455810547, -12.94871711730957, -8.699485778808594, -4.450254440307617, -0.20102310180664062, 4.048208236694336, 8.29742431640625, 12.546655654907227, 16.795886993408203, 21.04511833190918, 25.294349670410156, 29.543581008911133, 33.79281234741211, 38.04204559326172, 42.29127502441406, 46.540504455566406, 50.789737701416016, 55.038970947265625, 59.28820037841797, 63.53742980957031, 67.78666687011719, 72.03589630126953, 76.28512573242188, 80.53435516357422, 84.78358459472656, 89.03282165527344, 93.28205108642578, 97.53128051757812, 101.780517578125, 106.02974700927734, 110.27897644042969, 114.52820587158203, 118.77743530273438, 123.02667236328125, 127.2759017944336, 131.52513122558594, 135.7743682861328, 140.02359008789062, 144.2728271484375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 6.0, 8.0, 11.0, 5.0, 18.0, 9.0, 18.0, 17.0, 11.0, 21.0, 21.0, 36.0, 22.0, 25.0, 36.0, 19.0, 48.0, 30.0, 44.0, 45.0, 49.0, 33.0, 46.0, 25.0, 33.0, 38.0, 36.0, 29.0, 25.0, 30.0, 26.0, 19.0, 14.0, 22.0, 16.0, 17.0, 16.0, 14.0, 14.0, 6.0, 10.0, 3.0, 6.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.49182891845703, -69.17189025878906, -66.8519515991211, -64.53201293945312, -62.212074279785156, -59.89213562011719, -57.57219696044922, -55.25225830078125, -52.93231964111328, -50.61238098144531, -48.292442321777344, -45.972503662109375, -43.652565002441406, -41.33262634277344, -39.01268768310547, -36.6927490234375, -34.3728141784668, -32.05287551879883, -29.73293685913086, -27.41299819946289, -25.093059539794922, -22.773120880126953, -20.453184127807617, -18.13324546813965, -15.81330680847168, -13.493368148803711, -11.173429489135742, -8.85349178314209, -6.533553123474121, -4.213614463806152, -1.8936767578125, 0.42626190185546875, 2.7462005615234375, 5.066139221191406, 7.386077404022217, 9.706015586853027, 12.025954246520996, 14.345892906188965, 16.665830612182617, 18.985769271850586, 21.305707931518555, 23.625646591186523, 25.945585250854492, 28.265522003173828, 30.585460662841797, 32.905399322509766, 35.225337982177734, 37.5452766418457, 39.86521530151367, 42.18515396118164, 44.50509262084961, 46.82503128051758, 49.14496994018555, 51.464908599853516, 53.78484344482422, 56.10478210449219, 58.424720764160156, 60.744659423828125, 63.064598083496094, 65.38453674316406, 67.70447540283203, 70.0244140625, 72.34435272216797, 74.66429138183594, 76.9842300415039]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 21.0, 28.0, 34.0, 60.0, 60.0, 102.0, 164.0, 229.0, 369.0, 543.0, 787.0, 1122.0, 1882.0, 2696.0, 4008.0, 6020.0, 9239.0, 13867.0, 21551.0, 33797.0, 54421.0, 90532.0, 148929.0, 212498.0, 169801.0, 104281.0, 62601.0, 38366.0, 24355.0, 15604.0, 10158.0, 6766.0, 4431.0, 3034.0, 2014.0, 1379.0, 962.0, 605.0, 427.0, 254.0, 190.0, 123.0, 65.0, 50.0, 58.0, 18.0, 18.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-127.875, -123.95703125, -120.0390625, -116.12109375, -112.203125, -108.28515625, -104.3671875, -100.44921875, -96.53125, -92.61328125, -88.6953125, -84.77734375, -80.859375, -76.94140625, -73.0234375, -69.10546875, -65.1875, -61.26953125, -57.3515625, -53.43359375, -49.515625, -45.59765625, -41.6796875, -37.76171875, -33.84375, -29.92578125, -26.0078125, -22.08984375, -18.171875, -14.25390625, -10.3359375, -6.41796875, -2.5, 1.41796875, 5.3359375, 9.25390625, 13.171875, 17.08984375, 21.0078125, 24.92578125, 28.84375, 32.76171875, 36.6796875, 40.59765625, 44.515625, 48.43359375, 52.3515625, 56.26953125, 60.1875, 64.10546875, 68.0234375, 71.94140625, 75.859375, 79.77734375, 83.6953125, 87.61328125, 91.53125, 95.44921875, 99.3671875, 103.28515625, 107.203125, 111.12109375, 115.0390625, 118.95703125, 122.875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 3.0, 2.0, 7.0, 10.0, 10.0, 14.0, 12.0, 18.0, 15.0, 12.0, 23.0, 24.0, 31.0, 41.0, 39.0, 29.0, 32.0, 31.0, 50.0, 40.0, 49.0, 45.0, 50.0, 45.0, 50.0, 37.0, 29.0, 30.0, 21.0, 37.0, 28.0, 20.0, 25.0, 22.0, 24.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.96875, -62.02099609375, -60.0732421875, -58.12548828125, -56.177734375, -54.22998046875, -52.2822265625, -50.33447265625, -48.38671875, -46.43896484375, -44.4912109375, -42.54345703125, -40.595703125, -38.64794921875, -36.7001953125, -34.75244140625, -32.8046875, -30.85693359375, -28.9091796875, -26.96142578125, -25.013671875, -23.06591796875, -21.1181640625, -19.17041015625, -17.22265625, -15.27490234375, -13.3271484375, -11.37939453125, -9.431640625, -7.48388671875, -5.5361328125, -3.58837890625, -1.640625, 0.30712890625, 2.2548828125, 4.20263671875, 6.150390625, 8.09814453125, 10.0458984375, 11.99365234375, 13.94140625, 15.88916015625, 17.8369140625, 19.78466796875, 21.732421875, 23.68017578125, 25.6279296875, 27.57568359375, 29.5234375, 31.47119140625, 33.4189453125, 35.36669921875, 37.314453125, 39.26220703125, 41.2099609375, 43.15771484375, 45.10546875, 47.05322265625, 49.0009765625, 50.94873046875, 52.896484375, 54.84423828125, 56.7919921875, 58.73974609375, 60.6875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 16.0, 22.0, 30.0, 42.0, 54.0, 101.0, 185.0, 214.0, 334.0, 491.0, 694.0, 984.0, 1577.0, 2264.0, 3378.0, 5036.0, 7661.0, 11998.0, 18933.0, 30546.0, 49225.0, 83496.0, 144415.0, 218814.0, 186025.0, 110391.0, 64485.0, 39062.0, 24167.0, 15257.0, 9686.0, 6403.0, 4126.0, 2727.0, 1854.0, 1245.0, 832.0, 538.0, 385.0, 282.0, 185.0, 119.0, 85.0, 63.0, 39.0, 28.0, 27.0, 12.0, 8.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-99.0, -95.78125, -92.5625, -89.34375, -86.125, -82.90625, -79.6875, -76.46875, -73.25, -70.03125, -66.8125, -63.59375, -60.375, -57.15625, -53.9375, -50.71875, -47.5, -44.28125, -41.0625, -37.84375, -34.625, -31.40625, -28.1875, -24.96875, -21.75, -18.53125, -15.3125, -12.09375, -8.875, -5.65625, -2.4375, 0.78125, 4.0, 7.21875, 10.4375, 13.65625, 16.875, 20.09375, 23.3125, 26.53125, 29.75, 32.96875, 36.1875, 39.40625, 42.625, 45.84375, 49.0625, 52.28125, 55.5, 58.71875, 61.9375, 65.15625, 68.375, 71.59375, 74.8125, 78.03125, 81.25, 84.46875, 87.6875, 90.90625, 94.125, 97.34375, 100.5625, 103.78125, 107.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 4.0, 5.0, 4.0, 13.0, 13.0, 12.0, 9.0, 15.0, 13.0, 23.0, 24.0, 20.0, 21.0, 28.0, 36.0, 32.0, 31.0, 31.0, 45.0, 55.0, 51.0, 32.0, 47.0, 42.0, 34.0, 29.0, 36.0, 38.0, 27.0, 25.0, 21.0, 25.0, 30.0, 22.0, 20.0, 14.0, 11.0, 11.0, 8.0, 11.0, 7.0, 8.0, 8.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -34.1318359375, -32.888671875, -31.6455078125, -30.40234375, -29.1591796875, -27.916015625, -26.6728515625, -25.4296875, -24.1865234375, -22.943359375, -21.7001953125, -20.45703125, -19.2138671875, -17.970703125, -16.7275390625, -15.484375, -14.2412109375, -12.998046875, -11.7548828125, -10.51171875, -9.2685546875, -8.025390625, -6.7822265625, -5.5390625, -4.2958984375, -3.052734375, -1.8095703125, -0.56640625, 0.6767578125, 1.919921875, 3.1630859375, 4.40625, 5.6494140625, 6.892578125, 8.1357421875, 9.37890625, 10.6220703125, 11.865234375, 13.1083984375, 14.3515625, 15.5947265625, 16.837890625, 18.0810546875, 19.32421875, 20.5673828125, 21.810546875, 23.0537109375, 24.296875, 25.5400390625, 26.783203125, 28.0263671875, 29.26953125, 30.5126953125, 31.755859375, 32.9990234375, 34.2421875, 35.4853515625, 36.728515625, 37.9716796875, 39.21484375, 40.4580078125, 41.701171875, 42.9443359375, 44.1875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 8.0, 8.0, 12.0, 10.0, 8.0, 19.0, 21.0, 16.0, 40.0, 49.0, 65.0, 88.0, 132.0, 180.0, 253.0, 302.0, 395.0, 590.0, 931.0, 1418.0, 2213.0, 4159.0, 8740.0, 22507.0, 73684.0, 570883.0, 279461.0, 49679.0, 16524.0, 6905.0, 3355.0, 1845.0, 1236.0, 762.0, 566.0, 439.0, 279.0, 181.0, 151.0, 136.0, 72.0, 58.0, 40.0, 27.0, 30.0, 14.0, 19.0, 12.0, 11.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-291.0, -281.86328125, -272.7265625, -263.58984375, -254.453125, -245.31640625, -236.1796875, -227.04296875, -217.90625, -208.76953125, -199.6328125, -190.49609375, -181.359375, -172.22265625, -163.0859375, -153.94921875, -144.8125, -135.67578125, -126.5390625, -117.40234375, -108.265625, -99.12890625, -89.9921875, -80.85546875, -71.71875, -62.58203125, -53.4453125, -44.30859375, -35.171875, -26.03515625, -16.8984375, -7.76171875, 1.375, 10.51171875, 19.6484375, 28.78515625, 37.921875, 47.05859375, 56.1953125, 65.33203125, 74.46875, 83.60546875, 92.7421875, 101.87890625, 111.015625, 120.15234375, 129.2890625, 138.42578125, 147.5625, 156.69921875, 165.8359375, 174.97265625, 184.109375, 193.24609375, 202.3828125, 211.51953125, 220.65625, 229.79296875, 238.9296875, 248.06640625, 257.203125, 266.33984375, 275.4765625, 284.61328125, 293.75]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 21.0, 30.0, 58.0, 94.0, 138.0, 137.0, 176.0, 123.0, 68.0, 44.0, 22.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01025390625, -0.009781837463378906, -0.009309768676757812, -0.008837699890136719, -0.008365631103515625, -0.007893562316894531, -0.0074214935302734375, -0.006949424743652344, -0.00647735595703125, -0.006005287170410156, -0.0055332183837890625, -0.005061149597167969, -0.004589080810546875, -0.004117012023925781, -0.0036449432373046875, -0.0031728744506835938, -0.0027008056640625, -0.0022287368774414062, -0.0017566680908203125, -0.0012845993041992188, -0.000812530517578125, -0.00034046173095703125, 0.0001316070556640625, 0.0006036758422851562, 0.00107574462890625, 0.0015478134155273438, 0.0020198822021484375, 0.0024919509887695312, 0.002964019775390625, 0.0034360885620117188, 0.0039081573486328125, 0.004380226135253906, 0.004852294921875, 0.005324363708496094, 0.0057964324951171875, 0.006268501281738281, 0.006740570068359375, 0.007212638854980469, 0.0076847076416015625, 0.008156776428222656, 0.00862884521484375, 0.009100914001464844, 0.009572982788085938, 0.010045051574707031, 0.010517120361328125, 0.010989189147949219, 0.011461257934570312, 0.011933326721191406, 0.0124053955078125, 0.012877464294433594, 0.013349533081054688, 0.013821601867675781, 0.014293670654296875, 0.014765739440917969, 0.015237808227539062, 0.015709877014160156, 0.01618194580078125, 0.016654014587402344, 0.017126083374023438, 0.01759815216064453, 0.018070220947265625, 0.01854228973388672, 0.019014358520507812, 0.019486427307128906, 0.01995849609375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 14.0, 10.0, 20.0, 30.0, 41.0, 55.0, 79.0, 102.0, 131.0, 214.0, 257.0, 375.0, 557.0, 813.0, 1350.0, 2146.0, 4281.0, 11013.0, 58551.0, 787293.0, 149880.0, 18026.0, 5827.0, 2737.0, 1645.0, 957.0, 656.0, 435.0, 300.0, 218.0, 145.0, 97.0, 77.0, 48.0, 43.0, 28.0, 23.0, 16.0, 11.0, 7.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-326.0, -313.78125, -301.5625, -289.34375, -277.125, -264.90625, -252.6875, -240.46875, -228.25, -216.03125, -203.8125, -191.59375, -179.375, -167.15625, -154.9375, -142.71875, -130.5, -118.28125, -106.0625, -93.84375, -81.625, -69.40625, -57.1875, -44.96875, -32.75, -20.53125, -8.3125, 3.90625, 16.125, 28.34375, 40.5625, 52.78125, 65.0, 77.21875, 89.4375, 101.65625, 113.875, 126.09375, 138.3125, 150.53125, 162.75, 174.96875, 187.1875, 199.40625, 211.625, 223.84375, 236.0625, 248.28125, 260.5, 272.71875, 284.9375, 297.15625, 309.375, 321.59375, 333.8125, 346.03125, 358.25, 370.46875, 382.6875, 394.90625, 407.125, 419.34375, 431.5625, 443.78125, 456.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 16.0, 25.0, 36.0, 74.0, 114.0, 159.0, 180.0, 154.0, 107.0, 47.0, 33.0, 19.0, 6.0, 2.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.375, -91.8564453125, -89.337890625, -86.8193359375, -84.30078125, -81.7822265625, -79.263671875, -76.7451171875, -74.2265625, -71.7080078125, -69.189453125, -66.6708984375, -64.15234375, -61.6337890625, -59.115234375, -56.5966796875, -54.078125, -51.5595703125, -49.041015625, -46.5224609375, -44.00390625, -41.4853515625, -38.966796875, -36.4482421875, -33.9296875, -31.4111328125, -28.892578125, -26.3740234375, -23.85546875, -21.3369140625, -18.818359375, -16.2998046875, -13.78125, -11.2626953125, -8.744140625, -6.2255859375, -3.70703125, -1.1884765625, 1.330078125, 3.8486328125, 6.3671875, 8.8857421875, 11.404296875, 13.9228515625, 16.44140625, 18.9599609375, 21.478515625, 23.9970703125, 26.515625, 29.0341796875, 31.552734375, 34.0712890625, 36.58984375, 39.1083984375, 41.626953125, 44.1455078125, 46.6640625, 49.1826171875, 51.701171875, 54.2197265625, 56.73828125, 59.2568359375, 61.775390625, 64.2939453125, 66.8125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 8.0, 15.0, 17.0, 30.0, 35.0, 47.0, 76.0, 107.0, 119.0, 107.0, 74.0, 86.0, 49.0, 41.0, 25.0, 31.0, 23.0, 12.0, 18.0, 5.0, 7.0, 7.0, 10.0, 3.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.25507354736328, -78.41082763671875, -74.56658172607422, -70.72233581542969, -66.87809753417969, -63.033851623535156, -59.189605712890625, -55.345359802246094, -51.50111770629883, -47.6568717956543, -43.81262969970703, -39.9683837890625, -36.12413787841797, -32.2798957824707, -28.435649871826172, -24.591405868530273, -20.747161865234375, -16.902917861938477, -13.058672904968262, -9.214427947998047, -5.370183944702148, -1.52593994140625, 2.3183059692382812, 6.16254997253418, 10.006793975830078, 13.851037979125977, 17.695281982421875, 21.539527893066406, 25.383771896362305, 29.228015899658203, 33.072261810302734, 36.91650390625, 40.76075744628906, 44.605003356933594, 48.44924545288086, 52.29349136352539, 56.137733459472656, 59.98197937011719, 63.82622528076172, 67.67047119140625, 71.51470947265625, 75.35895538330078, 79.20320129394531, 83.04743957519531, 86.89168548583984, 90.73593139648438, 94.5801773071289, 98.42442321777344, 102.26866912841797, 106.1129150390625, 109.95716094970703, 113.80140686035156, 117.64564514160156, 121.4898910522461, 125.33413696289062, 129.17837524414062, 133.0226287841797, 136.8668670654297, 140.71112060546875, 144.55535888671875, 148.3996124267578, 152.2438507080078, 156.08810424804688, 159.93234252929688, 163.77658081054688]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 4.0, 5.0, 7.0, 18.0, 9.0, 22.0, 15.0, 16.0, 18.0, 17.0, 22.0, 29.0, 43.0, 25.0, 44.0, 39.0, 50.0, 49.0, 43.0, 42.0, 48.0, 40.0, 33.0, 40.0, 45.0, 51.0, 35.0, 27.0, 32.0, 22.0, 20.0, 24.0, 15.0, 10.0, 10.0, 8.0, 11.0, 1.0, 3.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-75.36639404296875, -73.18787384033203, -71.00934600830078, -68.83082580566406, -66.65230560302734, -64.47378540039062, -62.295257568359375, -60.116737365722656, -57.93821716308594, -55.75969314575195, -53.581172943115234, -51.40264892578125, -49.22412872314453, -47.04560470581055, -44.86708068847656, -42.688560485839844, -40.51003646850586, -38.331512451171875, -36.152992248535156, -33.97446823120117, -31.795948028564453, -29.61742401123047, -27.438901901245117, -25.260379791259766, -23.081857681274414, -20.903335571289062, -18.72481346130371, -16.54629135131836, -14.367768287658691, -12.18924617767334, -10.010723114013672, -7.83220100402832, -5.653678894042969, -3.475156545639038, -1.2966341972351074, 0.8818883895874023, 3.060410499572754, 5.2389326095581055, 7.417455673217773, 9.595977783203125, 11.774499893188477, 13.953022003173828, 16.13154411315918, 18.31006622314453, 20.488590240478516, 22.667110443115234, 24.84563446044922, 27.02415657043457, 29.202678680419922, 31.381200790405273, 33.559722900390625, 35.73824691772461, 37.91676712036133, 40.09529113769531, 42.27381134033203, 44.452335357666016, 46.630859375, 48.809383392333984, 50.9879035949707, 53.16642761230469, 55.344947814941406, 57.52347183227539, 59.701995849609375, 61.880516052246094, 64.05903625488281]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 8.0, 5.0, 15.0, 12.0, 21.0, 37.0, 58.0, 82.0, 136.0, 181.0, 249.0, 414.0, 629.0, 965.0, 1488.0, 2064.0, 3432.0, 5163.0, 7923.0, 12877.0, 20627.0, 33902.0, 58625.0, 106007.0, 218129.0, 622104.0, 1670665.0, 875180.0, 266282.0, 121655.0, 65053.0, 37801.0, 22615.0, 13756.0, 8840.0, 5878.0, 3720.0, 2447.0, 1613.0, 1103.0, 758.0, 509.0, 407.0, 262.0, 206.0, 122.0, 79.0, 51.0, 45.0, 26.0, 17.0, 18.0, 14.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-76.0625, -73.4951171875, -70.927734375, -68.3603515625, -65.79296875, -63.2255859375, -60.658203125, -58.0908203125, -55.5234375, -52.9560546875, -50.388671875, -47.8212890625, -45.25390625, -42.6865234375, -40.119140625, -37.5517578125, -34.984375, -32.4169921875, -29.849609375, -27.2822265625, -24.71484375, -22.1474609375, -19.580078125, -17.0126953125, -14.4453125, -11.8779296875, -9.310546875, -6.7431640625, -4.17578125, -1.6083984375, 0.958984375, 3.5263671875, 6.09375, 8.6611328125, 11.228515625, 13.7958984375, 16.36328125, 18.9306640625, 21.498046875, 24.0654296875, 26.6328125, 29.2001953125, 31.767578125, 34.3349609375, 36.90234375, 39.4697265625, 42.037109375, 44.6044921875, 47.171875, 49.7392578125, 52.306640625, 54.8740234375, 57.44140625, 60.0087890625, 62.576171875, 65.1435546875, 67.7109375, 70.2783203125, 72.845703125, 75.4130859375, 77.98046875, 80.5478515625, 83.115234375, 85.6826171875, 88.25]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 15.0, 8.0, 13.0, 19.0, 19.0, 25.0, 35.0, 25.0, 28.0, 24.0, 37.0, 45.0, 33.0, 37.0, 40.0, 46.0, 48.0, 47.0, 43.0, 46.0, 37.0, 37.0, 43.0, 36.0, 34.0, 28.0, 21.0, 16.0, 19.0, 6.0, 14.0, 8.0, 5.0, 13.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-37.0, -35.91552734375, -34.8310546875, -33.74658203125, -32.662109375, -31.57763671875, -30.4931640625, -29.40869140625, -28.32421875, -27.23974609375, -26.1552734375, -25.07080078125, -23.986328125, -22.90185546875, -21.8173828125, -20.73291015625, -19.6484375, -18.56396484375, -17.4794921875, -16.39501953125, -15.310546875, -14.22607421875, -13.1416015625, -12.05712890625, -10.97265625, -9.88818359375, -8.8037109375, -7.71923828125, -6.634765625, -5.55029296875, -4.4658203125, -3.38134765625, -2.296875, -1.21240234375, -0.1279296875, 0.95654296875, 2.041015625, 3.12548828125, 4.2099609375, 5.29443359375, 6.37890625, 7.46337890625, 8.5478515625, 9.63232421875, 10.716796875, 11.80126953125, 12.8857421875, 13.97021484375, 15.0546875, 16.13916015625, 17.2236328125, 18.30810546875, 19.392578125, 20.47705078125, 21.5615234375, 22.64599609375, 23.73046875, 24.81494140625, 25.8994140625, 26.98388671875, 28.068359375, 29.15283203125, 30.2373046875, 31.32177734375, 32.40625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 6.0, 5.0, 6.0, 13.0, 15.0, 18.0, 29.0, 49.0, 45.0, 72.0, 100.0, 131.0, 154.0, 243.0, 298.0, 444.0, 657.0, 935.0, 1381.0, 2100.0, 3368.0, 5708.0, 9923.0, 18781.0, 38687.0, 87469.0, 228177.0, 758607.0, 2036654.0, 643830.0, 200068.0, 78611.0, 35774.0, 17809.0, 9369.0, 5317.0, 3262.0, 2001.0, 1286.0, 889.0, 612.0, 396.0, 283.0, 187.0, 146.0, 104.0, 56.0, 65.0, 42.0, 24.0, 29.0, 22.0, 8.0, 11.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-92.875, -89.9208984375, -86.966796875, -84.0126953125, -81.05859375, -78.1044921875, -75.150390625, -72.1962890625, -69.2421875, -66.2880859375, -63.333984375, -60.3798828125, -57.42578125, -54.4716796875, -51.517578125, -48.5634765625, -45.609375, -42.6552734375, -39.701171875, -36.7470703125, -33.79296875, -30.8388671875, -27.884765625, -24.9306640625, -21.9765625, -19.0224609375, -16.068359375, -13.1142578125, -10.16015625, -7.2060546875, -4.251953125, -1.2978515625, 1.65625, 4.6103515625, 7.564453125, 10.5185546875, 13.47265625, 16.4267578125, 19.380859375, 22.3349609375, 25.2890625, 28.2431640625, 31.197265625, 34.1513671875, 37.10546875, 40.0595703125, 43.013671875, 45.9677734375, 48.921875, 51.8759765625, 54.830078125, 57.7841796875, 60.73828125, 63.6923828125, 66.646484375, 69.6005859375, 72.5546875, 75.5087890625, 78.462890625, 81.4169921875, 84.37109375, 87.3251953125, 90.279296875, 93.2333984375, 96.1875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 0.0, 3.0, 5.0, 9.0, 14.0, 16.0, 28.0, 25.0, 37.0, 41.0, 53.0, 77.0, 95.0, 132.0, 162.0, 171.0, 235.0, 288.0, 325.0, 431.0, 361.0, 344.0, 265.0, 202.0, 169.0, 132.0, 95.0, 68.0, 68.0, 59.0, 38.0, 25.0, 14.0, 17.0, 16.0, 9.0, 11.0, 8.0, 4.0, 5.0, 3.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.544921875, -17.85546875, -17.166015625, -16.4765625, -15.787109375, -15.09765625, -14.408203125, -13.71875, -13.029296875, -12.33984375, -11.650390625, -10.9609375, -10.271484375, -9.58203125, -8.892578125, -8.203125, -7.513671875, -6.82421875, -6.134765625, -5.4453125, -4.755859375, -4.06640625, -3.376953125, -2.6875, -1.998046875, -1.30859375, -0.619140625, 0.0703125, 0.759765625, 1.44921875, 2.138671875, 2.828125, 3.517578125, 4.20703125, 4.896484375, 5.5859375, 6.275390625, 6.96484375, 7.654296875, 8.34375, 9.033203125, 9.72265625, 10.412109375, 11.1015625, 11.791015625, 12.48046875, 13.169921875, 13.859375, 14.548828125, 15.23828125, 15.927734375, 16.6171875, 17.306640625, 17.99609375, 18.685546875, 19.375, 20.064453125, 20.75390625, 21.443359375, 22.1328125, 22.822265625, 23.51171875, 24.201171875, 24.890625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 13.0, 19.0, 14.0, 29.0, 34.0, 42.0, 53.0, 77.0, 98.0, 131.0, 111.0, 95.0, 71.0, 43.0, 38.0, 25.0, 14.0, 18.0, 8.0, 9.0, 7.0, 3.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.93960952758789, -58.42152404785156, -55.90343475341797, -53.38534927368164, -50.86726379394531, -48.34917449951172, -45.83108901977539, -43.31300354003906, -40.79491424560547, -38.27682876586914, -35.75873947143555, -33.24065399169922, -30.72256851196289, -28.20448112487793, -25.68639373779297, -23.16830825805664, -20.650222778320312, -18.13213539123535, -15.614049911499023, -13.095962524414062, -10.577876091003418, -8.059789657592773, -5.5417022705078125, -3.0236167907714844, -0.5055294036865234, 2.0125572681427, 4.530643939971924, 7.048730850219727, 9.566817283630371, 12.084903717041016, 14.602991104125977, 17.121076583862305, 19.63916778564453, 22.157255172729492, 24.67534065246582, 27.19342803955078, 29.71151351928711, 32.22959899902344, 34.74768829345703, 37.26577377319336, 39.78385925292969, 42.301944732666016, 44.82003402709961, 47.33811950683594, 49.856204986572266, 52.374290466308594, 54.89237976074219, 57.410465240478516, 59.92855453491211, 62.44664001464844, 64.96472930908203, 67.48281860351562, 70.00090026855469, 72.51898956298828, 75.03707885742188, 77.55516052246094, 80.07324981689453, 82.59133911132812, 85.10942077636719, 87.62751007080078, 90.14559936523438, 92.66368103027344, 95.18177032470703, 97.69985961914062, 100.21794128417969]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 11.0, 7.0, 6.0, 8.0, 12.0, 25.0, 11.0, 17.0, 17.0, 27.0, 14.0, 20.0, 17.0, 26.0, 23.0, 35.0, 31.0, 32.0, 55.0, 41.0, 40.0, 48.0, 36.0, 35.0, 33.0, 27.0, 40.0, 27.0, 34.0, 31.0, 22.0, 29.0, 20.0, 21.0, 12.0, 20.0, 8.0, 13.0, 11.0, 8.0, 10.0, 11.0, 4.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.36384201049805, -34.25358963012695, -33.14333724975586, -32.03308868408203, -30.922836303710938, -29.812583923339844, -28.70233154296875, -27.592079162597656, -26.481828689575195, -25.3715763092041, -24.26132583618164, -23.151073455810547, -22.040821075439453, -20.930570602416992, -19.8203182220459, -18.710067749023438, -17.599815368652344, -16.48956298828125, -15.379312515258789, -14.269060134887695, -13.158808708190918, -12.04855728149414, -10.938304901123047, -9.82805347442627, -8.717802047729492, -7.607550621032715, -6.497298717498779, -5.387046813964844, -4.276795387268066, -3.166543960571289, -2.0562920570373535, -0.946040153503418, 0.164215087890625, 1.2744667530059814, 2.384718418121338, 3.4949700832366943, 4.605221748352051, 5.715473175048828, 6.825725078582764, 7.935976982116699, 9.046228408813477, 10.156479835510254, 11.266731262207031, 12.376983642578125, 13.487235069274902, 14.59748649597168, 15.707738876342773, 16.817989349365234, 17.928241729736328, 19.038494110107422, 20.148744583129883, 21.258996963500977, 22.369247436523438, 23.47949981689453, 24.589752197265625, 25.70000457763672, 26.81025505065918, 27.920507431030273, 29.030757904052734, 30.141010284423828, 31.251262664794922, 32.36151123046875, 33.471763610839844, 34.58201599121094, 35.69226837158203]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 16.0, 12.0, 25.0, 37.0, 55.0, 62.0, 79.0, 119.0, 153.0, 234.0, 338.0, 460.0, 670.0, 991.0, 1528.0, 2011.0, 3145.0, 4656.0, 7229.0, 11948.0, 20254.0, 36284.0, 70830.0, 160901.0, 359452.0, 188320.0, 79831.0, 40591.0, 22010.0, 12958.0, 7914.0, 4993.0, 3273.0, 2164.0, 1475.0, 990.0, 759.0, 496.0, 374.0, 254.0, 183.0, 130.0, 91.0, 59.0, 60.0, 37.0, 35.0, 20.0, 13.0, 12.0, 6.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0], "bins": [-47.1875, -45.693359375, -44.19921875, -42.705078125, -41.2109375, -39.716796875, -38.22265625, -36.728515625, -35.234375, -33.740234375, -32.24609375, -30.751953125, -29.2578125, -27.763671875, -26.26953125, -24.775390625, -23.28125, -21.787109375, -20.29296875, -18.798828125, -17.3046875, -15.810546875, -14.31640625, -12.822265625, -11.328125, -9.833984375, -8.33984375, -6.845703125, -5.3515625, -3.857421875, -2.36328125, -0.869140625, 0.625, 2.119140625, 3.61328125, 5.107421875, 6.6015625, 8.095703125, 9.58984375, 11.083984375, 12.578125, 14.072265625, 15.56640625, 17.060546875, 18.5546875, 20.048828125, 21.54296875, 23.037109375, 24.53125, 26.025390625, 27.51953125, 29.013671875, 30.5078125, 32.001953125, 33.49609375, 34.990234375, 36.484375, 37.978515625, 39.47265625, 40.966796875, 42.4609375, 43.955078125, 45.44921875, 46.943359375, 48.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 4.0, 6.0, 8.0, 5.0, 5.0, 12.0, 10.0, 17.0, 18.0, 14.0, 23.0, 17.0, 20.0, 22.0, 23.0, 25.0, 33.0, 50.0, 38.0, 51.0, 45.0, 40.0, 38.0, 53.0, 38.0, 46.0, 46.0, 36.0, 32.0, 26.0, 32.0, 16.0, 18.0, 24.0, 11.0, 11.0, 13.0, 15.0, 17.0, 8.0, 10.0, 6.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-47.1875, -45.87744140625, -44.5673828125, -43.25732421875, -41.947265625, -40.63720703125, -39.3271484375, -38.01708984375, -36.70703125, -35.39697265625, -34.0869140625, -32.77685546875, -31.466796875, -30.15673828125, -28.8466796875, -27.53662109375, -26.2265625, -24.91650390625, -23.6064453125, -22.29638671875, -20.986328125, -19.67626953125, -18.3662109375, -17.05615234375, -15.74609375, -14.43603515625, -13.1259765625, -11.81591796875, -10.505859375, -9.19580078125, -7.8857421875, -6.57568359375, -5.265625, -3.95556640625, -2.6455078125, -1.33544921875, -0.025390625, 1.28466796875, 2.5947265625, 3.90478515625, 5.21484375, 6.52490234375, 7.8349609375, 9.14501953125, 10.455078125, 11.76513671875, 13.0751953125, 14.38525390625, 15.6953125, 17.00537109375, 18.3154296875, 19.62548828125, 20.935546875, 22.24560546875, 23.5556640625, 24.86572265625, 26.17578125, 27.48583984375, 28.7958984375, 30.10595703125, 31.416015625, 32.72607421875, 34.0361328125, 35.34619140625, 36.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 11.0, 14.0, 21.0, 16.0, 24.0, 44.0, 71.0, 78.0, 108.0, 161.0, 231.0, 289.0, 441.0, 640.0, 893.0, 1400.0, 2153.0, 3529.0, 6350.0, 12672.0, 29647.0, 94396.0, 578183.0, 225895.0, 50614.0, 18915.0, 8662.0, 4712.0, 2799.0, 1812.0, 1190.0, 807.0, 528.0, 373.0, 254.0, 174.0, 128.0, 99.0, 54.0, 35.0, 32.0, 22.0, 29.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-70.1875, -67.9052734375, -65.623046875, -63.3408203125, -61.05859375, -58.7763671875, -56.494140625, -54.2119140625, -51.9296875, -49.6474609375, -47.365234375, -45.0830078125, -42.80078125, -40.5185546875, -38.236328125, -35.9541015625, -33.671875, -31.3896484375, -29.107421875, -26.8251953125, -24.54296875, -22.2607421875, -19.978515625, -17.6962890625, -15.4140625, -13.1318359375, -10.849609375, -8.5673828125, -6.28515625, -4.0029296875, -1.720703125, 0.5615234375, 2.84375, 5.1259765625, 7.408203125, 9.6904296875, 11.97265625, 14.2548828125, 16.537109375, 18.8193359375, 21.1015625, 23.3837890625, 25.666015625, 27.9482421875, 30.23046875, 32.5126953125, 34.794921875, 37.0771484375, 39.359375, 41.6416015625, 43.923828125, 46.2060546875, 48.48828125, 50.7705078125, 53.052734375, 55.3349609375, 57.6171875, 59.8994140625, 62.181640625, 64.4638671875, 66.74609375, 69.0283203125, 71.310546875, 73.5927734375, 75.875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 3.0, 3.0, 9.0, 14.0, 8.0, 12.0, 13.0, 16.0, 17.0, 24.0, 17.0, 23.0, 23.0, 31.0, 28.0, 44.0, 30.0, 29.0, 37.0, 27.0, 35.0, 55.0, 41.0, 40.0, 33.0, 32.0, 31.0, 31.0, 30.0, 39.0, 26.0, 23.0, 23.0, 25.0, 23.0, 13.0, 12.0, 14.0, 8.0, 15.0, 9.0, 4.0, 8.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-35.8125, -34.70556640625, -33.5986328125, -32.49169921875, -31.384765625, -30.27783203125, -29.1708984375, -28.06396484375, -26.95703125, -25.85009765625, -24.7431640625, -23.63623046875, -22.529296875, -21.42236328125, -20.3154296875, -19.20849609375, -18.1015625, -16.99462890625, -15.8876953125, -14.78076171875, -13.673828125, -12.56689453125, -11.4599609375, -10.35302734375, -9.24609375, -8.13916015625, -7.0322265625, -5.92529296875, -4.818359375, -3.71142578125, -2.6044921875, -1.49755859375, -0.390625, 0.71630859375, 1.8232421875, 2.93017578125, 4.037109375, 5.14404296875, 6.2509765625, 7.35791015625, 8.46484375, 9.57177734375, 10.6787109375, 11.78564453125, 12.892578125, 13.99951171875, 15.1064453125, 16.21337890625, 17.3203125, 18.42724609375, 19.5341796875, 20.64111328125, 21.748046875, 22.85498046875, 23.9619140625, 25.06884765625, 26.17578125, 27.28271484375, 28.3896484375, 29.49658203125, 30.603515625, 31.71044921875, 32.8173828125, 33.92431640625, 35.03125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 7.0, 5.0, 5.0, 4.0, 11.0, 14.0, 17.0, 26.0, 26.0, 50.0, 77.0, 95.0, 120.0, 168.0, 234.0, 307.0, 440.0, 652.0, 927.0, 1194.0, 1801.0, 2686.0, 4055.0, 6633.0, 12172.0, 25481.0, 73999.0, 550597.0, 266633.0, 52329.0, 20532.0, 9906.0, 5747.0, 3618.0, 2334.0, 1551.0, 1197.0, 756.0, 625.0, 442.0, 275.0, 215.0, 173.0, 121.0, 81.0, 68.0, 48.0, 35.0, 14.0, 14.0, 15.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0], "bins": [-64.4375, -62.4765625, -60.515625, -58.5546875, -56.59375, -54.6328125, -52.671875, -50.7109375, -48.75, -46.7890625, -44.828125, -42.8671875, -40.90625, -38.9453125, -36.984375, -35.0234375, -33.0625, -31.1015625, -29.140625, -27.1796875, -25.21875, -23.2578125, -21.296875, -19.3359375, -17.375, -15.4140625, -13.453125, -11.4921875, -9.53125, -7.5703125, -5.609375, -3.6484375, -1.6875, 0.2734375, 2.234375, 4.1953125, 6.15625, 8.1171875, 10.078125, 12.0390625, 14.0, 15.9609375, 17.921875, 19.8828125, 21.84375, 23.8046875, 25.765625, 27.7265625, 29.6875, 31.6484375, 33.609375, 35.5703125, 37.53125, 39.4921875, 41.453125, 43.4140625, 45.375, 47.3359375, 49.296875, 51.2578125, 53.21875, 55.1796875, 57.140625, 59.1015625, 61.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 5.0, 6.0, 9.0, 8.0, 10.0, 10.0, 13.0, 17.0, 25.0, 19.0, 28.0, 32.0, 37.0, 43.0, 53.0, 62.0, 70.0, 65.0, 67.0, 58.0, 50.0, 44.0, 34.0, 29.0, 27.0, 23.0, 32.0, 16.0, 13.0, 18.0, 14.0, 9.0, 6.0, 5.0, 9.0, 6.0, 8.0, 3.0, 3.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019702911376953125, -0.0019056499004364014, -0.0018410086631774902, -0.001776367425918579, -0.001711726188659668, -0.0016470849514007568, -0.0015824437141418457, -0.0015178024768829346, -0.0014531612396240234, -0.0013885200023651123, -0.0013238787651062012, -0.00125923752784729, -0.001194596290588379, -0.0011299550533294678, -0.0010653138160705566, -0.0010006725788116455, -0.0009360313415527344, -0.0008713901042938232, -0.0008067488670349121, -0.000742107629776001, -0.0006774663925170898, -0.0006128251552581787, -0.0005481839179992676, -0.00048354268074035645, -0.0004189014434814453, -0.0003542602062225342, -0.00028961896896362305, -0.00022497773170471191, -0.00016033649444580078, -9.569525718688965e-05, -3.1054019927978516e-05, 3.358721733093262e-05, 9.822845458984375e-05, 0.00016286969184875488, 0.00022751092910766602, 0.00029215216636657715, 0.0003567934036254883, 0.0004214346408843994, 0.00048607587814331055, 0.0005507171154022217, 0.0006153583526611328, 0.0006799995899200439, 0.0007446408271789551, 0.0008092820644378662, 0.0008739233016967773, 0.0009385645389556885, 0.0010032057762145996, 0.0010678470134735107, 0.0011324882507324219, 0.001197129487991333, 0.0012617707252502441, 0.0013264119625091553, 0.0013910531997680664, 0.0014556944370269775, 0.0015203356742858887, 0.0015849769115447998, 0.001649618148803711, 0.001714259386062622, 0.0017789006233215332, 0.0018435418605804443, 0.0019081830978393555, 0.0019728243350982666, 0.0020374655723571777, 0.002102106809616089, 0.002166748046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 21.0, 25.0, 36.0, 63.0, 95.0, 135.0, 231.0, 371.0, 624.0, 1047.0, 1950.0, 3646.0, 6980.0, 14358.0, 31961.0, 88294.0, 389440.0, 363297.0, 85603.0, 31502.0, 13874.0, 6814.0, 3603.0, 1884.0, 1093.0, 615.0, 353.0, 214.0, 134.0, 83.0, 63.0, 37.0, 34.0, 21.0, 9.0, 9.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.25, -67.0849609375, -64.919921875, -62.7548828125, -60.58984375, -58.4248046875, -56.259765625, -54.0947265625, -51.9296875, -49.7646484375, -47.599609375, -45.4345703125, -43.26953125, -41.1044921875, -38.939453125, -36.7744140625, -34.609375, -32.4443359375, -30.279296875, -28.1142578125, -25.94921875, -23.7841796875, -21.619140625, -19.4541015625, -17.2890625, -15.1240234375, -12.958984375, -10.7939453125, -8.62890625, -6.4638671875, -4.298828125, -2.1337890625, 0.03125, 2.1962890625, 4.361328125, 6.5263671875, 8.69140625, 10.8564453125, 13.021484375, 15.1865234375, 17.3515625, 19.5166015625, 21.681640625, 23.8466796875, 26.01171875, 28.1767578125, 30.341796875, 32.5068359375, 34.671875, 36.8369140625, 39.001953125, 41.1669921875, 43.33203125, 45.4970703125, 47.662109375, 49.8271484375, 51.9921875, 54.1572265625, 56.322265625, 58.4873046875, 60.65234375, 62.8173828125, 64.982421875, 67.1474609375, 69.3125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 13.0, 14.0, 18.0, 22.0, 25.0, 19.0, 31.0, 39.0, 48.0, 51.0, 77.0, 88.0, 95.0, 69.0, 59.0, 52.0, 42.0, 39.0, 28.0, 25.0, 19.0, 25.0, 17.0, 16.0, 13.0, 13.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.140625, -8.7945556640625, -8.448486328125, -8.1024169921875, -7.75634765625, -7.4102783203125, -7.064208984375, -6.7181396484375, -6.3720703125, -6.0260009765625, -5.679931640625, -5.3338623046875, -4.98779296875, -4.6417236328125, -4.295654296875, -3.9495849609375, -3.603515625, -3.2574462890625, -2.911376953125, -2.5653076171875, -2.21923828125, -1.8731689453125, -1.527099609375, -1.1810302734375, -0.8349609375, -0.4888916015625, -0.142822265625, 0.2032470703125, 0.54931640625, 0.8953857421875, 1.241455078125, 1.5875244140625, 1.93359375, 2.2796630859375, 2.625732421875, 2.9718017578125, 3.31787109375, 3.6639404296875, 4.010009765625, 4.3560791015625, 4.7021484375, 5.0482177734375, 5.394287109375, 5.7403564453125, 6.08642578125, 6.4324951171875, 6.778564453125, 7.1246337890625, 7.470703125, 7.8167724609375, 8.162841796875, 8.5089111328125, 8.85498046875, 9.2010498046875, 9.547119140625, 9.8931884765625, 10.2392578125, 10.5853271484375, 10.931396484375, 11.2774658203125, 11.62353515625, 11.9696044921875, 12.315673828125, 12.6617431640625, 13.0078125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 12.0, 7.0, 9.0, 17.0, 25.0, 26.0, 44.0, 69.0, 83.0, 107.0, 145.0, 125.0, 86.0, 62.0, 46.0, 28.0, 19.0, 15.0, 12.0, 7.0, 10.0, 4.0, 9.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.72271728515625, -67.87286376953125, -65.02301025390625, -62.173160552978516, -59.32331085205078, -56.47345733642578, -53.62360382080078, -50.77375030517578, -47.92390060424805, -45.07404708862305, -42.22419738769531, -39.37434387207031, -36.52449035644531, -33.67464065551758, -30.824787139892578, -27.97493553161621, -25.125083923339844, -22.275232315063477, -19.42538070678711, -16.57552719116211, -13.725675582885742, -10.875823974609375, -8.025970458984375, -5.176118850708008, -2.3262672424316406, 0.5235848426818848, 3.37343692779541, 6.223289489746094, 9.073141098022461, 11.922992706298828, 14.772846221923828, 17.622697830200195, 20.472549438476562, 23.32240104675293, 26.172252655029297, 29.022106170654297, 31.871957778930664, 34.72180938720703, 37.57166290283203, 40.42151641845703, 43.271366119384766, 46.121219635009766, 48.9710693359375, 51.8209228515625, 54.6707763671875, 57.520626068115234, 60.370479583740234, 63.22032928466797, 66.07018280029297, 68.92003631591797, 71.76988983154297, 74.61973571777344, 77.46958923339844, 80.31944274902344, 83.16929626464844, 86.01914978027344, 88.86900329589844, 91.71885681152344, 94.56871032714844, 97.41856384277344, 100.2684097290039, 103.1182632446289, 105.9681167602539, 108.8179702758789, 111.66781616210938]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 8.0, 11.0, 13.0, 10.0, 8.0, 23.0, 15.0, 23.0, 16.0, 23.0, 18.0, 22.0, 25.0, 43.0, 33.0, 38.0, 28.0, 50.0, 36.0, 41.0, 33.0, 46.0, 37.0, 36.0, 32.0, 27.0, 30.0, 22.0, 21.0, 25.0, 24.0, 21.0, 19.0, 18.0, 19.0, 11.0, 16.0, 11.0, 5.0, 4.0, 7.0, 10.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-37.795108795166016, -36.66645050048828, -35.53779602050781, -34.40913772583008, -33.280479431152344, -32.151824951171875, -31.02316665649414, -29.89451026916504, -28.765853881835938, -27.637197494506836, -26.5085391998291, -25.3798828125, -24.2512264251709, -23.122570037841797, -21.993911743164062, -20.86525535583496, -19.736597061157227, -18.607940673828125, -17.47928237915039, -16.35062599182129, -15.221969604492188, -14.09331226348877, -12.964654922485352, -11.83599853515625, -10.707341194152832, -9.578683853149414, -8.450027465820312, -7.3213701248168945, -6.192713260650635, -5.064056396484375, -3.935399055480957, -2.8067421913146973, -1.6780853271484375, -0.5494283437728882, 0.5792286396026611, 1.7078857421875, 2.8365426063537598, 3.9651994705200195, 5.0938568115234375, 6.222513675689697, 7.351170539855957, 8.479827880859375, 9.608484268188477, 10.737141609191895, 11.865798950195312, 12.994455337524414, 14.123112678527832, 15.25177001953125, 16.38042640686035, 17.509082794189453, 18.637741088867188, 19.76639747619629, 20.89505386352539, 22.023712158203125, 23.152368545532227, 24.281024932861328, 25.409683227539062, 26.538339614868164, 27.6669979095459, 28.795654296875, 29.9243106842041, 31.052967071533203, 32.18162536621094, 33.31028366088867, 34.43893814086914]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 8.0, 14.0, 19.0, 35.0, 46.0, 72.0, 101.0, 146.0, 180.0, 287.0, 413.0, 615.0, 877.0, 1277.0, 1999.0, 3143.0, 4860.0, 7771.0, 12220.0, 20161.0, 32195.0, 52488.0, 86078.0, 140565.0, 207628.0, 180526.0, 112451.0, 69557.0, 42395.0, 26218.0, 16077.0, 10085.0, 6295.0, 4062.0, 2595.0, 1656.0, 1069.0, 691.0, 527.0, 361.0, 240.0, 176.0, 114.0, 75.0, 44.0, 48.0, 27.0, 30.0, 7.0, 7.0, 9.0, 5.0, 5.0, 0.0, 1.0], "bins": [-78.375, -76.0546875, -73.734375, -71.4140625, -69.09375, -66.7734375, -64.453125, -62.1328125, -59.8125, -57.4921875, -55.171875, -52.8515625, -50.53125, -48.2109375, -45.890625, -43.5703125, -41.25, -38.9296875, -36.609375, -34.2890625, -31.96875, -29.6484375, -27.328125, -25.0078125, -22.6875, -20.3671875, -18.046875, -15.7265625, -13.40625, -11.0859375, -8.765625, -6.4453125, -4.125, -1.8046875, 0.515625, 2.8359375, 5.15625, 7.4765625, 9.796875, 12.1171875, 14.4375, 16.7578125, 19.078125, 21.3984375, 23.71875, 26.0390625, 28.359375, 30.6796875, 33.0, 35.3203125, 37.640625, 39.9609375, 42.28125, 44.6015625, 46.921875, 49.2421875, 51.5625, 53.8828125, 56.203125, 58.5234375, 60.84375, 63.1640625, 65.484375, 67.8046875, 70.125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 9.0, 6.0, 6.0, 10.0, 10.0, 20.0, 12.0, 14.0, 21.0, 19.0, 29.0, 27.0, 22.0, 41.0, 28.0, 30.0, 29.0, 33.0, 37.0, 39.0, 36.0, 42.0, 41.0, 38.0, 49.0, 40.0, 29.0, 26.0, 22.0, 40.0, 30.0, 22.0, 17.0, 11.0, 17.0, 18.0, 14.0, 17.0, 5.0, 8.0, 11.0, 6.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-35.1875, -34.1552734375, -33.123046875, -32.0908203125, -31.05859375, -30.0263671875, -28.994140625, -27.9619140625, -26.9296875, -25.8974609375, -24.865234375, -23.8330078125, -22.80078125, -21.7685546875, -20.736328125, -19.7041015625, -18.671875, -17.6396484375, -16.607421875, -15.5751953125, -14.54296875, -13.5107421875, -12.478515625, -11.4462890625, -10.4140625, -9.3818359375, -8.349609375, -7.3173828125, -6.28515625, -5.2529296875, -4.220703125, -3.1884765625, -2.15625, -1.1240234375, -0.091796875, 0.9404296875, 1.97265625, 3.0048828125, 4.037109375, 5.0693359375, 6.1015625, 7.1337890625, 8.166015625, 9.1982421875, 10.23046875, 11.2626953125, 12.294921875, 13.3271484375, 14.359375, 15.3916015625, 16.423828125, 17.4560546875, 18.48828125, 19.5205078125, 20.552734375, 21.5849609375, 22.6171875, 23.6494140625, 24.681640625, 25.7138671875, 26.74609375, 27.7783203125, 28.810546875, 29.8427734375, 30.875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 15.0, 9.0, 20.0, 31.0, 44.0, 64.0, 109.0, 177.0, 247.0, 376.0, 561.0, 870.0, 1312.0, 2042.0, 3195.0, 5083.0, 8476.0, 14059.0, 24764.0, 43771.0, 82524.0, 163631.0, 275619.0, 197833.0, 99987.0, 52098.0, 29056.0, 16633.0, 9733.0, 5981.0, 3625.0, 2237.0, 1477.0, 994.0, 596.0, 409.0, 282.0, 202.0, 129.0, 87.0, 58.0, 38.0, 37.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0], "bins": [-90.1875, -87.6572265625, -85.126953125, -82.5966796875, -80.06640625, -77.5361328125, -75.005859375, -72.4755859375, -69.9453125, -67.4150390625, -64.884765625, -62.3544921875, -59.82421875, -57.2939453125, -54.763671875, -52.2333984375, -49.703125, -47.1728515625, -44.642578125, -42.1123046875, -39.58203125, -37.0517578125, -34.521484375, -31.9912109375, -29.4609375, -26.9306640625, -24.400390625, -21.8701171875, -19.33984375, -16.8095703125, -14.279296875, -11.7490234375, -9.21875, -6.6884765625, -4.158203125, -1.6279296875, 0.90234375, 3.4326171875, 5.962890625, 8.4931640625, 11.0234375, 13.5537109375, 16.083984375, 18.6142578125, 21.14453125, 23.6748046875, 26.205078125, 28.7353515625, 31.265625, 33.7958984375, 36.326171875, 38.8564453125, 41.38671875, 43.9169921875, 46.447265625, 48.9775390625, 51.5078125, 54.0380859375, 56.568359375, 59.0986328125, 61.62890625, 64.1591796875, 66.689453125, 69.2197265625, 71.75]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 10.0, 10.0, 13.0, 4.0, 16.0, 19.0, 26.0, 24.0, 22.0, 27.0, 28.0, 32.0, 33.0, 33.0, 30.0, 26.0, 44.0, 41.0, 35.0, 39.0, 38.0, 46.0, 47.0, 31.0, 33.0, 31.0, 26.0, 25.0, 31.0, 20.0, 17.0, 15.0, 16.0, 16.0, 10.0, 17.0, 9.0, 10.0, 3.0, 7.0, 3.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0], "bins": [-29.0625, -28.242919921875, -27.42333984375, -26.603759765625, -25.7841796875, -24.964599609375, -24.14501953125, -23.325439453125, -22.505859375, -21.686279296875, -20.86669921875, -20.047119140625, -19.2275390625, -18.407958984375, -17.58837890625, -16.768798828125, -15.94921875, -15.129638671875, -14.31005859375, -13.490478515625, -12.6708984375, -11.851318359375, -11.03173828125, -10.212158203125, -9.392578125, -8.572998046875, -7.75341796875, -6.933837890625, -6.1142578125, -5.294677734375, -4.47509765625, -3.655517578125, -2.8359375, -2.016357421875, -1.19677734375, -0.377197265625, 0.4423828125, 1.261962890625, 2.08154296875, 2.901123046875, 3.720703125, 4.540283203125, 5.35986328125, 6.179443359375, 6.9990234375, 7.818603515625, 8.63818359375, 9.457763671875, 10.27734375, 11.096923828125, 11.91650390625, 12.736083984375, 13.5556640625, 14.375244140625, 15.19482421875, 16.014404296875, 16.833984375, 17.653564453125, 18.47314453125, 19.292724609375, 20.1123046875, 20.931884765625, 21.75146484375, 22.571044921875, 23.390625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 23.0, 13.0, 23.0, 22.0, 31.0, 36.0, 61.0, 74.0, 141.0, 180.0, 263.0, 373.0, 609.0, 1115.0, 2178.0, 5503.0, 20731.0, 209966.0, 758386.0, 34694.0, 7785.0, 2865.0, 1335.0, 699.0, 435.0, 325.0, 169.0, 136.0, 108.0, 71.0, 69.0, 41.0, 26.0, 19.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-486.25, -472.01171875, -457.7734375, -443.53515625, -429.296875, -415.05859375, -400.8203125, -386.58203125, -372.34375, -358.10546875, -343.8671875, -329.62890625, -315.390625, -301.15234375, -286.9140625, -272.67578125, -258.4375, -244.19921875, -229.9609375, -215.72265625, -201.484375, -187.24609375, -173.0078125, -158.76953125, -144.53125, -130.29296875, -116.0546875, -101.81640625, -87.578125, -73.33984375, -59.1015625, -44.86328125, -30.625, -16.38671875, -2.1484375, 12.08984375, 26.328125, 40.56640625, 54.8046875, 69.04296875, 83.28125, 97.51953125, 111.7578125, 125.99609375, 140.234375, 154.47265625, 168.7109375, 182.94921875, 197.1875, 211.42578125, 225.6640625, 239.90234375, 254.140625, 268.37890625, 282.6171875, 296.85546875, 311.09375, 325.33203125, 339.5703125, 353.80859375, 368.046875, 382.28515625, 396.5234375, 410.76171875, 425.0]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 8.0, 21.0, 20.0, 33.0, 77.0, 115.0, 180.0, 206.0, 119.0, 72.0, 46.0, 29.0, 20.0, 11.0, 8.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.012204885482788086, -0.011867046356201172, -0.011529207229614258, -0.011191368103027344, -0.01085352897644043, -0.010515689849853516, -0.010177850723266602, -0.009840011596679688, -0.009502172470092773, -0.00916433334350586, -0.008826494216918945, -0.008488655090332031, -0.008150815963745117, -0.007812976837158203, -0.007475137710571289, -0.007137298583984375, -0.006799459457397461, -0.006461620330810547, -0.006123781204223633, -0.005785942077636719, -0.005448102951049805, -0.005110263824462891, -0.0047724246978759766, -0.0044345855712890625, -0.0040967464447021484, -0.0037589073181152344, -0.0034210681915283203, -0.0030832290649414062, -0.002745389938354492, -0.002407550811767578, -0.002069711685180664, -0.00173187255859375, -0.001394033432006836, -0.0010561943054199219, -0.0007183551788330078, -0.00038051605224609375, -4.267692565917969e-05, 0.0002951622009277344, 0.0006330013275146484, 0.0009708404541015625, 0.0013086795806884766, 0.0016465187072753906, 0.0019843578338623047, 0.0023221969604492188, 0.002660036087036133, 0.002997875213623047, 0.003335714340209961, 0.003673553466796875, 0.004011392593383789, 0.004349231719970703, 0.004687070846557617, 0.005024909973144531, 0.005362749099731445, 0.005700588226318359, 0.0060384273529052734, 0.0063762664794921875, 0.0067141056060791016, 0.007051944732666016, 0.00738978385925293, 0.007727622985839844, 0.008065462112426758, 0.008403301239013672, 0.008741140365600586, 0.0090789794921875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 9.0, 9.0, 18.0, 28.0, 39.0, 32.0, 53.0, 58.0, 87.0, 136.0, 158.0, 232.0, 349.0, 455.0, 746.0, 1051.0, 1802.0, 3515.0, 8798.0, 35209.0, 719803.0, 239665.0, 22092.0, 6589.0, 2920.0, 1541.0, 980.0, 603.0, 464.0, 299.0, 204.0, 142.0, 110.0, 82.0, 57.0, 53.0, 42.0, 18.0, 17.0, 23.0, 17.0, 9.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-392.75, -380.0234375, -367.296875, -354.5703125, -341.84375, -329.1171875, -316.390625, -303.6640625, -290.9375, -278.2109375, -265.484375, -252.7578125, -240.03125, -227.3046875, -214.578125, -201.8515625, -189.125, -176.3984375, -163.671875, -150.9453125, -138.21875, -125.4921875, -112.765625, -100.0390625, -87.3125, -74.5859375, -61.859375, -49.1328125, -36.40625, -23.6796875, -10.953125, 1.7734375, 14.5, 27.2265625, 39.953125, 52.6796875, 65.40625, 78.1328125, 90.859375, 103.5859375, 116.3125, 129.0390625, 141.765625, 154.4921875, 167.21875, 179.9453125, 192.671875, 205.3984375, 218.125, 230.8515625, 243.578125, 256.3046875, 269.03125, 281.7578125, 294.484375, 307.2109375, 319.9375, 332.6640625, 345.390625, 358.1171875, 370.84375, 383.5703125, 396.296875, 409.0234375, 421.75]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 9.0, 12.0, 18.0, 56.0, 80.0, 181.0, 230.0, 167.0, 133.0, 48.0, 26.0, 8.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.875, -108.6533203125, -105.431640625, -102.2099609375, -98.98828125, -95.7666015625, -92.544921875, -89.3232421875, -86.1015625, -82.8798828125, -79.658203125, -76.4365234375, -73.21484375, -69.9931640625, -66.771484375, -63.5498046875, -60.328125, -57.1064453125, -53.884765625, -50.6630859375, -47.44140625, -44.2197265625, -40.998046875, -37.7763671875, -34.5546875, -31.3330078125, -28.111328125, -24.8896484375, -21.66796875, -18.4462890625, -15.224609375, -12.0029296875, -8.78125, -5.5595703125, -2.337890625, 0.8837890625, 4.10546875, 7.3271484375, 10.548828125, 13.7705078125, 16.9921875, 20.2138671875, 23.435546875, 26.6572265625, 29.87890625, 33.1005859375, 36.322265625, 39.5439453125, 42.765625, 45.9873046875, 49.208984375, 52.4306640625, 55.65234375, 58.8740234375, 62.095703125, 65.3173828125, 68.5390625, 71.7607421875, 74.982421875, 78.2041015625, 81.42578125, 84.6474609375, 87.869140625, 91.0908203125, 94.3125]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 13.0, 20.0, 39.0, 63.0, 135.0, 198.0, 188.0, 118.0, 61.0, 37.0, 25.0, 25.0, 23.0, 11.0, 9.0, 4.0, 5.0, 7.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.72150421142578, -49.136714935302734, -44.55192565917969, -39.967140197753906, -35.38235092163086, -30.797561645507812, -26.2127742767334, -21.627986907958984, -17.043197631835938, -12.458409309387207, -7.873620986938477, -3.288832664489746, 1.2959556579589844, 5.880744934082031, 10.465532302856445, 15.05031967163086, 19.635108947753906, 24.219898223876953, 28.804685592651367, 33.38947296142578, 37.97426223754883, 42.559051513671875, 47.143836975097656, 51.7286262512207, 56.31341552734375, 60.8982048034668, 65.48299407958984, 70.06777954101562, 74.65257263183594, 79.23735809326172, 83.8221435546875, 88.40693664550781, 92.99172973632812, 97.5765151977539, 102.16130828857422, 106.74609375, 111.33088684082031, 115.9156723022461, 120.50045776367188, 125.08525085449219, 129.6700439453125, 134.2548370361328, 138.83961486816406, 143.42440795898438, 148.0092010498047, 152.593994140625, 157.17877197265625, 161.76356506347656, 166.3483428955078, 170.93313598632812, 175.51791381835938, 180.1027069091797, 184.6875, 189.27227783203125, 193.85707092285156, 198.44186401367188, 203.02664184570312, 207.61143493652344, 212.1962127685547, 216.781005859375, 221.3657989501953, 225.95059204101562, 230.53536987304688, 235.1201629638672, 239.7049560546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 13.0, 9.0, 13.0, 17.0, 16.0, 10.0, 14.0, 15.0, 18.0, 28.0, 27.0, 25.0, 30.0, 48.0, 35.0, 42.0, 28.0, 39.0, 42.0, 47.0, 34.0, 48.0, 32.0, 33.0, 35.0, 30.0, 39.0, 24.0, 22.0, 29.0, 30.0, 17.0, 17.0, 12.0, 13.0, 8.0, 12.0, 12.0, 3.0, 6.0, 7.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-45.45261001586914, -44.18706130981445, -42.92151641845703, -41.655967712402344, -40.39042282104492, -39.124874114990234, -37.85932922363281, -36.593780517578125, -35.32823181152344, -34.06268310546875, -32.79713821411133, -31.531591415405273, -30.26604461669922, -29.00049591064453, -27.734949111938477, -26.469402313232422, -25.203857421875, -23.938310623168945, -22.67276382446289, -21.407217025756836, -20.14167022705078, -18.876121520996094, -17.61057472229004, -16.345027923583984, -15.07948112487793, -13.813934326171875, -12.54838752746582, -11.28283977508545, -10.017292976379395, -8.75174617767334, -7.486198902130127, -6.220651626586914, -4.955104827880859, -3.6895577907562256, -2.424010753631592, -1.158463716506958, 0.10708332061767578, 1.3726301193237305, 2.6381773948669434, 3.9037246704101562, 5.169271469116211, 6.434818267822266, 7.7003655433654785, 8.965912818908691, 10.231459617614746, 11.4970064163208, 12.762554168701172, 14.028100967407227, 15.293647766113281, 16.559194564819336, 17.82474136352539, 19.090288162231445, 20.3558349609375, 21.621383666992188, 22.886930465698242, 24.152477264404297, 25.41802406311035, 26.683570861816406, 27.94911766052246, 29.214664459228516, 30.480213165283203, 31.745758056640625, 33.01130676269531, 34.27685546875, 35.54240036010742]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 9.0, 10.0, 12.0, 24.0, 34.0, 32.0, 68.0, 90.0, 149.0, 205.0, 311.0, 440.0, 668.0, 966.0, 1504.0, 2222.0, 3311.0, 4994.0, 7774.0, 12559.0, 20460.0, 35309.0, 63384.0, 123844.0, 286025.0, 1015646.0, 1702913.0, 517908.0, 187772.0, 89034.0, 47664.0, 26783.0, 15954.0, 9516.0, 5943.0, 3675.0, 2453.0, 1570.0, 988.0, 652.0, 441.0, 325.0, 201.0, 134.0, 111.0, 56.0, 48.0, 29.0, 21.0, 19.0, 6.0, 11.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-64.875, -62.86376953125, -60.8525390625, -58.84130859375, -56.830078125, -54.81884765625, -52.8076171875, -50.79638671875, -48.78515625, -46.77392578125, -44.7626953125, -42.75146484375, -40.740234375, -38.72900390625, -36.7177734375, -34.70654296875, -32.6953125, -30.68408203125, -28.6728515625, -26.66162109375, -24.650390625, -22.63916015625, -20.6279296875, -18.61669921875, -16.60546875, -14.59423828125, -12.5830078125, -10.57177734375, -8.560546875, -6.54931640625, -4.5380859375, -2.52685546875, -0.515625, 1.49560546875, 3.5068359375, 5.51806640625, 7.529296875, 9.54052734375, 11.5517578125, 13.56298828125, 15.57421875, 17.58544921875, 19.5966796875, 21.60791015625, 23.619140625, 25.63037109375, 27.6416015625, 29.65283203125, 31.6640625, 33.67529296875, 35.6865234375, 37.69775390625, 39.708984375, 41.72021484375, 43.7314453125, 45.74267578125, 47.75390625, 49.76513671875, 51.7763671875, 53.78759765625, 55.798828125, 57.81005859375, 59.8212890625, 61.83251953125, 63.84375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 3.0, 2.0, 6.0, 4.0, 6.0, 9.0, 10.0, 11.0, 11.0, 17.0, 19.0, 14.0, 20.0, 22.0, 31.0, 24.0, 18.0, 40.0, 43.0, 35.0, 38.0, 44.0, 42.0, 35.0, 53.0, 36.0, 46.0, 31.0, 27.0, 39.0, 39.0, 26.0, 22.0, 26.0, 25.0, 12.0, 20.0, 20.0, 18.0, 11.0, 8.0, 6.0, 6.0, 7.0, 3.0, 4.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.62109375, -19.9453125, -19.26953125, -18.59375, -17.91796875, -17.2421875, -16.56640625, -15.890625, -15.21484375, -14.5390625, -13.86328125, -13.1875, -12.51171875, -11.8359375, -11.16015625, -10.484375, -9.80859375, -9.1328125, -8.45703125, -7.78125, -7.10546875, -6.4296875, -5.75390625, -5.078125, -4.40234375, -3.7265625, -3.05078125, -2.375, -1.69921875, -1.0234375, -0.34765625, 0.328125, 1.00390625, 1.6796875, 2.35546875, 3.03125, 3.70703125, 4.3828125, 5.05859375, 5.734375, 6.41015625, 7.0859375, 7.76171875, 8.4375, 9.11328125, 9.7890625, 10.46484375, 11.140625, 11.81640625, 12.4921875, 13.16796875, 13.84375, 14.51953125, 15.1953125, 15.87109375, 16.546875, 17.22265625, 17.8984375, 18.57421875, 19.25, 19.92578125, 20.6015625, 21.27734375, 21.953125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 9.0, 12.0, 15.0, 15.0, 27.0, 31.0, 48.0, 64.0, 96.0, 115.0, 174.0, 217.0, 298.0, 467.0, 659.0, 946.0, 1423.0, 2180.0, 3424.0, 5583.0, 9778.0, 18028.0, 35565.0, 80023.0, 212406.0, 767342.0, 2148176.0, 591014.0, 176447.0, 68209.0, 31489.0, 16313.0, 9131.0, 5258.0, 3290.0, 2054.0, 1314.0, 899.0, 571.0, 366.0, 262.0, 181.0, 125.0, 83.0, 60.0, 26.0, 27.0, 17.0, 9.0, 11.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-79.0, -76.76904296875, -74.5380859375, -72.30712890625, -70.076171875, -67.84521484375, -65.6142578125, -63.38330078125, -61.15234375, -58.92138671875, -56.6904296875, -54.45947265625, -52.228515625, -49.99755859375, -47.7666015625, -45.53564453125, -43.3046875, -41.07373046875, -38.8427734375, -36.61181640625, -34.380859375, -32.14990234375, -29.9189453125, -27.68798828125, -25.45703125, -23.22607421875, -20.9951171875, -18.76416015625, -16.533203125, -14.30224609375, -12.0712890625, -9.84033203125, -7.609375, -5.37841796875, -3.1474609375, -0.91650390625, 1.314453125, 3.54541015625, 5.7763671875, 8.00732421875, 10.23828125, 12.46923828125, 14.7001953125, 16.93115234375, 19.162109375, 21.39306640625, 23.6240234375, 25.85498046875, 28.0859375, 30.31689453125, 32.5478515625, 34.77880859375, 37.009765625, 39.24072265625, 41.4716796875, 43.70263671875, 45.93359375, 48.16455078125, 50.3955078125, 52.62646484375, 54.857421875, 57.08837890625, 59.3193359375, 61.55029296875, 63.78125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 9.0, 4.0, 17.0, 25.0, 18.0, 35.0, 43.0, 46.0, 74.0, 85.0, 124.0, 124.0, 169.0, 192.0, 246.0, 320.0, 367.0, 346.0, 372.0, 288.0, 207.0, 191.0, 169.0, 106.0, 80.0, 83.0, 57.0, 45.0, 51.0, 22.0, 31.0, 19.0, 9.0, 16.0, 11.0, 8.0, 10.0, 12.0, 7.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-14.4140625, -13.954833984375, -13.49560546875, -13.036376953125, -12.5771484375, -12.117919921875, -11.65869140625, -11.199462890625, -10.740234375, -10.281005859375, -9.82177734375, -9.362548828125, -8.9033203125, -8.444091796875, -7.98486328125, -7.525634765625, -7.06640625, -6.607177734375, -6.14794921875, -5.688720703125, -5.2294921875, -4.770263671875, -4.31103515625, -3.851806640625, -3.392578125, -2.933349609375, -2.47412109375, -2.014892578125, -1.5556640625, -1.096435546875, -0.63720703125, -0.177978515625, 0.28125, 0.740478515625, 1.19970703125, 1.658935546875, 2.1181640625, 2.577392578125, 3.03662109375, 3.495849609375, 3.955078125, 4.414306640625, 4.87353515625, 5.332763671875, 5.7919921875, 6.251220703125, 6.71044921875, 7.169677734375, 7.62890625, 8.088134765625, 8.54736328125, 9.006591796875, 9.4658203125, 9.925048828125, 10.38427734375, 10.843505859375, 11.302734375, 11.761962890625, 12.22119140625, 12.680419921875, 13.1396484375, 13.598876953125, 14.05810546875, 14.517333984375, 14.9765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 12.0, 8.0, 20.0, 23.0, 55.0, 79.0, 119.0, 209.0, 183.0, 107.0, 56.0, 27.0, 38.0, 17.0, 7.0, 4.0, 4.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.68571472167969, -54.830745697021484, -51.97578048706055, -49.120811462402344, -46.265846252441406, -43.4108772277832, -40.555908203125, -37.70094299316406, -34.845977783203125, -31.991010665893555, -29.136043548583984, -26.28107452392578, -23.426109313964844, -20.57114028930664, -17.71617317199707, -14.8612060546875, -12.006237030029297, -9.151269912719727, -6.296302318572998, -3.4413347244262695, -0.5863676071166992, 2.268599510192871, 5.123567581176758, 7.978534698486328, 10.833501815795898, 13.688468933105469, 16.54343605041504, 19.39840316772461, 22.253372192382812, 25.10833740234375, 27.963306427001953, 30.818273544311523, 33.673240661621094, 36.5282096862793, 39.383174896240234, 42.23814392089844, 45.093109130859375, 47.94807815551758, 50.80304718017578, 53.65801239013672, 56.512977600097656, 59.36794662475586, 62.2229118347168, 65.077880859375, 67.93284606933594, 70.78781127929688, 73.64278411865234, 76.49774932861328, 79.35272216796875, 82.20768737792969, 85.06266021728516, 87.9176254272461, 90.77259063720703, 93.62755584716797, 96.48252868652344, 99.33749389648438, 102.19245910644531, 105.04742431640625, 107.90239715576172, 110.75736236572266, 113.6123275756836, 116.46729278564453, 119.322265625, 122.17723083496094, 125.03219604492188]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 15.0, 6.0, 16.0, 11.0, 11.0, 17.0, 24.0, 27.0, 25.0, 21.0, 39.0, 26.0, 41.0, 33.0, 26.0, 37.0, 48.0, 46.0, 34.0, 49.0, 42.0, 41.0, 53.0, 35.0, 39.0, 30.0, 23.0, 25.0, 21.0, 22.0, 14.0, 18.0, 14.0, 16.0, 7.0, 7.0, 8.0, 6.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-31.70625114440918, -30.815082550048828, -29.923912048339844, -29.032743453979492, -28.14157485961914, -27.250404357910156, -26.359235763549805, -25.468067169189453, -24.5768985748291, -23.68572998046875, -22.794559478759766, -21.903390884399414, -21.012222290039062, -20.121051788330078, -19.229883193969727, -18.338714599609375, -17.44754409790039, -16.55637550354004, -15.665205955505371, -14.774036407470703, -13.882867813110352, -12.991698265075684, -12.100528717041016, -11.209360122680664, -10.318191528320312, -9.427021980285645, -8.535853385925293, -7.644683837890625, -6.753515243530273, -5.8623456954956055, -4.971176624298096, -4.080007553100586, -3.1888389587402344, -2.2976698875427246, -1.4065006971359253, -0.515331506729126, 0.3758375644683838, 1.2670068740844727, 2.1581759452819824, 3.049345016479492, 3.940514087677002, 4.831683158874512, 5.7228522300720215, 6.614021301269531, 7.505190849304199, 8.396360397338867, 9.287528991699219, 10.17869758605957, 11.069867134094238, 11.961036682128906, 12.852205276489258, 13.743374824523926, 14.634543418884277, 15.525712966918945, 16.416881561279297, 17.30805206298828, 18.199220657348633, 19.090389251708984, 19.98155975341797, 20.87272834777832, 21.763896942138672, 22.655067443847656, 23.546236038208008, 24.43740463256836, 25.32857322692871]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 10.0, 17.0, 23.0, 36.0, 44.0, 63.0, 108.0, 139.0, 252.0, 385.0, 551.0, 933.0, 1559.0, 2570.0, 4375.0, 7614.0, 13835.0, 26590.0, 57482.0, 157478.0, 457497.0, 187022.0, 65176.0, 29522.0, 15093.0, 8402.0, 4656.0, 2775.0, 1602.0, 987.0, 604.0, 412.0, 261.0, 151.0, 122.0, 72.0, 47.0, 26.0, 19.0, 17.0, 8.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.71875, -57.8271484375, -55.935546875, -54.0439453125, -52.15234375, -50.2607421875, -48.369140625, -46.4775390625, -44.5859375, -42.6943359375, -40.802734375, -38.9111328125, -37.01953125, -35.1279296875, -33.236328125, -31.3447265625, -29.453125, -27.5615234375, -25.669921875, -23.7783203125, -21.88671875, -19.9951171875, -18.103515625, -16.2119140625, -14.3203125, -12.4287109375, -10.537109375, -8.6455078125, -6.75390625, -4.8623046875, -2.970703125, -1.0791015625, 0.8125, 2.7041015625, 4.595703125, 6.4873046875, 8.37890625, 10.2705078125, 12.162109375, 14.0537109375, 15.9453125, 17.8369140625, 19.728515625, 21.6201171875, 23.51171875, 25.4033203125, 27.294921875, 29.1865234375, 31.078125, 32.9697265625, 34.861328125, 36.7529296875, 38.64453125, 40.5361328125, 42.427734375, 44.3193359375, 46.2109375, 48.1025390625, 49.994140625, 51.8857421875, 53.77734375, 55.6689453125, 57.560546875, 59.4521484375, 61.34375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 4.0, 5.0, 7.0, 13.0, 16.0, 20.0, 23.0, 19.0, 26.0, 31.0, 28.0, 25.0, 37.0, 38.0, 42.0, 42.0, 35.0, 42.0, 32.0, 57.0, 51.0, 49.0, 44.0, 37.0, 49.0, 34.0, 31.0, 23.0, 26.0, 27.0, 21.0, 11.0, 12.0, 5.0, 9.0, 8.0, 8.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.359375, -29.418701171875, -28.47802734375, -27.537353515625, -26.5966796875, -25.656005859375, -24.71533203125, -23.774658203125, -22.833984375, -21.893310546875, -20.95263671875, -20.011962890625, -19.0712890625, -18.130615234375, -17.18994140625, -16.249267578125, -15.30859375, -14.367919921875, -13.42724609375, -12.486572265625, -11.5458984375, -10.605224609375, -9.66455078125, -8.723876953125, -7.783203125, -6.842529296875, -5.90185546875, -4.961181640625, -4.0205078125, -3.079833984375, -2.13916015625, -1.198486328125, -0.2578125, 0.682861328125, 1.62353515625, 2.564208984375, 3.5048828125, 4.445556640625, 5.38623046875, 6.326904296875, 7.267578125, 8.208251953125, 9.14892578125, 10.089599609375, 11.0302734375, 11.970947265625, 12.91162109375, 13.852294921875, 14.79296875, 15.733642578125, 16.67431640625, 17.614990234375, 18.5556640625, 19.496337890625, 20.43701171875, 21.377685546875, 22.318359375, 23.259033203125, 24.19970703125, 25.140380859375, 26.0810546875, 27.021728515625, 27.96240234375, 28.903076171875, 29.84375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 7.0, 14.0, 17.0, 21.0, 41.0, 50.0, 68.0, 100.0, 99.0, 167.0, 229.0, 279.0, 421.0, 618.0, 888.0, 1233.0, 1939.0, 3119.0, 5433.0, 10035.0, 22183.0, 70555.0, 644038.0, 212114.0, 39740.0, 15377.0, 7690.0, 4272.0, 2564.0, 1578.0, 1121.0, 694.0, 522.0, 383.0, 241.0, 208.0, 131.0, 104.0, 78.0, 46.0, 26.0, 22.0, 27.0, 17.0, 12.0, 4.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-85.4375, -82.662109375, -79.88671875, -77.111328125, -74.3359375, -71.560546875, -68.78515625, -66.009765625, -63.234375, -60.458984375, -57.68359375, -54.908203125, -52.1328125, -49.357421875, -46.58203125, -43.806640625, -41.03125, -38.255859375, -35.48046875, -32.705078125, -29.9296875, -27.154296875, -24.37890625, -21.603515625, -18.828125, -16.052734375, -13.27734375, -10.501953125, -7.7265625, -4.951171875, -2.17578125, 0.599609375, 3.375, 6.150390625, 8.92578125, 11.701171875, 14.4765625, 17.251953125, 20.02734375, 22.802734375, 25.578125, 28.353515625, 31.12890625, 33.904296875, 36.6796875, 39.455078125, 42.23046875, 45.005859375, 47.78125, 50.556640625, 53.33203125, 56.107421875, 58.8828125, 61.658203125, 64.43359375, 67.208984375, 69.984375, 72.759765625, 75.53515625, 78.310546875, 81.0859375, 83.861328125, 86.63671875, 89.412109375, 92.1875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 5.0, 11.0, 15.0, 7.0, 10.0, 23.0, 15.0, 22.0, 19.0, 17.0, 30.0, 25.0, 29.0, 31.0, 31.0, 30.0, 37.0, 33.0, 26.0, 45.0, 27.0, 27.0, 36.0, 40.0, 35.0, 28.0, 28.0, 34.0, 28.0, 24.0, 29.0, 26.0, 23.0, 23.0, 10.0, 18.0, 14.0, 13.0, 10.0, 14.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-20.9375, -20.33251953125, -19.7275390625, -19.12255859375, -18.517578125, -17.91259765625, -17.3076171875, -16.70263671875, -16.09765625, -15.49267578125, -14.8876953125, -14.28271484375, -13.677734375, -13.07275390625, -12.4677734375, -11.86279296875, -11.2578125, -10.65283203125, -10.0478515625, -9.44287109375, -8.837890625, -8.23291015625, -7.6279296875, -7.02294921875, -6.41796875, -5.81298828125, -5.2080078125, -4.60302734375, -3.998046875, -3.39306640625, -2.7880859375, -2.18310546875, -1.578125, -0.97314453125, -0.3681640625, 0.23681640625, 0.841796875, 1.44677734375, 2.0517578125, 2.65673828125, 3.26171875, 3.86669921875, 4.4716796875, 5.07666015625, 5.681640625, 6.28662109375, 6.8916015625, 7.49658203125, 8.1015625, 8.70654296875, 9.3115234375, 9.91650390625, 10.521484375, 11.12646484375, 11.7314453125, 12.33642578125, 12.94140625, 13.54638671875, 14.1513671875, 14.75634765625, 15.361328125, 15.96630859375, 16.5712890625, 17.17626953125, 17.78125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 9.0, 17.0, 18.0, 39.0, 48.0, 49.0, 54.0, 103.0, 122.0, 178.0, 247.0, 320.0, 436.0, 635.0, 838.0, 1117.0, 1665.0, 2446.0, 3448.0, 5433.0, 8652.0, 14912.0, 28925.0, 72888.0, 536440.0, 256604.0, 53778.0, 23644.0, 12552.0, 7432.0, 4686.0, 3139.0, 2155.0, 1553.0, 1051.0, 780.0, 545.0, 428.0, 330.0, 252.0, 158.0, 121.0, 91.0, 62.0, 52.0, 28.0, 18.0, 22.0, 10.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-39.25, -38.01806640625, -36.7861328125, -35.55419921875, -34.322265625, -33.09033203125, -31.8583984375, -30.62646484375, -29.39453125, -28.16259765625, -26.9306640625, -25.69873046875, -24.466796875, -23.23486328125, -22.0029296875, -20.77099609375, -19.5390625, -18.30712890625, -17.0751953125, -15.84326171875, -14.611328125, -13.37939453125, -12.1474609375, -10.91552734375, -9.68359375, -8.45166015625, -7.2197265625, -5.98779296875, -4.755859375, -3.52392578125, -2.2919921875, -1.06005859375, 0.171875, 1.40380859375, 2.6357421875, 3.86767578125, 5.099609375, 6.33154296875, 7.5634765625, 8.79541015625, 10.02734375, 11.25927734375, 12.4912109375, 13.72314453125, 14.955078125, 16.18701171875, 17.4189453125, 18.65087890625, 19.8828125, 21.11474609375, 22.3466796875, 23.57861328125, 24.810546875, 26.04248046875, 27.2744140625, 28.50634765625, 29.73828125, 30.97021484375, 32.2021484375, 33.43408203125, 34.666015625, 35.89794921875, 37.1298828125, 38.36181640625, 39.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 8.0, 7.0, 17.0, 20.0, 36.0, 38.0, 61.0, 79.0, 90.0, 112.0, 128.0, 130.0, 75.0, 72.0, 41.0, 30.0, 19.0, 14.0, 12.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019292831420898438, -0.001861080527305603, -0.0017928779125213623, -0.0017246752977371216, -0.0016564726829528809, -0.0015882700681686401, -0.0015200674533843994, -0.0014518648386001587, -0.001383662223815918, -0.0013154596090316772, -0.0012472569942474365, -0.0011790543794631958, -0.001110851764678955, -0.0010426491498947144, -0.0009744465351104736, -0.0009062439203262329, -0.0008380413055419922, -0.0007698386907577515, -0.0007016360759735107, -0.00063343346118927, -0.0005652308464050293, -0.0004970282316207886, -0.00042882561683654785, -0.00036062300205230713, -0.0002924203872680664, -0.00022421777248382568, -0.00015601515769958496, -8.781254291534424e-05, -1.9609928131103516e-05, 4.859268665313721e-05, 0.00011679530143737793, 0.00018499791622161865, 0.0002532005310058594, 0.0003214031457901001, 0.0003896057605743408, 0.00045780837535858154, 0.0005260109901428223, 0.000594213604927063, 0.0006624162197113037, 0.0007306188344955444, 0.0007988214492797852, 0.0008670240640640259, 0.0009352266788482666, 0.0010034292936325073, 0.001071631908416748, 0.0011398345232009888, 0.0012080371379852295, 0.0012762397527694702, 0.001344442367553711, 0.0014126449823379517, 0.0014808475971221924, 0.001549050211906433, 0.0016172528266906738, 0.0016854554414749146, 0.0017536580562591553, 0.001821860671043396, 0.0018900632858276367, 0.0019582659006118774, 0.002026468515396118, 0.002094671130180359, 0.0021628737449645996, 0.0022310763597488403, 0.002299278974533081, 0.0023674815893173218, 0.0024356842041015625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 4.0, 8.0, 13.0, 25.0, 26.0, 45.0, 52.0, 89.0, 175.0, 227.0, 319.0, 493.0, 851.0, 1307.0, 2371.0, 4281.0, 8390.0, 17958.0, 43559.0, 130162.0, 511814.0, 214690.0, 63328.0, 24724.0, 11055.0, 5461.0, 2843.0, 1611.0, 922.0, 597.0, 381.0, 244.0, 160.0, 136.0, 55.0, 68.0, 29.0, 25.0, 15.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.6875, -34.443359375, -33.19921875, -31.955078125, -30.7109375, -29.466796875, -28.22265625, -26.978515625, -25.734375, -24.490234375, -23.24609375, -22.001953125, -20.7578125, -19.513671875, -18.26953125, -17.025390625, -15.78125, -14.537109375, -13.29296875, -12.048828125, -10.8046875, -9.560546875, -8.31640625, -7.072265625, -5.828125, -4.583984375, -3.33984375, -2.095703125, -0.8515625, 0.392578125, 1.63671875, 2.880859375, 4.125, 5.369140625, 6.61328125, 7.857421875, 9.1015625, 10.345703125, 11.58984375, 12.833984375, 14.078125, 15.322265625, 16.56640625, 17.810546875, 19.0546875, 20.298828125, 21.54296875, 22.787109375, 24.03125, 25.275390625, 26.51953125, 27.763671875, 29.0078125, 30.251953125, 31.49609375, 32.740234375, 33.984375, 35.228515625, 36.47265625, 37.716796875, 38.9609375, 40.205078125, 41.44921875, 42.693359375, 43.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 10.0, 12.0, 20.0, 16.0, 27.0, 34.0, 51.0, 63.0, 70.0, 76.0, 78.0, 104.0, 88.0, 71.0, 58.0, 49.0, 43.0, 29.0, 25.0, 13.0, 17.0, 7.0, 3.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.73553466796875, -8.4866943359375, -8.23785400390625, -7.989013671875, -7.74017333984375, -7.4913330078125, -7.24249267578125, -6.99365234375, -6.74481201171875, -6.4959716796875, -6.24713134765625, -5.998291015625, -5.74945068359375, -5.5006103515625, -5.25177001953125, -5.0029296875, -4.75408935546875, -4.5052490234375, -4.25640869140625, -4.007568359375, -3.75872802734375, -3.5098876953125, -3.26104736328125, -3.01220703125, -2.76336669921875, -2.5145263671875, -2.26568603515625, -2.016845703125, -1.76800537109375, -1.5191650390625, -1.27032470703125, -1.021484375, -0.77264404296875, -0.5238037109375, -0.27496337890625, -0.026123046875, 0.22271728515625, 0.4715576171875, 0.72039794921875, 0.96923828125, 1.21807861328125, 1.4669189453125, 1.71575927734375, 1.964599609375, 2.21343994140625, 2.4622802734375, 2.71112060546875, 2.9599609375, 3.20880126953125, 3.4576416015625, 3.70648193359375, 3.955322265625, 4.20416259765625, 4.4530029296875, 4.70184326171875, 4.95068359375, 5.19952392578125, 5.4483642578125, 5.69720458984375, 5.946044921875, 6.19488525390625, 6.4437255859375, 6.69256591796875, 6.94140625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 2.0, 8.0, 6.0, 15.0, 12.0, 17.0, 49.0, 51.0, 92.0, 161.0, 199.0, 144.0, 78.0, 48.0, 36.0, 23.0, 17.0, 6.0, 6.0, 4.0, 6.0, 9.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84046936035156, -50.256866455078125, -47.67326354980469, -45.08966064453125, -42.50605773925781, -39.922454833984375, -37.33885192871094, -34.7552490234375, -32.17164611816406, -29.588043212890625, -27.004440307617188, -24.42083740234375, -21.837234497070312, -19.253631591796875, -16.670028686523438, -14.08642578125, -11.502822875976562, -8.919219970703125, -6.3356170654296875, -3.75201416015625, -1.1684112548828125, 1.415191650390625, 3.9987945556640625, 6.5823974609375, 9.166000366210938, 11.749603271484375, 14.333206176757812, 16.91680908203125, 19.500411987304688, 22.084014892578125, 24.667617797851562, 27.251220703125, 29.834823608398438, 32.418426513671875, 35.00202941894531, 37.58563232421875, 40.16923522949219, 42.752838134765625, 45.33644104003906, 47.9200439453125, 50.50364685058594, 53.087249755859375, 55.67085266113281, 58.25445556640625, 60.83805847167969, 63.421661376953125, 66.00526428222656, 68.5888671875, 71.17247009277344, 73.75607299804688, 76.33967590332031, 78.92327880859375, 81.50688171386719, 84.09048461914062, 86.67408752441406, 89.2576904296875, 91.84129333496094, 94.42489624023438, 97.00849914550781, 99.59210205078125, 102.17570495605469, 104.75930786132812, 107.34291076660156, 109.926513671875, 112.51011657714844]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 6.0, 11.0, 8.0, 7.0, 12.0, 14.0, 12.0, 17.0, 20.0, 23.0, 20.0, 27.0, 20.0, 33.0, 43.0, 36.0, 33.0, 40.0, 30.0, 41.0, 38.0, 45.0, 39.0, 43.0, 44.0, 36.0, 36.0, 33.0, 31.0, 39.0, 22.0, 18.0, 20.0, 23.0, 12.0, 12.0, 14.0, 9.0, 8.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.143213272094727, -27.320280075073242, -26.497346878051758, -25.674413681030273, -24.85148048400879, -24.028547286987305, -23.20561408996582, -22.382680892944336, -21.55974769592285, -20.736814498901367, -19.913881301879883, -19.0909481048584, -18.268014907836914, -17.44508171081543, -16.622148513793945, -15.799215316772461, -14.97628116607666, -14.153347969055176, -13.330414772033691, -12.507481575012207, -11.684548377990723, -10.861614227294922, -10.038681030273438, -9.215747833251953, -8.392814636230469, -7.569881439208984, -6.7469482421875, -5.924015045166016, -5.101081848144531, -4.278148174285889, -3.4552149772644043, -2.63228178024292, -1.8093490600585938, -0.9864158034324646, -0.16348254680633545, 0.6594507694244385, 1.4823839664459229, 2.3053174018859863, 3.1282505989074707, 3.951183795928955, 4.7741169929504395, 5.597050189971924, 6.419983386993408, 7.242917060852051, 8.065850257873535, 8.88878345489502, 9.711716651916504, 10.534649848937988, 11.357583045959473, 12.180516242980957, 13.003449440002441, 13.826382637023926, 14.64931583404541, 15.472249984741211, 16.295183181762695, 17.11811637878418, 17.941049575805664, 18.76398277282715, 19.586915969848633, 20.409849166870117, 21.2327823638916, 22.055715560913086, 22.87864875793457, 23.701581954956055, 24.52451515197754]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 14.0, 11.0, 27.0, 41.0, 46.0, 83.0, 135.0, 221.0, 331.0, 523.0, 802.0, 1351.0, 2189.0, 3673.0, 5872.0, 9776.0, 16654.0, 28712.0, 50494.0, 91479.0, 164644.0, 235453.0, 188206.0, 107567.0, 59347.0, 33417.0, 19026.0, 11341.0, 6527.0, 3967.0, 2455.0, 1572.0, 1003.0, 581.0, 366.0, 216.0, 141.0, 124.0, 59.0, 40.0, 24.0, 16.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -50.0732421875, -48.490234375, -46.9072265625, -45.32421875, -43.7412109375, -42.158203125, -40.5751953125, -38.9921875, -37.4091796875, -35.826171875, -34.2431640625, -32.66015625, -31.0771484375, -29.494140625, -27.9111328125, -26.328125, -24.7451171875, -23.162109375, -21.5791015625, -19.99609375, -18.4130859375, -16.830078125, -15.2470703125, -13.6640625, -12.0810546875, -10.498046875, -8.9150390625, -7.33203125, -5.7490234375, -4.166015625, -2.5830078125, -1.0, 0.5830078125, 2.166015625, 3.7490234375, 5.33203125, 6.9150390625, 8.498046875, 10.0810546875, 11.6640625, 13.2470703125, 14.830078125, 16.4130859375, 17.99609375, 19.5791015625, 21.162109375, 22.7451171875, 24.328125, 25.9111328125, 27.494140625, 29.0771484375, 30.66015625, 32.2431640625, 33.826171875, 35.4091796875, 36.9921875, 38.5751953125, 40.158203125, 41.7412109375, 43.32421875, 44.9072265625, 46.490234375, 48.0732421875, 49.65625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 9.0, 7.0, 9.0, 12.0, 15.0, 8.0, 14.0, 21.0, 24.0, 25.0, 33.0, 43.0, 44.0, 32.0, 31.0, 46.0, 42.0, 52.0, 49.0, 48.0, 53.0, 47.0, 41.0, 40.0, 40.0, 27.0, 34.0, 27.0, 19.0, 28.0, 19.0, 17.0, 7.0, 11.0, 3.0, 13.0, 2.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.4375, -32.519287109375, -31.60107421875, -30.682861328125, -29.7646484375, -28.846435546875, -27.92822265625, -27.010009765625, -26.091796875, -25.173583984375, -24.25537109375, -23.337158203125, -22.4189453125, -21.500732421875, -20.58251953125, -19.664306640625, -18.74609375, -17.827880859375, -16.90966796875, -15.991455078125, -15.0732421875, -14.155029296875, -13.23681640625, -12.318603515625, -11.400390625, -10.482177734375, -9.56396484375, -8.645751953125, -7.7275390625, -6.809326171875, -5.89111328125, -4.972900390625, -4.0546875, -3.136474609375, -2.21826171875, -1.300048828125, -0.3818359375, 0.536376953125, 1.45458984375, 2.372802734375, 3.291015625, 4.209228515625, 5.12744140625, 6.045654296875, 6.9638671875, 7.882080078125, 8.80029296875, 9.718505859375, 10.63671875, 11.554931640625, 12.47314453125, 13.391357421875, 14.3095703125, 15.227783203125, 16.14599609375, 17.064208984375, 17.982421875, 18.900634765625, 19.81884765625, 20.737060546875, 21.6552734375, 22.573486328125, 23.49169921875, 24.409912109375, 25.328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 3.0, 7.0, 7.0, 8.0, 9.0, 22.0, 28.0, 29.0, 52.0, 71.0, 103.0, 153.0, 214.0, 310.0, 475.0, 651.0, 1073.0, 1600.0, 2713.0, 4328.0, 7326.0, 12918.0, 24339.0, 47402.0, 103244.0, 239646.0, 319636.0, 144164.0, 65534.0, 31991.0, 16775.0, 9330.0, 5404.0, 3154.0, 1994.0, 1308.0, 826.0, 551.0, 385.0, 237.0, 164.0, 120.0, 84.0, 57.0, 31.0, 27.0, 18.0, 12.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-66.0625, -64.13134765625, -62.2001953125, -60.26904296875, -58.337890625, -56.40673828125, -54.4755859375, -52.54443359375, -50.61328125, -48.68212890625, -46.7509765625, -44.81982421875, -42.888671875, -40.95751953125, -39.0263671875, -37.09521484375, -35.1640625, -33.23291015625, -31.3017578125, -29.37060546875, -27.439453125, -25.50830078125, -23.5771484375, -21.64599609375, -19.71484375, -17.78369140625, -15.8525390625, -13.92138671875, -11.990234375, -10.05908203125, -8.1279296875, -6.19677734375, -4.265625, -2.33447265625, -0.4033203125, 1.52783203125, 3.458984375, 5.39013671875, 7.3212890625, 9.25244140625, 11.18359375, 13.11474609375, 15.0458984375, 16.97705078125, 18.908203125, 20.83935546875, 22.7705078125, 24.70166015625, 26.6328125, 28.56396484375, 30.4951171875, 32.42626953125, 34.357421875, 36.28857421875, 38.2197265625, 40.15087890625, 42.08203125, 44.01318359375, 45.9443359375, 47.87548828125, 49.806640625, 51.73779296875, 53.6689453125, 55.60009765625, 57.53125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 4.0, 4.0, 6.0, 16.0, 14.0, 12.0, 22.0, 23.0, 26.0, 24.0, 25.0, 28.0, 37.0, 31.0, 35.0, 44.0, 30.0, 42.0, 41.0, 40.0, 29.0, 35.0, 36.0, 39.0, 35.0, 37.0, 37.0, 36.0, 29.0, 24.0, 18.0, 16.0, 22.0, 6.0, 20.0, 11.0, 7.0, 11.0, 9.0, 7.0, 10.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.125, -17.478759765625, -16.83251953125, -16.186279296875, -15.5400390625, -14.893798828125, -14.24755859375, -13.601318359375, -12.955078125, -12.308837890625, -11.66259765625, -11.016357421875, -10.3701171875, -9.723876953125, -9.07763671875, -8.431396484375, -7.78515625, -7.138916015625, -6.49267578125, -5.846435546875, -5.2001953125, -4.553955078125, -3.90771484375, -3.261474609375, -2.615234375, -1.968994140625, -1.32275390625, -0.676513671875, -0.0302734375, 0.615966796875, 1.26220703125, 1.908447265625, 2.5546875, 3.200927734375, 3.84716796875, 4.493408203125, 5.1396484375, 5.785888671875, 6.43212890625, 7.078369140625, 7.724609375, 8.370849609375, 9.01708984375, 9.663330078125, 10.3095703125, 10.955810546875, 11.60205078125, 12.248291015625, 12.89453125, 13.540771484375, 14.18701171875, 14.833251953125, 15.4794921875, 16.125732421875, 16.77197265625, 17.418212890625, 18.064453125, 18.710693359375, 19.35693359375, 20.003173828125, 20.6494140625, 21.295654296875, 21.94189453125, 22.588134765625, 23.234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 10.0, 16.0, 17.0, 28.0, 45.0, 51.0, 80.0, 143.0, 217.0, 385.0, 688.0, 1398.0, 3317.0, 9706.0, 38262.0, 613080.0, 335265.0, 31645.0, 8290.0, 3048.0, 1250.0, 664.0, 315.0, 200.0, 140.0, 88.0, 55.0, 37.0, 27.0, 21.0, 20.0, 9.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.5, -282.60546875, -271.7109375, -260.81640625, -249.921875, -239.02734375, -228.1328125, -217.23828125, -206.34375, -195.44921875, -184.5546875, -173.66015625, -162.765625, -151.87109375, -140.9765625, -130.08203125, -119.1875, -108.29296875, -97.3984375, -86.50390625, -75.609375, -64.71484375, -53.8203125, -42.92578125, -32.03125, -21.13671875, -10.2421875, 0.65234375, 11.546875, 22.44140625, 33.3359375, 44.23046875, 55.125, 66.01953125, 76.9140625, 87.80859375, 98.703125, 109.59765625, 120.4921875, 131.38671875, 142.28125, 153.17578125, 164.0703125, 174.96484375, 185.859375, 196.75390625, 207.6484375, 218.54296875, 229.4375, 240.33203125, 251.2265625, 262.12109375, 273.015625, 283.91015625, 294.8046875, 305.69921875, 316.59375, 327.48828125, 338.3828125, 349.27734375, 360.171875, 371.06640625, 381.9609375, 392.85546875, 403.75]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 6.0, 10.0, 26.0, 35.0, 47.0, 80.0, 83.0, 141.0, 179.0, 133.0, 83.0, 55.0, 31.0, 30.0, 16.0, 6.0, 5.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.008209228515625, -0.007918477058410645, -0.007627725601196289, -0.007336974143981934, -0.007046222686767578, -0.006755471229553223, -0.006464719772338867, -0.006173968315124512, -0.005883216857910156, -0.005592465400695801, -0.005301713943481445, -0.00501096248626709, -0.004720211029052734, -0.004429459571838379, -0.0041387081146240234, -0.003847956657409668, -0.0035572052001953125, -0.003266453742980957, -0.0029757022857666016, -0.002684950828552246, -0.0023941993713378906, -0.002103447914123535, -0.0018126964569091797, -0.0015219449996948242, -0.0012311935424804688, -0.0009404420852661133, -0.0006496906280517578, -0.00035893917083740234, -6.818771362304688e-05, 0.0002225637435913086, 0.0005133152008056641, 0.0008040666580200195, 0.001094818115234375, 0.0013855695724487305, 0.001676321029663086, 0.0019670724868774414, 0.002257823944091797, 0.0025485754013061523, 0.002839326858520508, 0.0031300783157348633, 0.0034208297729492188, 0.0037115812301635742, 0.00400233268737793, 0.004293084144592285, 0.004583835601806641, 0.004874587059020996, 0.0051653385162353516, 0.005456089973449707, 0.0057468414306640625, 0.006037592887878418, 0.0063283443450927734, 0.006619095802307129, 0.006909847259521484, 0.00720059871673584, 0.007491350173950195, 0.007782101631164551, 0.008072853088378906, 0.008363604545593262, 0.008654356002807617, 0.008945107460021973, 0.009235858917236328, 0.009526610374450684, 0.009817361831665039, 0.010108113288879395, 0.01039886474609375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 8.0, 18.0, 13.0, 32.0, 36.0, 45.0, 60.0, 80.0, 102.0, 151.0, 246.0, 372.0, 586.0, 1006.0, 1940.0, 4630.0, 13910.0, 74563.0, 822857.0, 100777.0, 16826.0, 5124.0, 2208.0, 1093.0, 630.0, 377.0, 261.0, 159.0, 117.0, 78.0, 67.0, 50.0, 43.0, 12.0, 18.0, 16.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-335.25, -325.26171875, -315.2734375, -305.28515625, -295.296875, -285.30859375, -275.3203125, -265.33203125, -255.34375, -245.35546875, -235.3671875, -225.37890625, -215.390625, -205.40234375, -195.4140625, -185.42578125, -175.4375, -165.44921875, -155.4609375, -145.47265625, -135.484375, -125.49609375, -115.5078125, -105.51953125, -95.53125, -85.54296875, -75.5546875, -65.56640625, -55.578125, -45.58984375, -35.6015625, -25.61328125, -15.625, -5.63671875, 4.3515625, 14.33984375, 24.328125, 34.31640625, 44.3046875, 54.29296875, 64.28125, 74.26953125, 84.2578125, 94.24609375, 104.234375, 114.22265625, 124.2109375, 134.19921875, 144.1875, 154.17578125, 164.1640625, 174.15234375, 184.140625, 194.12890625, 204.1171875, 214.10546875, 224.09375, 234.08203125, 244.0703125, 254.05859375, 264.046875, 274.03515625, 284.0234375, 294.01171875, 304.0]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 5.0, 1.0, 7.0, 10.0, 19.0, 38.0, 55.0, 92.0, 119.0, 146.0, 144.0, 139.0, 79.0, 46.0, 45.0, 12.0, 17.0, 4.0, 8.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6875, -57.6943359375, -55.701171875, -53.7080078125, -51.71484375, -49.7216796875, -47.728515625, -45.7353515625, -43.7421875, -41.7490234375, -39.755859375, -37.7626953125, -35.76953125, -33.7763671875, -31.783203125, -29.7900390625, -27.796875, -25.8037109375, -23.810546875, -21.8173828125, -19.82421875, -17.8310546875, -15.837890625, -13.8447265625, -11.8515625, -9.8583984375, -7.865234375, -5.8720703125, -3.87890625, -1.8857421875, 0.107421875, 2.1005859375, 4.09375, 6.0869140625, 8.080078125, 10.0732421875, 12.06640625, 14.0595703125, 16.052734375, 18.0458984375, 20.0390625, 22.0322265625, 24.025390625, 26.0185546875, 28.01171875, 30.0048828125, 31.998046875, 33.9912109375, 35.984375, 37.9775390625, 39.970703125, 41.9638671875, 43.95703125, 45.9501953125, 47.943359375, 49.9365234375, 51.9296875, 53.9228515625, 55.916015625, 57.9091796875, 59.90234375, 61.8955078125, 63.888671875, 65.8818359375, 67.875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 19.0, 41.0, 55.0, 107.0, 155.0, 200.0, 103.0, 74.0, 46.0, 30.0, 27.0, 17.0, 18.0, 15.0, 9.0, 16.0, 5.0, 4.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.27420425415039, -33.833919525146484, -31.393634796142578, -28.953350067138672, -26.513065338134766, -24.07278060913086, -21.63249397277832, -19.192209243774414, -16.751924514770508, -14.311639785766602, -11.871355056762695, -9.431069374084473, -6.990784645080566, -4.55049991607666, -2.1102142333984375, 0.33007049560546875, 2.770355224609375, 5.210639953613281, 7.650925159454346, 10.09121036529541, 12.531495094299316, 14.971779823303223, 17.412065505981445, 19.85235023498535, 22.292634963989258, 24.732919692993164, 27.17320442199707, 29.61349105834961, 32.053775787353516, 34.49406051635742, 36.93434524536133, 39.374629974365234, 41.814918518066406, 44.25520324707031, 46.69548797607422, 49.135772705078125, 51.57605743408203, 54.01634216308594, 56.456626892089844, 58.89691162109375, 61.337196350097656, 63.77748107910156, 66.21776580810547, 68.65805053710938, 71.09833526611328, 73.53861999511719, 75.9789047241211, 78.419189453125, 80.85948181152344, 83.29976654052734, 85.74005126953125, 88.18033599853516, 90.62062072753906, 93.06090545654297, 95.50119018554688, 97.94147491455078, 100.38175964355469, 102.8220443725586, 105.2623291015625, 107.7026138305664, 110.14289855957031, 112.58318328857422, 115.02346801757812, 117.46375274658203, 119.90403747558594]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 1.0, 6.0, 5.0, 10.0, 6.0, 6.0, 14.0, 8.0, 16.0, 23.0, 17.0, 25.0, 17.0, 31.0, 25.0, 35.0, 26.0, 43.0, 38.0, 27.0, 40.0, 42.0, 39.0, 42.0, 43.0, 52.0, 37.0, 37.0, 31.0, 40.0, 28.0, 26.0, 24.0, 17.0, 22.0, 27.0, 25.0, 4.0, 10.0, 9.0, 5.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.479450225830078, -29.516387939453125, -28.553325653076172, -27.59026527404785, -26.6272029876709, -25.664140701293945, -24.701078414916992, -23.738018035888672, -22.77495574951172, -21.811893463134766, -20.848831176757812, -19.885770797729492, -18.92270851135254, -17.959646224975586, -16.996583938598633, -16.033523559570312, -15.070460319519043, -14.10739803314209, -13.144336700439453, -12.1812744140625, -11.218213081359863, -10.25515079498291, -9.292089462280273, -8.32902717590332, -7.365965366363525, -6.4029035568237305, -5.4398417472839355, -4.476779937744141, -3.5137178897857666, -2.5506558418273926, -1.5875940322875977, -0.6245322227478027, 0.3385295867919922, 1.301591396331787, 2.264653205871582, 3.227715253829956, 4.190776824951172, 5.153839111328125, 6.11690092086792, 7.079962730407715, 8.043024063110352, 9.006086349487305, 9.969147682189941, 10.932209968566895, 11.895271301269531, 12.858333587646484, 13.821395874023438, 14.784457206726074, 15.747519493103027, 16.710580825805664, 17.673643112182617, 18.63670539855957, 19.599767684936523, 20.562828063964844, 21.525890350341797, 22.48895263671875, 23.452014923095703, 24.415077209472656, 25.37813949584961, 26.34119987487793, 27.304262161254883, 28.267324447631836, 29.23038673400879, 30.19344711303711, 31.156509399414062]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 8.0, 3.0, 8.0, 13.0, 27.0, 35.0, 43.0, 62.0, 85.0, 98.0, 164.0, 266.0, 343.0, 518.0, 800.0, 1145.0, 1723.0, 2627.0, 4143.0, 6510.0, 10540.0, 17598.0, 31060.0, 57714.0, 120320.0, 325144.0, 1540298.0, 1486963.0, 332009.0, 121585.0, 57800.0, 30675.0, 17261.0, 10165.0, 6088.0, 3818.0, 2304.0, 1476.0, 1045.0, 641.0, 416.0, 254.0, 179.0, 103.0, 71.0, 47.0, 28.0, 23.0, 23.0, 10.0, 9.0, 1.0, 0.0, 1.0], "bins": [-57.0, -55.458984375, -53.91796875, -52.376953125, -50.8359375, -49.294921875, -47.75390625, -46.212890625, -44.671875, -43.130859375, -41.58984375, -40.048828125, -38.5078125, -36.966796875, -35.42578125, -33.884765625, -32.34375, -30.802734375, -29.26171875, -27.720703125, -26.1796875, -24.638671875, -23.09765625, -21.556640625, -20.015625, -18.474609375, -16.93359375, -15.392578125, -13.8515625, -12.310546875, -10.76953125, -9.228515625, -7.6875, -6.146484375, -4.60546875, -3.064453125, -1.5234375, 0.017578125, 1.55859375, 3.099609375, 4.640625, 6.181640625, 7.72265625, 9.263671875, 10.8046875, 12.345703125, 13.88671875, 15.427734375, 16.96875, 18.509765625, 20.05078125, 21.591796875, 23.1328125, 24.673828125, 26.21484375, 27.755859375, 29.296875, 30.837890625, 32.37890625, 33.919921875, 35.4609375, 37.001953125, 38.54296875, 40.083984375, 41.625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 10.0, 8.0, 4.0, 7.0, 9.0, 19.0, 9.0, 10.0, 17.0, 12.0, 23.0, 28.0, 33.0, 32.0, 29.0, 39.0, 36.0, 40.0, 45.0, 39.0, 44.0, 50.0, 38.0, 36.0, 40.0, 37.0, 45.0, 34.0, 35.0, 28.0, 32.0, 26.0, 13.0, 18.0, 13.0, 15.0, 17.0, 7.0, 6.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.78125, -18.24462890625, -17.7080078125, -17.17138671875, -16.634765625, -16.09814453125, -15.5615234375, -15.02490234375, -14.48828125, -13.95166015625, -13.4150390625, -12.87841796875, -12.341796875, -11.80517578125, -11.2685546875, -10.73193359375, -10.1953125, -9.65869140625, -9.1220703125, -8.58544921875, -8.048828125, -7.51220703125, -6.9755859375, -6.43896484375, -5.90234375, -5.36572265625, -4.8291015625, -4.29248046875, -3.755859375, -3.21923828125, -2.6826171875, -2.14599609375, -1.609375, -1.07275390625, -0.5361328125, 0.00048828125, 0.537109375, 1.07373046875, 1.6103515625, 2.14697265625, 2.68359375, 3.22021484375, 3.7568359375, 4.29345703125, 4.830078125, 5.36669921875, 5.9033203125, 6.43994140625, 6.9765625, 7.51318359375, 8.0498046875, 8.58642578125, 9.123046875, 9.65966796875, 10.1962890625, 10.73291015625, 11.26953125, 11.80615234375, 12.3427734375, 12.87939453125, 13.416015625, 13.95263671875, 14.4892578125, 15.02587890625, 15.5625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 6.0, 20.0, 33.0, 33.0, 44.0, 61.0, 85.0, 149.0, 204.0, 314.0, 472.0, 790.0, 1255.0, 2123.0, 3717.0, 6825.0, 13618.0, 29629.0, 74860.0, 246439.0, 1425632.0, 1932050.0, 301615.0, 87498.0, 33599.0, 15351.0, 7676.0, 4119.0, 2340.0, 1381.0, 851.0, 534.0, 352.0, 202.0, 135.0, 85.0, 55.0, 33.0, 36.0, 11.0, 11.0, 8.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-65.5, -63.57763671875, -61.6552734375, -59.73291015625, -57.810546875, -55.88818359375, -53.9658203125, -52.04345703125, -50.12109375, -48.19873046875, -46.2763671875, -44.35400390625, -42.431640625, -40.50927734375, -38.5869140625, -36.66455078125, -34.7421875, -32.81982421875, -30.8974609375, -28.97509765625, -27.052734375, -25.13037109375, -23.2080078125, -21.28564453125, -19.36328125, -17.44091796875, -15.5185546875, -13.59619140625, -11.673828125, -9.75146484375, -7.8291015625, -5.90673828125, -3.984375, -2.06201171875, -0.1396484375, 1.78271484375, 3.705078125, 5.62744140625, 7.5498046875, 9.47216796875, 11.39453125, 13.31689453125, 15.2392578125, 17.16162109375, 19.083984375, 21.00634765625, 22.9287109375, 24.85107421875, 26.7734375, 28.69580078125, 30.6181640625, 32.54052734375, 34.462890625, 36.38525390625, 38.3076171875, 40.22998046875, 42.15234375, 44.07470703125, 45.9970703125, 47.91943359375, 49.841796875, 51.76416015625, 53.6865234375, 55.60888671875, 57.53125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 11.0, 8.0, 11.0, 11.0, 23.0, 29.0, 37.0, 63.0, 66.0, 96.0, 131.0, 164.0, 220.0, 250.0, 337.0, 412.0, 410.0, 405.0, 303.0, 210.0, 195.0, 134.0, 104.0, 80.0, 70.0, 51.0, 48.0, 32.0, 26.0, 25.0, 12.0, 21.0, 16.0, 14.0, 3.0, 6.0, 8.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.6640625, -10.301513671875, -9.93896484375, -9.576416015625, -9.2138671875, -8.851318359375, -8.48876953125, -8.126220703125, -7.763671875, -7.401123046875, -7.03857421875, -6.676025390625, -6.3134765625, -5.950927734375, -5.58837890625, -5.225830078125, -4.86328125, -4.500732421875, -4.13818359375, -3.775634765625, -3.4130859375, -3.050537109375, -2.68798828125, -2.325439453125, -1.962890625, -1.600341796875, -1.23779296875, -0.875244140625, -0.5126953125, -0.150146484375, 0.21240234375, 0.574951171875, 0.9375, 1.300048828125, 1.66259765625, 2.025146484375, 2.3876953125, 2.750244140625, 3.11279296875, 3.475341796875, 3.837890625, 4.200439453125, 4.56298828125, 4.925537109375, 5.2880859375, 5.650634765625, 6.01318359375, 6.375732421875, 6.73828125, 7.100830078125, 7.46337890625, 7.825927734375, 8.1884765625, 8.551025390625, 8.91357421875, 9.276123046875, 9.638671875, 10.001220703125, 10.36376953125, 10.726318359375, 11.0888671875, 11.451416015625, 11.81396484375, 12.176513671875, 12.5390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 2.0, 14.0, 11.0, 19.0, 36.0, 49.0, 62.0, 129.0, 202.0, 201.0, 85.0, 55.0, 38.0, 21.0, 23.0, 12.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.578548431396484, -49.67729568481445, -47.776039123535156, -45.874786376953125, -43.973533630371094, -42.07228088378906, -40.171024322509766, -38.269771575927734, -36.36851501464844, -34.467262268066406, -32.56600570678711, -30.664752960205078, -28.763500213623047, -26.862245559692383, -24.96099090576172, -23.059738159179688, -21.158485412597656, -19.257230758666992, -17.35597801208496, -15.454723358154297, -13.55346965789795, -11.652215957641602, -9.750961303710938, -7.84970760345459, -5.948453903198242, -4.0472002029418945, -2.1459460258483887, -0.2446918487548828, 1.6565618515014648, 3.5578155517578125, 5.459070205688477, 7.360323905944824, 9.261581420898438, 11.162835121154785, 13.064088821411133, 14.965343475341797, 16.866596221923828, 18.767850875854492, 20.669105529785156, 22.570358276367188, 24.47161293029785, 26.372867584228516, 28.274120330810547, 30.17537498474121, 32.076629638671875, 33.977882385253906, 35.87913513183594, 37.780391693115234, 39.681644439697266, 41.5828971862793, 43.484153747558594, 45.385406494140625, 47.286659240722656, 49.18791198730469, 51.089168548583984, 52.990421295166016, 54.89167785644531, 56.792930603027344, 58.69418716430664, 60.59543991088867, 62.4966926574707, 64.39794921875, 66.29920196533203, 68.20045471191406, 70.1017074584961]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 11.0, 5.0, 13.0, 21.0, 19.0, 8.0, 16.0, 20.0, 20.0, 17.0, 28.0, 30.0, 18.0, 31.0, 40.0, 28.0, 34.0, 25.0, 33.0, 38.0, 36.0, 41.0, 37.0, 37.0, 28.0, 27.0, 28.0, 30.0, 27.0, 26.0, 24.0, 18.0, 23.0, 25.0, 14.0, 11.0, 18.0, 11.0, 10.0, 12.0, 7.0, 5.0, 7.0, 8.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.62067413330078, -16.076560974121094, -15.532445907592773, -14.988332748413086, -14.444218635559082, -13.900104522705078, -13.355990409851074, -12.81187629699707, -12.267763137817383, -11.723649024963379, -11.179534912109375, -10.635421752929688, -10.091307640075684, -9.54719352722168, -9.003079414367676, -8.458965301513672, -7.914851188659668, -7.370737075805664, -6.826623439788818, -6.2825093269348145, -5.738395690917969, -5.194281578063965, -4.650167465209961, -4.106053352355957, -3.5619397163391113, -3.0178258419036865, -2.4737119674682617, -1.9295978546142578, -1.385483980178833, -0.8413701057434082, -0.2972559928894043, 0.2468578815460205, 0.7909717559814453, 1.3350856304168701, 1.8791996240615845, 2.423313617706299, 2.9674274921417236, 3.5115413665771484, 4.055655479431152, 4.599769592285156, 5.143883228302002, 5.687997341156006, 6.232110977172852, 6.7762250900268555, 7.320339202880859, 7.864452838897705, 8.408567428588867, 8.952680587768555, 9.496794700622559, 10.040908813476562, 10.585022926330566, 11.12913703918457, 11.673250198364258, 12.217364311218262, 12.761478424072266, 13.30559253692627, 13.849706649780273, 14.393820762634277, 14.937934875488281, 15.482048034667969, 16.02616310119629, 16.570276260375977, 17.114391326904297, 17.658504486083984, 18.202617645263672]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 8.0, 19.0, 18.0, 28.0, 38.0, 57.0, 78.0, 97.0, 155.0, 203.0, 301.0, 426.0, 614.0, 879.0, 1276.0, 1938.0, 2889.0, 4412.0, 7184.0, 11933.0, 21065.0, 42438.0, 100798.0, 382711.0, 295949.0, 86178.0, 37490.0, 19281.0, 10902.0, 6545.0, 4170.0, 2678.0, 1789.0, 1242.0, 820.0, 577.0, 387.0, 267.0, 199.0, 147.0, 106.0, 74.0, 56.0, 39.0, 26.0, 20.0, 11.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.71875, -34.52490234375, -33.3310546875, -32.13720703125, -30.943359375, -29.74951171875, -28.5556640625, -27.36181640625, -26.16796875, -24.97412109375, -23.7802734375, -22.58642578125, -21.392578125, -20.19873046875, -19.0048828125, -17.81103515625, -16.6171875, -15.42333984375, -14.2294921875, -13.03564453125, -11.841796875, -10.64794921875, -9.4541015625, -8.26025390625, -7.06640625, -5.87255859375, -4.6787109375, -3.48486328125, -2.291015625, -1.09716796875, 0.0966796875, 1.29052734375, 2.484375, 3.67822265625, 4.8720703125, 6.06591796875, 7.259765625, 8.45361328125, 9.6474609375, 10.84130859375, 12.03515625, 13.22900390625, 14.4228515625, 15.61669921875, 16.810546875, 18.00439453125, 19.1982421875, 20.39208984375, 21.5859375, 22.77978515625, 23.9736328125, 25.16748046875, 26.361328125, 27.55517578125, 28.7490234375, 29.94287109375, 31.13671875, 32.33056640625, 33.5244140625, 34.71826171875, 35.912109375, 37.10595703125, 38.2998046875, 39.49365234375, 40.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 10.0, 12.0, 15.0, 18.0, 19.0, 16.0, 11.0, 31.0, 27.0, 30.0, 34.0, 37.0, 50.0, 31.0, 38.0, 35.0, 38.0, 41.0, 45.0, 37.0, 34.0, 42.0, 33.0, 33.0, 35.0, 37.0, 18.0, 21.0, 22.0, 15.0, 17.0, 18.0, 13.0, 11.0, 9.0, 8.0, 11.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.953125, -19.35498046875, -18.7568359375, -18.15869140625, -17.560546875, -16.96240234375, -16.3642578125, -15.76611328125, -15.16796875, -14.56982421875, -13.9716796875, -13.37353515625, -12.775390625, -12.17724609375, -11.5791015625, -10.98095703125, -10.3828125, -9.78466796875, -9.1865234375, -8.58837890625, -7.990234375, -7.39208984375, -6.7939453125, -6.19580078125, -5.59765625, -4.99951171875, -4.4013671875, -3.80322265625, -3.205078125, -2.60693359375, -2.0087890625, -1.41064453125, -0.8125, -0.21435546875, 0.3837890625, 0.98193359375, 1.580078125, 2.17822265625, 2.7763671875, 3.37451171875, 3.97265625, 4.57080078125, 5.1689453125, 5.76708984375, 6.365234375, 6.96337890625, 7.5615234375, 8.15966796875, 8.7578125, 9.35595703125, 9.9541015625, 10.55224609375, 11.150390625, 11.74853515625, 12.3466796875, 12.94482421875, 13.54296875, 14.14111328125, 14.7392578125, 15.33740234375, 15.935546875, 16.53369140625, 17.1318359375, 17.72998046875, 18.328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 13.0, 15.0, 30.0, 34.0, 46.0, 58.0, 89.0, 109.0, 152.0, 185.0, 271.0, 364.0, 480.0, 682.0, 958.0, 1249.0, 1935.0, 2969.0, 4760.0, 8425.0, 16355.0, 41489.0, 339272.0, 538964.0, 47705.0, 17895.0, 8898.0, 5086.0, 3133.0, 1978.0, 1373.0, 973.0, 674.0, 514.0, 342.0, 254.0, 220.0, 161.0, 109.0, 82.0, 58.0, 51.0, 35.0, 21.0, 19.0, 13.0, 11.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-57.0, -55.16455078125, -53.3291015625, -51.49365234375, -49.658203125, -47.82275390625, -45.9873046875, -44.15185546875, -42.31640625, -40.48095703125, -38.6455078125, -36.81005859375, -34.974609375, -33.13916015625, -31.3037109375, -29.46826171875, -27.6328125, -25.79736328125, -23.9619140625, -22.12646484375, -20.291015625, -18.45556640625, -16.6201171875, -14.78466796875, -12.94921875, -11.11376953125, -9.2783203125, -7.44287109375, -5.607421875, -3.77197265625, -1.9365234375, -0.10107421875, 1.734375, 3.56982421875, 5.4052734375, 7.24072265625, 9.076171875, 10.91162109375, 12.7470703125, 14.58251953125, 16.41796875, 18.25341796875, 20.0888671875, 21.92431640625, 23.759765625, 25.59521484375, 27.4306640625, 29.26611328125, 31.1015625, 32.93701171875, 34.7724609375, 36.60791015625, 38.443359375, 40.27880859375, 42.1142578125, 43.94970703125, 45.78515625, 47.62060546875, 49.4560546875, 51.29150390625, 53.126953125, 54.96240234375, 56.7978515625, 58.63330078125, 60.46875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 12.0, 13.0, 24.0, 18.0, 20.0, 14.0, 27.0, 45.0, 19.0, 26.0, 26.0, 45.0, 46.0, 32.0, 48.0, 44.0, 44.0, 40.0, 36.0, 44.0, 35.0, 40.0, 38.0, 31.0, 33.0, 34.0, 24.0, 18.0, 23.0, 15.0, 10.0, 10.0, 16.0, 4.0, 6.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.442626953125, -13.90087890625, -13.359130859375, -12.8173828125, -12.275634765625, -11.73388671875, -11.192138671875, -10.650390625, -10.108642578125, -9.56689453125, -9.025146484375, -8.4833984375, -7.941650390625, -7.39990234375, -6.858154296875, -6.31640625, -5.774658203125, -5.23291015625, -4.691162109375, -4.1494140625, -3.607666015625, -3.06591796875, -2.524169921875, -1.982421875, -1.440673828125, -0.89892578125, -0.357177734375, 0.1845703125, 0.726318359375, 1.26806640625, 1.809814453125, 2.3515625, 2.893310546875, 3.43505859375, 3.976806640625, 4.5185546875, 5.060302734375, 5.60205078125, 6.143798828125, 6.685546875, 7.227294921875, 7.76904296875, 8.310791015625, 8.8525390625, 9.394287109375, 9.93603515625, 10.477783203125, 11.01953125, 11.561279296875, 12.10302734375, 12.644775390625, 13.1865234375, 13.728271484375, 14.27001953125, 14.811767578125, 15.353515625, 15.895263671875, 16.43701171875, 16.978759765625, 17.5205078125, 18.062255859375, 18.60400390625, 19.145751953125, 19.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 13.0, 16.0, 22.0, 29.0, 44.0, 46.0, 81.0, 125.0, 157.0, 260.0, 328.0, 553.0, 866.0, 1443.0, 2769.0, 5806.0, 13560.0, 42424.0, 507421.0, 406914.0, 40060.0, 13161.0, 5751.0, 2748.0, 1483.0, 854.0, 524.0, 316.0, 220.0, 154.0, 117.0, 79.0, 55.0, 42.0, 24.0, 23.0, 14.0, 9.0, 6.0, 9.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-44.0625, -42.7265625, -41.390625, -40.0546875, -38.71875, -37.3828125, -36.046875, -34.7109375, -33.375, -32.0390625, -30.703125, -29.3671875, -28.03125, -26.6953125, -25.359375, -24.0234375, -22.6875, -21.3515625, -20.015625, -18.6796875, -17.34375, -16.0078125, -14.671875, -13.3359375, -12.0, -10.6640625, -9.328125, -7.9921875, -6.65625, -5.3203125, -3.984375, -2.6484375, -1.3125, 0.0234375, 1.359375, 2.6953125, 4.03125, 5.3671875, 6.703125, 8.0390625, 9.375, 10.7109375, 12.046875, 13.3828125, 14.71875, 16.0546875, 17.390625, 18.7265625, 20.0625, 21.3984375, 22.734375, 24.0703125, 25.40625, 26.7421875, 28.078125, 29.4140625, 30.75, 32.0859375, 33.421875, 34.7578125, 36.09375, 37.4296875, 38.765625, 40.1015625, 41.4375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 13.0, 9.0, 26.0, 33.0, 68.0, 91.0, 153.0, 205.0, 143.0, 104.0, 60.0, 32.0, 17.0, 9.0, 10.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020580291748046875, -0.0019996613264083862, -0.001941293478012085, -0.0018829256296157837, -0.0018245577812194824, -0.0017661899328231812, -0.0017078220844268799, -0.0016494542360305786, -0.0015910863876342773, -0.001532718539237976, -0.0014743506908416748, -0.0014159828424453735, -0.0013576149940490723, -0.001299247145652771, -0.0012408792972564697, -0.0011825114488601685, -0.0011241436004638672, -0.001065775752067566, -0.0010074079036712646, -0.0009490400552749634, -0.0008906722068786621, -0.0008323043584823608, -0.0007739365100860596, -0.0007155686616897583, -0.000657200813293457, -0.0005988329648971558, -0.0005404651165008545, -0.0004820972681045532, -0.00042372941970825195, -0.0003653615713119507, -0.0003069937229156494, -0.00024862587451934814, -0.00019025802612304688, -0.0001318901777267456, -7.352232933044434e-05, -1.5154480934143066e-05, 4.32133674621582e-05, 0.00010158121585845947, 0.00015994906425476074, 0.000218316912651062, 0.0002766847610473633, 0.00033505260944366455, 0.0003934204578399658, 0.0004517883062362671, 0.0005101561546325684, 0.0005685240030288696, 0.0006268918514251709, 0.0006852596998214722, 0.0007436275482177734, 0.0008019953966140747, 0.000860363245010376, 0.0009187310934066772, 0.0009770989418029785, 0.0010354667901992798, 0.001093834638595581, 0.0011522024869918823, 0.0012105703353881836, 0.0012689381837844849, 0.0013273060321807861, 0.0013856738805770874, 0.0014440417289733887, 0.00150240957736969, 0.0015607774257659912, 0.0016191452741622925, 0.0016775131225585938]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 15.0, 17.0, 38.0, 43.0, 49.0, 68.0, 113.0, 157.0, 249.0, 337.0, 517.0, 818.0, 1299.0, 2007.0, 3380.0, 5699.0, 9990.0, 19192.0, 40321.0, 103468.0, 431950.0, 280599.0, 77821.0, 32645.0, 16090.0, 8570.0, 4988.0, 2832.0, 1897.0, 1130.0, 722.0, 446.0, 318.0, 215.0, 171.0, 103.0, 77.0, 63.0, 33.0, 27.0, 15.0, 12.0, 12.0, 4.0, 4.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.8203125, -15.2906494140625, -14.760986328125, -14.2313232421875, -13.70166015625, -13.1719970703125, -12.642333984375, -12.1126708984375, -11.5830078125, -11.0533447265625, -10.523681640625, -9.9940185546875, -9.46435546875, -8.9346923828125, -8.405029296875, -7.8753662109375, -7.345703125, -6.8160400390625, -6.286376953125, -5.7567138671875, -5.22705078125, -4.6973876953125, -4.167724609375, -3.6380615234375, -3.1083984375, -2.5787353515625, -2.049072265625, -1.5194091796875, -0.98974609375, -0.4600830078125, 0.069580078125, 0.5992431640625, 1.12890625, 1.6585693359375, 2.188232421875, 2.7178955078125, 3.24755859375, 3.7772216796875, 4.306884765625, 4.8365478515625, 5.3662109375, 5.8958740234375, 6.425537109375, 6.9552001953125, 7.48486328125, 8.0145263671875, 8.544189453125, 9.0738525390625, 9.603515625, 10.1331787109375, 10.662841796875, 11.1925048828125, 11.72216796875, 12.2518310546875, 12.781494140625, 13.3111572265625, 13.8408203125, 14.3704833984375, 14.900146484375, 15.4298095703125, 15.95947265625, 16.4891357421875, 17.018798828125, 17.5484619140625, 18.078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 5.0, 6.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 10.0, 12.0, 20.0, 16.0, 19.0, 33.0, 34.0, 58.0, 68.0, 97.0, 90.0, 114.0, 95.0, 57.0, 45.0, 38.0, 37.0, 22.0, 24.0, 17.0, 16.0, 10.0, 12.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75, -2.64129638671875, -2.5325927734375, -2.42388916015625, -2.315185546875, -2.20648193359375, -2.0977783203125, -1.98907470703125, -1.88037109375, -1.77166748046875, -1.6629638671875, -1.55426025390625, -1.445556640625, -1.33685302734375, -1.2281494140625, -1.11944580078125, -1.0107421875, -0.90203857421875, -0.7933349609375, -0.68463134765625, -0.575927734375, -0.46722412109375, -0.3585205078125, -0.24981689453125, -0.14111328125, -0.03240966796875, 0.0762939453125, 0.18499755859375, 0.293701171875, 0.40240478515625, 0.5111083984375, 0.61981201171875, 0.728515625, 0.83721923828125, 0.9459228515625, 1.05462646484375, 1.163330078125, 1.27203369140625, 1.3807373046875, 1.48944091796875, 1.59814453125, 1.70684814453125, 1.8155517578125, 1.92425537109375, 2.032958984375, 2.14166259765625, 2.2503662109375, 2.35906982421875, 2.4677734375, 2.57647705078125, 2.6851806640625, 2.79388427734375, 2.902587890625, 3.01129150390625, 3.1199951171875, 3.22869873046875, 3.33740234375, 3.44610595703125, 3.5548095703125, 3.66351318359375, 3.772216796875, 3.88092041015625, 3.9896240234375, 4.09832763671875, 4.20703125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 22.0, 27.0, 47.0, 99.0, 163.0, 262.0, 138.0, 74.0, 47.0, 26.0, 25.0, 17.0, 10.0, 6.0, 6.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.34966278076172, -43.42988586425781, -41.510108947753906, -39.59033203125, -37.670555114746094, -35.75077819824219, -33.83100128173828, -31.911226272583008, -29.9914493560791, -28.071672439575195, -26.15189552307129, -24.232120513916016, -22.31234359741211, -20.392566680908203, -18.472789764404297, -16.55301284790039, -14.633235931396484, -12.713459014892578, -10.793682098388672, -8.873906135559082, -6.954129219055176, -5.0343523025512695, -3.1145763397216797, -1.1947994232177734, 0.7249774932861328, 2.64475417137146, 4.564530849456787, 6.484307289123535, 8.404084205627441, 10.323861122131348, 12.243637084960938, 14.163414001464844, 16.08319091796875, 18.002967834472656, 19.922744750976562, 21.84252166748047, 23.762298583984375, 25.68207550048828, 27.601850509643555, 29.52162742614746, 31.441404342651367, 33.36117935180664, 35.28095626831055, 37.20073318481445, 39.12051010131836, 41.040287017822266, 42.96006393432617, 44.87984085083008, 46.799617767333984, 48.71939468383789, 50.6391716003418, 52.5589485168457, 54.47872543334961, 56.398502349853516, 58.318275451660156, 60.23805236816406, 62.15782928466797, 64.07760620117188, 65.99738311767578, 67.91716003417969, 69.8369369506836, 71.7567138671875, 73.6764907836914, 75.59626770019531, 77.51604461669922]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 3.0, 13.0, 8.0, 16.0, 16.0, 15.0, 21.0, 16.0, 31.0, 18.0, 18.0, 36.0, 32.0, 22.0, 28.0, 31.0, 38.0, 33.0, 35.0, 30.0, 32.0, 32.0, 31.0, 38.0, 42.0, 29.0, 29.0, 28.0, 22.0, 28.0, 23.0, 27.0, 23.0, 14.0, 16.0, 17.0, 13.0, 9.0, 10.0, 10.0, 6.0, 11.0, 3.0, 2.0, 4.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.123363494873047, -14.638275146484375, -14.153185844421387, -13.668097496032715, -13.183009147644043, -12.697919845581055, -12.212831497192383, -11.727743148803711, -11.242654800415039, -10.757566452026367, -10.272477149963379, -9.787388801574707, -9.302300453186035, -8.817211151123047, -8.332122802734375, -7.847034454345703, -7.361945152282715, -6.876856327056885, -6.391767978668213, -5.906679153442383, -5.421590805053711, -4.936501979827881, -4.451413154602051, -3.9663245677948, -3.481235980987549, -2.996147394180298, -2.511058807373047, -2.025969982147217, -1.5408813953399658, -1.0557928085327148, -0.5707039833068848, -0.08561539649963379, 0.3994722366333008, 0.8845608830451965, 1.3696495294570923, 1.8547382354736328, 2.339826822280884, 2.8249154090881348, 3.310004234313965, 3.795092821121216, 4.280181407928467, 4.765270233154297, 5.250358581542969, 5.735447406768799, 6.220536231994629, 6.705624580383301, 7.190713405609131, 7.675802230834961, 8.160890579223633, 8.645978927612305, 9.131068229675293, 9.616156578063965, 10.101244926452637, 10.586334228515625, 11.071422576904297, 11.556510925292969, 12.04159927368164, 12.526687622070312, 13.0117769241333, 13.496865272521973, 13.981953620910645, 14.467042922973633, 14.952131271362305, 15.437219619750977, 15.922308921813965]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 12.0, 13.0, 14.0, 26.0, 36.0, 60.0, 80.0, 104.0, 167.0, 209.0, 322.0, 495.0, 774.0, 1134.0, 1789.0, 2936.0, 4651.0, 7478.0, 12424.0, 20902.0, 35336.0, 60699.0, 104903.0, 182049.0, 234797.0, 156912.0, 90402.0, 52378.0, 30617.0, 18185.0, 10841.0, 6591.0, 4049.0, 2501.0, 1584.0, 961.0, 680.0, 462.0, 305.0, 213.0, 153.0, 88.0, 61.0, 55.0, 37.0, 24.0, 13.0, 11.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-29.171875, -28.2705078125, -27.369140625, -26.4677734375, -25.56640625, -24.6650390625, -23.763671875, -22.8623046875, -21.9609375, -21.0595703125, -20.158203125, -19.2568359375, -18.35546875, -17.4541015625, -16.552734375, -15.6513671875, -14.75, -13.8486328125, -12.947265625, -12.0458984375, -11.14453125, -10.2431640625, -9.341796875, -8.4404296875, -7.5390625, -6.6376953125, -5.736328125, -4.8349609375, -3.93359375, -3.0322265625, -2.130859375, -1.2294921875, -0.328125, 0.5732421875, 1.474609375, 2.3759765625, 3.27734375, 4.1787109375, 5.080078125, 5.9814453125, 6.8828125, 7.7841796875, 8.685546875, 9.5869140625, 10.48828125, 11.3896484375, 12.291015625, 13.1923828125, 14.09375, 14.9951171875, 15.896484375, 16.7978515625, 17.69921875, 18.6005859375, 19.501953125, 20.4033203125, 21.3046875, 22.2060546875, 23.107421875, 24.0087890625, 24.91015625, 25.8115234375, 26.712890625, 27.6142578125, 28.515625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 15.0, 8.0, 9.0, 7.0, 16.0, 22.0, 20.0, 23.0, 20.0, 34.0, 38.0, 33.0, 41.0, 40.0, 30.0, 41.0, 37.0, 38.0, 47.0, 40.0, 44.0, 37.0, 42.0, 36.0, 30.0, 23.0, 35.0, 28.0, 25.0, 14.0, 13.0, 18.0, 18.0, 15.0, 7.0, 10.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.953125, -14.433349609375, -13.91357421875, -13.393798828125, -12.8740234375, -12.354248046875, -11.83447265625, -11.314697265625, -10.794921875, -10.275146484375, -9.75537109375, -9.235595703125, -8.7158203125, -8.196044921875, -7.67626953125, -7.156494140625, -6.63671875, -6.116943359375, -5.59716796875, -5.077392578125, -4.5576171875, -4.037841796875, -3.51806640625, -2.998291015625, -2.478515625, -1.958740234375, -1.43896484375, -0.919189453125, -0.3994140625, 0.120361328125, 0.64013671875, 1.159912109375, 1.6796875, 2.199462890625, 2.71923828125, 3.239013671875, 3.7587890625, 4.278564453125, 4.79833984375, 5.318115234375, 5.837890625, 6.357666015625, 6.87744140625, 7.397216796875, 7.9169921875, 8.436767578125, 8.95654296875, 9.476318359375, 9.99609375, 10.515869140625, 11.03564453125, 11.555419921875, 12.0751953125, 12.594970703125, 13.11474609375, 13.634521484375, 14.154296875, 14.674072265625, 15.19384765625, 15.713623046875, 16.2333984375, 16.753173828125, 17.27294921875, 17.792724609375, 18.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 2.0, 8.0, 15.0, 20.0, 34.0, 42.0, 68.0, 100.0, 145.0, 247.0, 407.0, 667.0, 1044.0, 1800.0, 3004.0, 5355.0, 10120.0, 20035.0, 42124.0, 97654.0, 249860.0, 348615.0, 148126.0, 60865.0, 27640.0, 13644.0, 7284.0, 3969.0, 2241.0, 1270.0, 828.0, 457.0, 302.0, 194.0, 135.0, 69.0, 54.0, 38.0, 26.0, 15.0, 13.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-45.40625, -44.15283203125, -42.8994140625, -41.64599609375, -40.392578125, -39.13916015625, -37.8857421875, -36.63232421875, -35.37890625, -34.12548828125, -32.8720703125, -31.61865234375, -30.365234375, -29.11181640625, -27.8583984375, -26.60498046875, -25.3515625, -24.09814453125, -22.8447265625, -21.59130859375, -20.337890625, -19.08447265625, -17.8310546875, -16.57763671875, -15.32421875, -14.07080078125, -12.8173828125, -11.56396484375, -10.310546875, -9.05712890625, -7.8037109375, -6.55029296875, -5.296875, -4.04345703125, -2.7900390625, -1.53662109375, -0.283203125, 0.97021484375, 2.2236328125, 3.47705078125, 4.73046875, 5.98388671875, 7.2373046875, 8.49072265625, 9.744140625, 10.99755859375, 12.2509765625, 13.50439453125, 14.7578125, 16.01123046875, 17.2646484375, 18.51806640625, 19.771484375, 21.02490234375, 22.2783203125, 23.53173828125, 24.78515625, 26.03857421875, 27.2919921875, 28.54541015625, 29.798828125, 31.05224609375, 32.3056640625, 33.55908203125, 34.8125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 0.0, 8.0, 7.0, 7.0, 17.0, 12.0, 19.0, 15.0, 28.0, 22.0, 29.0, 39.0, 25.0, 42.0, 45.0, 49.0, 39.0, 54.0, 40.0, 57.0, 38.0, 41.0, 51.0, 34.0, 31.0, 41.0, 27.0, 30.0, 27.0, 22.0, 23.0, 16.0, 12.0, 11.0, 7.0, 10.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5859375, -12.1697998046875, -11.753662109375, -11.3375244140625, -10.92138671875, -10.5052490234375, -10.089111328125, -9.6729736328125, -9.2568359375, -8.8406982421875, -8.424560546875, -8.0084228515625, -7.59228515625, -7.1761474609375, -6.760009765625, -6.3438720703125, -5.927734375, -5.5115966796875, -5.095458984375, -4.6793212890625, -4.26318359375, -3.8470458984375, -3.430908203125, -3.0147705078125, -2.5986328125, -2.1824951171875, -1.766357421875, -1.3502197265625, -0.93408203125, -0.5179443359375, -0.101806640625, 0.3143310546875, 0.73046875, 1.1466064453125, 1.562744140625, 1.9788818359375, 2.39501953125, 2.8111572265625, 3.227294921875, 3.6434326171875, 4.0595703125, 4.4757080078125, 4.891845703125, 5.3079833984375, 5.72412109375, 6.1402587890625, 6.556396484375, 6.9725341796875, 7.388671875, 7.8048095703125, 8.220947265625, 8.6370849609375, 9.05322265625, 9.4693603515625, 9.885498046875, 10.3016357421875, 10.7177734375, 11.1339111328125, 11.550048828125, 11.9661865234375, 12.38232421875, 12.7984619140625, 13.214599609375, 13.6307373046875, 14.046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 10.0, 10.0, 11.0, 8.0, 18.0, 28.0, 50.0, 73.0, 129.0, 175.0, 253.0, 465.0, 692.0, 1132.0, 2057.0, 4185.0, 8959.0, 23739.0, 85553.0, 715135.0, 149632.0, 33178.0, 11801.0, 5194.0, 2465.0, 1364.0, 860.0, 499.0, 279.0, 191.0, 125.0, 98.0, 68.0, 39.0, 34.0, 14.0, 4.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-99.5625, -96.4169921875, -93.271484375, -90.1259765625, -86.98046875, -83.8349609375, -80.689453125, -77.5439453125, -74.3984375, -71.2529296875, -68.107421875, -64.9619140625, -61.81640625, -58.6708984375, -55.525390625, -52.3798828125, -49.234375, -46.0888671875, -42.943359375, -39.7978515625, -36.65234375, -33.5068359375, -30.361328125, -27.2158203125, -24.0703125, -20.9248046875, -17.779296875, -14.6337890625, -11.48828125, -8.3427734375, -5.197265625, -2.0517578125, 1.09375, 4.2392578125, 7.384765625, 10.5302734375, 13.67578125, 16.8212890625, 19.966796875, 23.1123046875, 26.2578125, 29.4033203125, 32.548828125, 35.6943359375, 38.83984375, 41.9853515625, 45.130859375, 48.2763671875, 51.421875, 54.5673828125, 57.712890625, 60.8583984375, 64.00390625, 67.1494140625, 70.294921875, 73.4404296875, 76.5859375, 79.7314453125, 82.876953125, 86.0224609375, 89.16796875, 92.3134765625, 95.458984375, 98.6044921875, 101.75]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 7.0, 13.0, 15.0, 15.0, 33.0, 47.0, 49.0, 61.0, 107.0, 170.0, 132.0, 75.0, 71.0, 52.0, 34.0, 41.0, 12.0, 14.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0039520263671875, -0.0038504600524902344, -0.0037488937377929688, -0.003647327423095703, -0.0035457611083984375, -0.003444194793701172, -0.0033426284790039062, -0.0032410621643066406, -0.003139495849609375, -0.0030379295349121094, -0.0029363632202148438, -0.002834796905517578, -0.0027332305908203125, -0.002631664276123047, -0.0025300979614257812, -0.0024285316467285156, -0.00232696533203125, -0.0022253990173339844, -0.0021238327026367188, -0.002022266387939453, -0.0019207000732421875, -0.0018191337585449219, -0.0017175674438476562, -0.0016160011291503906, -0.001514434814453125, -0.0014128684997558594, -0.0013113021850585938, -0.0012097358703613281, -0.0011081695556640625, -0.0010066032409667969, -0.0009050369262695312, -0.0008034706115722656, -0.000701904296875, -0.0006003379821777344, -0.0004987716674804688, -0.0003972053527832031, -0.0002956390380859375, -0.00019407272338867188, -9.250640869140625e-05, 9.059906005859375e-06, 0.000110626220703125, 0.00021219253540039062, 0.00031375885009765625, 0.0004153251647949219, 0.0005168914794921875, 0.0006184577941894531, 0.0007200241088867188, 0.0008215904235839844, 0.00092315673828125, 0.0010247230529785156, 0.0011262893676757812, 0.0012278556823730469, 0.0013294219970703125, 0.0014309883117675781, 0.0015325546264648438, 0.0016341209411621094, 0.001735687255859375, 0.0018372535705566406, 0.0019388198852539062, 0.002040386199951172, 0.0021419525146484375, 0.002243518829345703, 0.0023450851440429688, 0.0024466514587402344, 0.0025482177734375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 3.0, 11.0, 6.0, 9.0, 20.0, 26.0, 42.0, 54.0, 76.0, 128.0, 172.0, 281.0, 426.0, 683.0, 1259.0, 2329.0, 5047.0, 13683.0, 55939.0, 756397.0, 170190.0, 25920.0, 8222.0, 3447.0, 1653.0, 950.0, 578.0, 337.0, 199.0, 127.0, 105.0, 74.0, 50.0, 36.0, 18.0, 20.0, 10.0, 8.0, 3.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.5625, -89.2275390625, -85.892578125, -82.5576171875, -79.22265625, -75.8876953125, -72.552734375, -69.2177734375, -65.8828125, -62.5478515625, -59.212890625, -55.8779296875, -52.54296875, -49.2080078125, -45.873046875, -42.5380859375, -39.203125, -35.8681640625, -32.533203125, -29.1982421875, -25.86328125, -22.5283203125, -19.193359375, -15.8583984375, -12.5234375, -9.1884765625, -5.853515625, -2.5185546875, 0.81640625, 4.1513671875, 7.486328125, 10.8212890625, 14.15625, 17.4912109375, 20.826171875, 24.1611328125, 27.49609375, 30.8310546875, 34.166015625, 37.5009765625, 40.8359375, 44.1708984375, 47.505859375, 50.8408203125, 54.17578125, 57.5107421875, 60.845703125, 64.1806640625, 67.515625, 70.8505859375, 74.185546875, 77.5205078125, 80.85546875, 84.1904296875, 87.525390625, 90.8603515625, 94.1953125, 97.5302734375, 100.865234375, 104.2001953125, 107.53515625, 110.8701171875, 114.205078125, 117.5400390625, 120.875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 8.0, 10.0, 9.0, 17.0, 38.0, 49.0, 66.0, 74.0, 111.0, 208.0, 116.0, 82.0, 52.0, 43.0, 32.0, 19.0, 12.0, 10.0, 8.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.984375, -23.3780517578125, -22.771728515625, -22.1654052734375, -21.55908203125, -20.9527587890625, -20.346435546875, -19.7401123046875, -19.1337890625, -18.5274658203125, -17.921142578125, -17.3148193359375, -16.70849609375, -16.1021728515625, -15.495849609375, -14.8895263671875, -14.283203125, -13.6768798828125, -13.070556640625, -12.4642333984375, -11.85791015625, -11.2515869140625, -10.645263671875, -10.0389404296875, -9.4326171875, -8.8262939453125, -8.219970703125, -7.6136474609375, -7.00732421875, -6.4010009765625, -5.794677734375, -5.1883544921875, -4.58203125, -3.9757080078125, -3.369384765625, -2.7630615234375, -2.15673828125, -1.5504150390625, -0.944091796875, -0.3377685546875, 0.2685546875, 0.8748779296875, 1.481201171875, 2.0875244140625, 2.69384765625, 3.3001708984375, 3.906494140625, 4.5128173828125, 5.119140625, 5.7254638671875, 6.331787109375, 6.9381103515625, 7.54443359375, 8.1507568359375, 8.757080078125, 9.3634033203125, 9.9697265625, 10.5760498046875, 11.182373046875, 11.7886962890625, 12.39501953125, 13.0013427734375, 13.607666015625, 14.2139892578125, 14.8203125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 13.0, 30.0, 59.0, 92.0, 194.0, 217.0, 121.0, 72.0, 52.0, 28.0, 25.0, 20.0, 12.0, 13.0, 9.0, 1.0, 11.0, 4.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.573490142822266, -41.906944274902344, -40.24039840698242, -38.5738525390625, -36.90730667114258, -35.240760803222656, -33.57421112060547, -31.907665252685547, -30.241119384765625, -28.574573516845703, -26.90802764892578, -25.24148178100586, -23.574934005737305, -21.908388137817383, -20.24184226989746, -18.575294494628906, -16.908750534057617, -15.242204666137695, -13.575657844543457, -11.909111976623535, -10.242565155029297, -8.576019287109375, -6.909473419189453, -5.242926597595215, -3.576380729675293, -1.9098345041275024, -0.24328827857971191, 1.423257827758789, 3.089804172515869, 4.756350517272949, 6.422896385192871, 8.08944320678711, 9.755989074707031, 11.422534942626953, 13.089081764221191, 14.755627632141113, 16.42217445373535, 18.088720321655273, 19.755266189575195, 21.42181396484375, 23.088359832763672, 24.754905700683594, 26.421451568603516, 28.087997436523438, 29.754545211791992, 31.421091079711914, 33.08763885498047, 34.75418472290039, 36.42073059082031, 38.087276458740234, 39.753822326660156, 41.42036819458008, 43.0869140625, 44.75346374511719, 46.420005798339844, 48.08655548095703, 49.75309753417969, 51.41964340209961, 53.08618927001953, 54.75273513793945, 56.419281005859375, 58.08583068847656, 59.75237274169922, 61.418922424316406, 63.08546829223633]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 20.0, 13.0, 21.0, 23.0, 29.0, 13.0, 29.0, 28.0, 33.0, 35.0, 24.0, 36.0, 46.0, 34.0, 42.0, 57.0, 38.0, 36.0, 45.0, 42.0, 33.0, 42.0, 32.0, 35.0, 19.0, 20.0, 17.0, 24.0, 17.0, 17.0, 16.0, 12.0, 11.0, 5.0, 5.0, 7.0, 9.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.829206466674805, -16.264965057373047, -15.700721740722656, -15.136479377746582, -14.572237014770508, -14.00799560546875, -13.443753242492676, -12.879510879516602, -12.315268516540527, -11.751026153564453, -11.186783790588379, -10.622541427612305, -10.058300018310547, -9.494056701660156, -8.929815292358398, -8.365572929382324, -7.80133056640625, -7.237088203430176, -6.672845840454102, -6.1086039543151855, -5.544361591339111, -4.980119228363037, -4.415877342224121, -3.851634979248047, -3.2873926162719727, -2.7231502532958984, -2.1589081287384033, -1.5946658849716187, -1.030423641204834, -0.46618127822875977, 0.09806084632873535, 0.6623029708862305, 1.2265472412109375, 1.7907894849777222, 2.355031728744507, 2.919273853302002, 3.483516216278076, 4.04775857925415, 4.612000465393066, 5.176242828369141, 5.740485191345215, 6.304727554321289, 6.868969917297363, 7.433211803436279, 7.9974541664123535, 8.561697006225586, 9.125938415527344, 9.690180778503418, 10.254423141479492, 10.818665504455566, 11.38290786743164, 11.947150230407715, 12.511392593383789, 13.075634002685547, 13.639876365661621, 14.204118728637695, 14.76836109161377, 15.332603454589844, 15.896845817565918, 16.461088180541992, 17.02532958984375, 17.58957290649414, 18.1538143157959, 18.718055725097656, 19.282299041748047]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 13.0, 27.0, 35.0, 46.0, 67.0, 103.0, 139.0, 215.0, 301.0, 528.0, 787.0, 1148.0, 1703.0, 2766.0, 4323.0, 6707.0, 10810.0, 17829.0, 30597.0, 55231.0, 111427.0, 288500.0, 1226827.0, 1727739.0, 404846.0, 142383.0, 68294.0, 36281.0, 20978.0, 12485.0, 7812.0, 4947.0, 3020.0, 2001.0, 1208.0, 830.0, 532.0, 285.0, 197.0, 114.0, 73.0, 51.0, 23.0, 22.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.265625, -27.412841796875, -26.56005859375, -25.707275390625, -24.8544921875, -24.001708984375, -23.14892578125, -22.296142578125, -21.443359375, -20.590576171875, -19.73779296875, -18.885009765625, -18.0322265625, -17.179443359375, -16.32666015625, -15.473876953125, -14.62109375, -13.768310546875, -12.91552734375, -12.062744140625, -11.2099609375, -10.357177734375, -9.50439453125, -8.651611328125, -7.798828125, -6.946044921875, -6.09326171875, -5.240478515625, -4.3876953125, -3.534912109375, -2.68212890625, -1.829345703125, -0.9765625, -0.123779296875, 0.72900390625, 1.581787109375, 2.4345703125, 3.287353515625, 4.14013671875, 4.992919921875, 5.845703125, 6.698486328125, 7.55126953125, 8.404052734375, 9.2568359375, 10.109619140625, 10.96240234375, 11.815185546875, 12.66796875, 13.520751953125, 14.37353515625, 15.226318359375, 16.0791015625, 16.931884765625, 17.78466796875, 18.637451171875, 19.490234375, 20.343017578125, 21.19580078125, 22.048583984375, 22.9013671875, 23.754150390625, 24.60693359375, 25.459716796875, 26.3125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 5.0, 9.0, 11.0, 15.0, 14.0, 24.0, 30.0, 25.0, 28.0, 25.0, 35.0, 34.0, 35.0, 46.0, 43.0, 46.0, 52.0, 36.0, 38.0, 53.0, 46.0, 44.0, 46.0, 38.0, 29.0, 33.0, 27.0, 26.0, 18.0, 17.0, 18.0, 12.0, 11.0, 5.0, 7.0, 8.0, 4.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.2802734375, -9.943359375, -9.6064453125, -9.26953125, -8.9326171875, -8.595703125, -8.2587890625, -7.921875, -7.5849609375, -7.248046875, -6.9111328125, -6.57421875, -6.2373046875, -5.900390625, -5.5634765625, -5.2265625, -4.8896484375, -4.552734375, -4.2158203125, -3.87890625, -3.5419921875, -3.205078125, -2.8681640625, -2.53125, -2.1943359375, -1.857421875, -1.5205078125, -1.18359375, -0.8466796875, -0.509765625, -0.1728515625, 0.1640625, 0.5009765625, 0.837890625, 1.1748046875, 1.51171875, 1.8486328125, 2.185546875, 2.5224609375, 2.859375, 3.1962890625, 3.533203125, 3.8701171875, 4.20703125, 4.5439453125, 4.880859375, 5.2177734375, 5.5546875, 5.8916015625, 6.228515625, 6.5654296875, 6.90234375, 7.2392578125, 7.576171875, 7.9130859375, 8.25, 8.5869140625, 8.923828125, 9.2607421875, 9.59765625, 9.9345703125, 10.271484375, 10.6083984375, 10.9453125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 26.0, 21.0, 31.0, 49.0, 66.0, 90.0, 125.0, 177.0, 248.0, 369.0, 574.0, 828.0, 1190.0, 1831.0, 2733.0, 4467.0, 7000.0, 11807.0, 20697.0, 38613.0, 79645.0, 186859.0, 558586.0, 1944172.0, 865237.0, 255500.0, 101664.0, 48415.0, 25300.0, 14357.0, 8622.0, 5280.0, 3297.0, 2191.0, 1382.0, 908.0, 620.0, 444.0, 281.0, 167.0, 126.0, 84.0, 72.0, 35.0, 39.0, 16.0, 13.0, 10.0, 3.0, 2.0, 4.0, 2.0, 2.0], "bins": [-25.84375, -25.09814453125, -24.3525390625, -23.60693359375, -22.861328125, -22.11572265625, -21.3701171875, -20.62451171875, -19.87890625, -19.13330078125, -18.3876953125, -17.64208984375, -16.896484375, -16.15087890625, -15.4052734375, -14.65966796875, -13.9140625, -13.16845703125, -12.4228515625, -11.67724609375, -10.931640625, -10.18603515625, -9.4404296875, -8.69482421875, -7.94921875, -7.20361328125, -6.4580078125, -5.71240234375, -4.966796875, -4.22119140625, -3.4755859375, -2.72998046875, -1.984375, -1.23876953125, -0.4931640625, 0.25244140625, 0.998046875, 1.74365234375, 2.4892578125, 3.23486328125, 3.98046875, 4.72607421875, 5.4716796875, 6.21728515625, 6.962890625, 7.70849609375, 8.4541015625, 9.19970703125, 9.9453125, 10.69091796875, 11.4365234375, 12.18212890625, 12.927734375, 13.67333984375, 14.4189453125, 15.16455078125, 15.91015625, 16.65576171875, 17.4013671875, 18.14697265625, 18.892578125, 19.63818359375, 20.3837890625, 21.12939453125, 21.875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 18.0, 13.0, 23.0, 17.0, 30.0, 34.0, 41.0, 49.0, 79.0, 72.0, 96.0, 119.0, 117.0, 158.0, 207.0, 243.0, 314.0, 309.0, 321.0, 329.0, 232.0, 214.0, 172.0, 142.0, 109.0, 100.0, 83.0, 74.0, 56.0, 44.0, 37.0, 26.0, 21.0, 22.0, 16.0, 18.0, 17.0, 18.0, 18.0, 9.0, 10.0, 10.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.921875, -4.76043701171875, -4.5989990234375, -4.43756103515625, -4.276123046875, -4.11468505859375, -3.9532470703125, -3.79180908203125, -3.63037109375, -3.46893310546875, -3.3074951171875, -3.14605712890625, -2.984619140625, -2.82318115234375, -2.6617431640625, -2.50030517578125, -2.3388671875, -2.17742919921875, -2.0159912109375, -1.85455322265625, -1.693115234375, -1.53167724609375, -1.3702392578125, -1.20880126953125, -1.04736328125, -0.88592529296875, -0.7244873046875, -0.56304931640625, -0.401611328125, -0.24017333984375, -0.0787353515625, 0.08270263671875, 0.244140625, 0.40557861328125, 0.5670166015625, 0.72845458984375, 0.889892578125, 1.05133056640625, 1.2127685546875, 1.37420654296875, 1.53564453125, 1.69708251953125, 1.8585205078125, 2.01995849609375, 2.181396484375, 2.34283447265625, 2.5042724609375, 2.66571044921875, 2.8271484375, 2.98858642578125, 3.1500244140625, 3.31146240234375, 3.472900390625, 3.63433837890625, 3.7957763671875, 3.95721435546875, 4.11865234375, 4.28009033203125, 4.4415283203125, 4.60296630859375, 4.764404296875, 4.92584228515625, 5.0872802734375, 5.24871826171875, 5.41015625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 4.0, 8.0, 18.0, 20.0, 20.0, 34.0, 57.0, 63.0, 137.0, 148.0, 157.0, 82.0, 73.0, 54.0, 38.0, 17.0, 12.0, 10.0, 4.0, 11.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.900720596313477, -24.07403564453125, -23.24734878540039, -22.420663833618164, -21.593978881835938, -20.767292022705078, -19.94060707092285, -19.113922119140625, -18.287235260009766, -17.46055030822754, -16.63386344909668, -15.807178497314453, -14.980493545532227, -14.153807640075684, -13.32712173461914, -12.500436782836914, -11.673751831054688, -10.847065925598145, -10.020380973815918, -9.193695068359375, -8.367010116577148, -7.5403242111206055, -6.7136383056640625, -5.886952877044678, -5.060267448425293, -4.233582019805908, -3.4068963527679443, -2.5802106857299805, -1.7535252571105957, -0.9268398284912109, -0.10015392303466797, 0.7265315055847168, 1.5532188415527344, 2.379904270172119, 3.206589937210083, 4.033275604248047, 4.859961032867432, 5.686646461486816, 6.513332366943359, 7.340017795562744, 8.166703224182129, 8.993389129638672, 9.820074081420898, 10.646759986877441, 11.473445892333984, 12.300130844116211, 13.126816749572754, 13.953502655029297, 14.780187606811523, 15.606873512268066, 16.43355941772461, 17.260244369506836, 18.086929321289062, 18.913616180419922, 19.74030113220215, 20.566986083984375, 21.393672943115234, 22.22035789489746, 23.04704475402832, 23.873729705810547, 24.700414657592773, 25.527099609375, 26.35378646850586, 27.180471420288086, 28.007156372070312]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 2.0, 8.0, 10.0, 9.0, 9.0, 8.0, 26.0, 12.0, 16.0, 23.0, 25.0, 27.0, 28.0, 28.0, 31.0, 30.0, 31.0, 28.0, 41.0, 41.0, 44.0, 35.0, 40.0, 38.0, 32.0, 33.0, 41.0, 35.0, 23.0, 26.0, 31.0, 27.0, 28.0, 14.0, 21.0, 14.0, 12.0, 11.0, 9.0, 8.0, 7.0, 5.0, 8.0, 2.0, 9.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.787965774536133, -9.46242904663086, -9.136892318725586, -8.811356544494629, -8.485819816589355, -8.160283088684082, -7.834746837615967, -7.509210586547852, -7.183673858642578, -6.858137130737305, -6.5326008796691895, -6.207064628601074, -5.881527900695801, -5.555991172790527, -5.230454921722412, -4.904918670654297, -4.579381942749023, -4.25384521484375, -3.9283089637756348, -3.6027724742889404, -3.277235984802246, -2.9516994953155518, -2.6261630058288574, -2.300626516342163, -1.9750900268554688, -1.6495535373687744, -1.32401704788208, -0.9984805583953857, -0.6729440689086914, -0.34740757942199707, -0.021871089935302734, 0.3036653995513916, 0.6292018890380859, 0.9547383785247803, 1.2802748680114746, 1.605811357498169, 1.9313478469848633, 2.2568843364715576, 2.582420825958252, 2.9079573154449463, 3.2334938049316406, 3.559030294418335, 3.8845667839050293, 4.2101030349731445, 4.535639762878418, 4.861176490783691, 5.186712741851807, 5.512248992919922, 5.837785720825195, 6.163322448730469, 6.488858699798584, 6.814394950866699, 7.139931678771973, 7.465468406677246, 7.791004657745361, 8.116540908813477, 8.44207763671875, 8.767614364624023, 9.093151092529297, 9.418686866760254, 9.744223594665527, 10.0697603225708, 10.395296096801758, 10.720832824707031, 11.046369552612305]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 4.0, 7.0, 9.0, 15.0, 22.0, 48.0, 65.0, 75.0, 117.0, 146.0, 239.0, 343.0, 512.0, 795.0, 1124.0, 1668.0, 2663.0, 4103.0, 6646.0, 11252.0, 20200.0, 39471.0, 89296.0, 295751.0, 371620.0, 103205.0, 44104.0, 22699.0, 12194.0, 7340.0, 4492.0, 2789.0, 1868.0, 1195.0, 825.0, 536.0, 359.0, 266.0, 155.0, 109.0, 72.0, 53.0, 42.0, 25.0, 11.0, 11.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.7822265625, -16.205078125, -15.6279296875, -15.05078125, -14.4736328125, -13.896484375, -13.3193359375, -12.7421875, -12.1650390625, -11.587890625, -11.0107421875, -10.43359375, -9.8564453125, -9.279296875, -8.7021484375, -8.125, -7.5478515625, -6.970703125, -6.3935546875, -5.81640625, -5.2392578125, -4.662109375, -4.0849609375, -3.5078125, -2.9306640625, -2.353515625, -1.7763671875, -1.19921875, -0.6220703125, -0.044921875, 0.5322265625, 1.109375, 1.6865234375, 2.263671875, 2.8408203125, 3.41796875, 3.9951171875, 4.572265625, 5.1494140625, 5.7265625, 6.3037109375, 6.880859375, 7.4580078125, 8.03515625, 8.6123046875, 9.189453125, 9.7666015625, 10.34375, 10.9208984375, 11.498046875, 12.0751953125, 12.65234375, 13.2294921875, 13.806640625, 14.3837890625, 14.9609375, 15.5380859375, 16.115234375, 16.6923828125, 17.26953125, 17.8466796875, 18.423828125, 19.0009765625, 19.578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 9.0, 15.0, 18.0, 15.0, 16.0, 16.0, 27.0, 18.0, 24.0, 28.0, 30.0, 35.0, 41.0, 43.0, 42.0, 40.0, 37.0, 47.0, 44.0, 40.0, 43.0, 47.0, 31.0, 37.0, 37.0, 29.0, 25.0, 17.0, 21.0, 23.0, 7.0, 16.0, 8.0, 6.0, 9.0, 9.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-12.1171875, -11.7724609375, -11.427734375, -11.0830078125, -10.73828125, -10.3935546875, -10.048828125, -9.7041015625, -9.359375, -9.0146484375, -8.669921875, -8.3251953125, -7.98046875, -7.6357421875, -7.291015625, -6.9462890625, -6.6015625, -6.2568359375, -5.912109375, -5.5673828125, -5.22265625, -4.8779296875, -4.533203125, -4.1884765625, -3.84375, -3.4990234375, -3.154296875, -2.8095703125, -2.46484375, -2.1201171875, -1.775390625, -1.4306640625, -1.0859375, -0.7412109375, -0.396484375, -0.0517578125, 0.29296875, 0.6376953125, 0.982421875, 1.3271484375, 1.671875, 2.0166015625, 2.361328125, 2.7060546875, 3.05078125, 3.3955078125, 3.740234375, 4.0849609375, 4.4296875, 4.7744140625, 5.119140625, 5.4638671875, 5.80859375, 6.1533203125, 6.498046875, 6.8427734375, 7.1875, 7.5322265625, 7.876953125, 8.2216796875, 8.56640625, 8.9111328125, 9.255859375, 9.6005859375, 9.9453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 5.0, 6.0, 11.0, 18.0, 36.0, 44.0, 52.0, 51.0, 99.0, 127.0, 185.0, 211.0, 317.0, 432.0, 566.0, 798.0, 1106.0, 1760.0, 2744.0, 4486.0, 8241.0, 16833.0, 47299.0, 604867.0, 287673.0, 36929.0, 14268.0, 7244.0, 4036.0, 2541.0, 1653.0, 1098.0, 773.0, 514.0, 431.0, 306.0, 207.0, 156.0, 116.0, 68.0, 65.0, 53.0, 35.0, 23.0, 19.0, 10.0, 17.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-27.515625, -26.625244140625, -25.73486328125, -24.844482421875, -23.9541015625, -23.063720703125, -22.17333984375, -21.282958984375, -20.392578125, -19.502197265625, -18.61181640625, -17.721435546875, -16.8310546875, -15.940673828125, -15.05029296875, -14.159912109375, -13.26953125, -12.379150390625, -11.48876953125, -10.598388671875, -9.7080078125, -8.817626953125, -7.92724609375, -7.036865234375, -6.146484375, -5.256103515625, -4.36572265625, -3.475341796875, -2.5849609375, -1.694580078125, -0.80419921875, 0.086181640625, 0.9765625, 1.866943359375, 2.75732421875, 3.647705078125, 4.5380859375, 5.428466796875, 6.31884765625, 7.209228515625, 8.099609375, 8.989990234375, 9.88037109375, 10.770751953125, 11.6611328125, 12.551513671875, 13.44189453125, 14.332275390625, 15.22265625, 16.113037109375, 17.00341796875, 17.893798828125, 18.7841796875, 19.674560546875, 20.56494140625, 21.455322265625, 22.345703125, 23.236083984375, 24.12646484375, 25.016845703125, 25.9072265625, 26.797607421875, 27.68798828125, 28.578369140625, 29.46875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 4.0, 14.0, 11.0, 15.0, 12.0, 20.0, 23.0, 29.0, 32.0, 30.0, 30.0, 40.0, 46.0, 34.0, 48.0, 59.0, 48.0, 48.0, 33.0, 42.0, 42.0, 41.0, 41.0, 35.0, 35.0, 30.0, 22.0, 27.0, 15.0, 16.0, 9.0, 8.0, 12.0, 3.0, 6.0, 8.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.0859375, -8.78173828125, -8.4775390625, -8.17333984375, -7.869140625, -7.56494140625, -7.2607421875, -6.95654296875, -6.65234375, -6.34814453125, -6.0439453125, -5.73974609375, -5.435546875, -5.13134765625, -4.8271484375, -4.52294921875, -4.21875, -3.91455078125, -3.6103515625, -3.30615234375, -3.001953125, -2.69775390625, -2.3935546875, -2.08935546875, -1.78515625, -1.48095703125, -1.1767578125, -0.87255859375, -0.568359375, -0.26416015625, 0.0400390625, 0.34423828125, 0.6484375, 0.95263671875, 1.2568359375, 1.56103515625, 1.865234375, 2.16943359375, 2.4736328125, 2.77783203125, 3.08203125, 3.38623046875, 3.6904296875, 3.99462890625, 4.298828125, 4.60302734375, 4.9072265625, 5.21142578125, 5.515625, 5.81982421875, 6.1240234375, 6.42822265625, 6.732421875, 7.03662109375, 7.3408203125, 7.64501953125, 7.94921875, 8.25341796875, 8.5576171875, 8.86181640625, 9.166015625, 9.47021484375, 9.7744140625, 10.07861328125, 10.3828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 6.0, 13.0, 12.0, 11.0, 8.0, 21.0, 31.0, 39.0, 63.0, 51.0, 103.0, 155.0, 187.0, 303.0, 465.0, 663.0, 1044.0, 1803.0, 3252.0, 6575.0, 15694.0, 48434.0, 608509.0, 295336.0, 38981.0, 13473.0, 5859.0, 2971.0, 1625.0, 966.0, 587.0, 377.0, 282.0, 166.0, 127.0, 90.0, 79.0, 44.0, 32.0, 26.0, 30.0, 22.0, 11.0, 5.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-15.875, -15.361572265625, -14.84814453125, -14.334716796875, -13.8212890625, -13.307861328125, -12.79443359375, -12.281005859375, -11.767578125, -11.254150390625, -10.74072265625, -10.227294921875, -9.7138671875, -9.200439453125, -8.68701171875, -8.173583984375, -7.66015625, -7.146728515625, -6.63330078125, -6.119873046875, -5.6064453125, -5.093017578125, -4.57958984375, -4.066162109375, -3.552734375, -3.039306640625, -2.52587890625, -2.012451171875, -1.4990234375, -0.985595703125, -0.47216796875, 0.041259765625, 0.5546875, 1.068115234375, 1.58154296875, 2.094970703125, 2.6083984375, 3.121826171875, 3.63525390625, 4.148681640625, 4.662109375, 5.175537109375, 5.68896484375, 6.202392578125, 6.7158203125, 7.229248046875, 7.74267578125, 8.256103515625, 8.76953125, 9.282958984375, 9.79638671875, 10.309814453125, 10.8232421875, 11.336669921875, 11.85009765625, 12.363525390625, 12.876953125, 13.390380859375, 13.90380859375, 14.417236328125, 14.9306640625, 15.444091796875, 15.95751953125, 16.470947265625, 16.984375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 6.0, 9.0, 14.0, 15.0, 19.0, 25.0, 42.0, 64.0, 110.0, 164.0, 146.0, 125.0, 88.0, 56.0, 29.0, 29.0, 18.0, 11.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009851455688476562, -0.0009617507457733154, -0.0009383559226989746, -0.0009149610996246338, -0.000891566276550293, -0.0008681714534759521, -0.0008447766304016113, -0.0008213818073272705, -0.0007979869842529297, -0.0007745921611785889, -0.000751197338104248, -0.0007278025150299072, -0.0007044076919555664, -0.0006810128688812256, -0.0006576180458068848, -0.0006342232227325439, -0.0006108283996582031, -0.0005874335765838623, -0.0005640387535095215, -0.0005406439304351807, -0.0005172491073608398, -0.000493854284286499, -0.0004704594612121582, -0.0004470646381378174, -0.00042366981506347656, -0.00040027499198913574, -0.0003768801689147949, -0.0003534853458404541, -0.0003300905227661133, -0.00030669569969177246, -0.00028330087661743164, -0.0002599060535430908, -0.00023651123046875, -0.00021311640739440918, -0.00018972158432006836, -0.00016632676124572754, -0.00014293193817138672, -0.0001195371150970459, -9.614229202270508e-05, -7.274746894836426e-05, -4.935264587402344e-05, -2.5957822799682617e-05, -2.562999725341797e-06, 2.0831823348999023e-05, 4.4226646423339844e-05, 6.762146949768066e-05, 9.101629257202148e-05, 0.0001144111156463623, 0.00013780593872070312, 0.00016120076179504395, 0.00018459558486938477, 0.00020799040794372559, 0.0002313852310180664, 0.0002547800540924072, 0.00027817487716674805, 0.00030156970024108887, 0.0003249645233154297, 0.0003483593463897705, 0.00037175416946411133, 0.00039514899253845215, 0.00041854381561279297, 0.0004419386386871338, 0.0004653334617614746, 0.0004887282848358154, 0.0005121231079101562]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 14.0, 22.0, 27.0, 29.0, 42.0, 67.0, 97.0, 123.0, 208.0, 281.0, 431.0, 673.0, 1047.0, 1745.0, 2975.0, 5470.0, 10687.0, 24638.0, 71593.0, 522950.0, 305914.0, 57497.0, 20710.0, 9386.0, 4831.0, 2703.0, 1575.0, 973.0, 632.0, 384.0, 259.0, 162.0, 112.0, 76.0, 61.0, 42.0, 36.0, 12.0, 17.0, 14.0, 10.0, 7.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.296875, -9.9141845703125, -9.531494140625, -9.1488037109375, -8.76611328125, -8.3834228515625, -8.000732421875, -7.6180419921875, -7.2353515625, -6.8526611328125, -6.469970703125, -6.0872802734375, -5.70458984375, -5.3218994140625, -4.939208984375, -4.5565185546875, -4.173828125, -3.7911376953125, -3.408447265625, -3.0257568359375, -2.64306640625, -2.2603759765625, -1.877685546875, -1.4949951171875, -1.1123046875, -0.7296142578125, -0.346923828125, 0.0357666015625, 0.41845703125, 0.8011474609375, 1.183837890625, 1.5665283203125, 1.94921875, 2.3319091796875, 2.714599609375, 3.0972900390625, 3.47998046875, 3.8626708984375, 4.245361328125, 4.6280517578125, 5.0107421875, 5.3934326171875, 5.776123046875, 6.1588134765625, 6.54150390625, 6.9241943359375, 7.306884765625, 7.6895751953125, 8.072265625, 8.4549560546875, 8.837646484375, 9.2203369140625, 9.60302734375, 9.9857177734375, 10.368408203125, 10.7510986328125, 11.1337890625, 11.5164794921875, 11.899169921875, 12.2818603515625, 12.66455078125, 13.0472412109375, 13.429931640625, 13.8126220703125, 14.1953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 5.0, 2.0, 10.0, 6.0, 7.0, 15.0, 22.0, 21.0, 22.0, 36.0, 70.0, 80.0, 90.0, 117.0, 128.0, 86.0, 50.0, 47.0, 38.0, 27.0, 14.0, 11.0, 12.0, 9.0, 9.0, 11.0, 10.0, 5.0, 5.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.19921875, -2.13592529296875, -2.0726318359375, -2.00933837890625, -1.946044921875, -1.88275146484375, -1.8194580078125, -1.75616455078125, -1.69287109375, -1.62957763671875, -1.5662841796875, -1.50299072265625, -1.439697265625, -1.37640380859375, -1.3131103515625, -1.24981689453125, -1.1865234375, -1.12322998046875, -1.0599365234375, -0.99664306640625, -0.933349609375, -0.87005615234375, -0.8067626953125, -0.74346923828125, -0.68017578125, -0.61688232421875, -0.5535888671875, -0.49029541015625, -0.427001953125, -0.36370849609375, -0.3004150390625, -0.23712158203125, -0.173828125, -0.11053466796875, -0.0472412109375, 0.01605224609375, 0.079345703125, 0.14263916015625, 0.2059326171875, 0.26922607421875, 0.33251953125, 0.39581298828125, 0.4591064453125, 0.52239990234375, 0.585693359375, 0.64898681640625, 0.7122802734375, 0.77557373046875, 0.8388671875, 0.90216064453125, 0.9654541015625, 1.02874755859375, 1.092041015625, 1.15533447265625, 1.2186279296875, 1.28192138671875, 1.34521484375, 1.40850830078125, 1.4718017578125, 1.53509521484375, 1.598388671875, 1.66168212890625, 1.7249755859375, 1.78826904296875, 1.8515625]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 21.0, 32.0, 42.0, 65.0, 84.0, 164.0, 195.0, 130.0, 78.0, 49.0, 39.0, 18.0, 13.0, 13.0, 11.0, 6.0, 3.0, 7.0, 8.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.304847717285156, -29.42697525024414, -28.549100875854492, -27.671228408813477, -26.793354034423828, -25.915481567382812, -25.037609100341797, -24.15973663330078, -23.281862258911133, -22.403989791870117, -21.52611541748047, -20.648242950439453, -19.770370483398438, -18.89249610900879, -18.014623641967773, -17.136749267578125, -16.25887680053711, -15.381003379821777, -14.503129959106445, -13.62525749206543, -12.747384071350098, -11.869510650634766, -10.99163818359375, -10.113764762878418, -9.235891342163086, -8.358017921447754, -7.48014497756958, -6.602272033691406, -5.724398612976074, -4.846525192260742, -3.9686522483825684, -3.0907793045043945, -2.2129058837890625, -1.3350327014923096, -0.45715951919555664, 0.4207136631011963, 1.2985868453979492, 2.1764602661132812, 3.054333209991455, 3.932206153869629, 4.810079574584961, 5.687952995300293, 6.565825939178467, 7.443698883056641, 8.321572303771973, 9.199445724487305, 10.07731819152832, 10.955191612243652, 11.833065032958984, 12.710938453674316, 13.588811874389648, 14.466684341430664, 15.344557762145996, 16.222431182861328, 17.100303649902344, 17.97817611694336, 18.856050491333008, 19.733922958374023, 20.611797332763672, 21.489669799804688, 22.367542266845703, 23.24541664123535, 24.123289108276367, 25.001163482666016, 25.87903594970703]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 6.0, 9.0, 16.0, 2.0, 20.0, 12.0, 15.0, 18.0, 20.0, 23.0, 26.0, 29.0, 28.0, 26.0, 30.0, 25.0, 41.0, 40.0, 38.0, 28.0, 39.0, 45.0, 35.0, 26.0, 43.0, 43.0, 32.0, 23.0, 33.0, 20.0, 31.0, 24.0, 16.0, 28.0, 9.0, 15.0, 9.0, 8.0, 7.0, 10.0, 7.0, 6.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.379477500915527, -9.082643508911133, -8.785808563232422, -8.488974571228027, -8.192140579223633, -7.895305633544922, -7.598471641540527, -7.301637172698975, -7.004802703857422, -6.707968235015869, -6.411133766174316, -6.114299774169922, -5.817465305328369, -5.520630836486816, -5.223796844482422, -4.926962375640869, -4.630127906799316, -4.333293437957764, -4.036458969116211, -3.7396249771118164, -3.4427905082702637, -3.145956039428711, -2.8491218090057373, -2.5522875785827637, -2.255453109741211, -1.9586187601089478, -1.6617844104766846, -1.3649500608444214, -1.0681157112121582, -0.771281361579895, -0.47444701194763184, -0.1776127815246582, 0.11922264099121094, 0.4160569906234741, 0.7128913402557373, 1.0097256898880005, 1.3065600395202637, 1.6033943891525269, 1.90022873878479, 2.1970629692077637, 2.4938974380493164, 2.790731906890869, 3.0875661373138428, 3.3844003677368164, 3.681234836578369, 3.978069305419922, 4.274903297424316, 4.571737766265869, 4.868572235107422, 5.165406703948975, 5.462241172790527, 5.759075164794922, 6.055909633636475, 6.352744102478027, 6.649578094482422, 6.946412563323975, 7.243247032165527, 7.54008150100708, 7.836915969848633, 8.133749961853027, 8.430583953857422, 8.727418899536133, 9.024252891540527, 9.321086883544922, 9.617921829223633]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 11.0, 5.0, 19.0, 22.0, 33.0, 75.0, 99.0, 182.0, 279.0, 419.0, 634.0, 1049.0, 1658.0, 2949.0, 4881.0, 8537.0, 14727.0, 25828.0, 47280.0, 87402.0, 163468.0, 261290.0, 194359.0, 104631.0, 56407.0, 30639.0, 17293.0, 9960.0, 5601.0, 3429.0, 2095.0, 1279.0, 749.0, 479.0, 307.0, 193.0, 101.0, 70.0, 46.0, 24.0, 24.0, 10.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.49169921875, -16.9208984375, -16.35009765625, -15.779296875, -15.20849609375, -14.6376953125, -14.06689453125, -13.49609375, -12.92529296875, -12.3544921875, -11.78369140625, -11.212890625, -10.64208984375, -10.0712890625, -9.50048828125, -8.9296875, -8.35888671875, -7.7880859375, -7.21728515625, -6.646484375, -6.07568359375, -5.5048828125, -4.93408203125, -4.36328125, -3.79248046875, -3.2216796875, -2.65087890625, -2.080078125, -1.50927734375, -0.9384765625, -0.36767578125, 0.203125, 0.77392578125, 1.3447265625, 1.91552734375, 2.486328125, 3.05712890625, 3.6279296875, 4.19873046875, 4.76953125, 5.34033203125, 5.9111328125, 6.48193359375, 7.052734375, 7.62353515625, 8.1943359375, 8.76513671875, 9.3359375, 9.90673828125, 10.4775390625, 11.04833984375, 11.619140625, 12.18994140625, 12.7607421875, 13.33154296875, 13.90234375, 14.47314453125, 15.0439453125, 15.61474609375, 16.185546875, 16.75634765625, 17.3271484375, 17.89794921875, 18.46875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 11.0, 12.0, 9.0, 10.0, 16.0, 24.0, 22.0, 27.0, 35.0, 35.0, 15.0, 36.0, 46.0, 46.0, 40.0, 44.0, 39.0, 48.0, 45.0, 39.0, 40.0, 49.0, 35.0, 45.0, 34.0, 27.0, 24.0, 25.0, 21.0, 12.0, 18.0, 11.0, 12.0, 4.0, 9.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3984375, -10.065673828125, -9.73291015625, -9.400146484375, -9.0673828125, -8.734619140625, -8.40185546875, -8.069091796875, -7.736328125, -7.403564453125, -7.07080078125, -6.738037109375, -6.4052734375, -6.072509765625, -5.73974609375, -5.406982421875, -5.07421875, -4.741455078125, -4.40869140625, -4.075927734375, -3.7431640625, -3.410400390625, -3.07763671875, -2.744873046875, -2.412109375, -2.079345703125, -1.74658203125, -1.413818359375, -1.0810546875, -0.748291015625, -0.41552734375, -0.082763671875, 0.25, 0.582763671875, 0.91552734375, 1.248291015625, 1.5810546875, 1.913818359375, 2.24658203125, 2.579345703125, 2.912109375, 3.244873046875, 3.57763671875, 3.910400390625, 4.2431640625, 4.575927734375, 4.90869140625, 5.241455078125, 5.57421875, 5.906982421875, 6.23974609375, 6.572509765625, 6.9052734375, 7.238037109375, 7.57080078125, 7.903564453125, 8.236328125, 8.569091796875, 8.90185546875, 9.234619140625, 9.5673828125, 9.900146484375, 10.23291015625, 10.565673828125, 10.8984375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 6.0, 6.0, 7.0, 8.0, 6.0, 14.0, 22.0, 38.0, 50.0, 81.0, 122.0, 175.0, 278.0, 402.0, 639.0, 1018.0, 1637.0, 2646.0, 4541.0, 7525.0, 13721.0, 25395.0, 49484.0, 100307.0, 212716.0, 305634.0, 160262.0, 76556.0, 37930.0, 20392.0, 11075.0, 6220.0, 3673.0, 2208.0, 1381.0, 845.0, 537.0, 340.0, 216.0, 160.0, 93.0, 50.0, 47.0, 34.0, 22.0, 19.0, 7.0, 10.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-20.140625, -19.517333984375, -18.89404296875, -18.270751953125, -17.6474609375, -17.024169921875, -16.40087890625, -15.777587890625, -15.154296875, -14.531005859375, -13.90771484375, -13.284423828125, -12.6611328125, -12.037841796875, -11.41455078125, -10.791259765625, -10.16796875, -9.544677734375, -8.92138671875, -8.298095703125, -7.6748046875, -7.051513671875, -6.42822265625, -5.804931640625, -5.181640625, -4.558349609375, -3.93505859375, -3.311767578125, -2.6884765625, -2.065185546875, -1.44189453125, -0.818603515625, -0.1953125, 0.427978515625, 1.05126953125, 1.674560546875, 2.2978515625, 2.921142578125, 3.54443359375, 4.167724609375, 4.791015625, 5.414306640625, 6.03759765625, 6.660888671875, 7.2841796875, 7.907470703125, 8.53076171875, 9.154052734375, 9.77734375, 10.400634765625, 11.02392578125, 11.647216796875, 12.2705078125, 12.893798828125, 13.51708984375, 14.140380859375, 14.763671875, 15.386962890625, 16.01025390625, 16.633544921875, 17.2568359375, 17.880126953125, 18.50341796875, 19.126708984375, 19.75]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 16.0, 11.0, 20.0, 17.0, 28.0, 24.0, 17.0, 24.0, 26.0, 35.0, 29.0, 34.0, 26.0, 44.0, 44.0, 44.0, 41.0, 46.0, 30.0, 45.0, 43.0, 39.0, 29.0, 35.0, 30.0, 28.0, 31.0, 15.0, 20.0, 26.0, 16.0, 18.0, 5.0, 9.0, 9.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.53228759765625, -6.3067626953125, -6.08123779296875, -5.855712890625, -5.63018798828125, -5.4046630859375, -5.17913818359375, -4.95361328125, -4.72808837890625, -4.5025634765625, -4.27703857421875, -4.051513671875, -3.82598876953125, -3.6004638671875, -3.37493896484375, -3.1494140625, -2.92388916015625, -2.6983642578125, -2.47283935546875, -2.247314453125, -2.02178955078125, -1.7962646484375, -1.57073974609375, -1.34521484375, -1.11968994140625, -0.8941650390625, -0.66864013671875, -0.443115234375, -0.21759033203125, 0.0079345703125, 0.23345947265625, 0.458984375, 0.68450927734375, 0.9100341796875, 1.13555908203125, 1.361083984375, 1.58660888671875, 1.8121337890625, 2.03765869140625, 2.26318359375, 2.48870849609375, 2.7142333984375, 2.93975830078125, 3.165283203125, 3.39080810546875, 3.6163330078125, 3.84185791015625, 4.0673828125, 4.29290771484375, 4.5184326171875, 4.74395751953125, 4.969482421875, 5.19500732421875, 5.4205322265625, 5.64605712890625, 5.87158203125, 6.09710693359375, 6.3226318359375, 6.54815673828125, 6.773681640625, 6.99920654296875, 7.2247314453125, 7.45025634765625, 7.67578125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 7.0, 6.0, 12.0, 21.0, 25.0, 37.0, 38.0, 59.0, 97.0, 149.0, 200.0, 347.0, 593.0, 1133.0, 2039.0, 4007.0, 8862.0, 22683.0, 77740.0, 634395.0, 224232.0, 43794.0, 15091.0, 6335.0, 2898.0, 1570.0, 873.0, 509.0, 280.0, 179.0, 98.0, 70.0, 51.0, 35.0, 19.0, 19.0, 10.0, 11.0, 12.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.875, -41.3857421875, -39.896484375, -38.4072265625, -36.91796875, -35.4287109375, -33.939453125, -32.4501953125, -30.9609375, -29.4716796875, -27.982421875, -26.4931640625, -25.00390625, -23.5146484375, -22.025390625, -20.5361328125, -19.046875, -17.5576171875, -16.068359375, -14.5791015625, -13.08984375, -11.6005859375, -10.111328125, -8.6220703125, -7.1328125, -5.6435546875, -4.154296875, -2.6650390625, -1.17578125, 0.3134765625, 1.802734375, 3.2919921875, 4.78125, 6.2705078125, 7.759765625, 9.2490234375, 10.73828125, 12.2275390625, 13.716796875, 15.2060546875, 16.6953125, 18.1845703125, 19.673828125, 21.1630859375, 22.65234375, 24.1416015625, 25.630859375, 27.1201171875, 28.609375, 30.0986328125, 31.587890625, 33.0771484375, 34.56640625, 36.0556640625, 37.544921875, 39.0341796875, 40.5234375, 42.0126953125, 43.501953125, 44.9912109375, 46.48046875, 47.9697265625, 49.458984375, 50.9482421875, 52.4375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 11.0, 8.0, 5.0, 15.0, 17.0, 30.0, 31.0, 45.0, 64.0, 72.0, 113.0, 150.0, 121.0, 80.0, 66.0, 44.0, 39.0, 20.0, 16.0, 16.0, 13.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001186370849609375, -0.0011431872844696045, -0.001100003719329834, -0.0010568201541900635, -0.001013636589050293, -0.0009704530239105225, -0.000927269458770752, -0.0008840858936309814, -0.0008409023284912109, -0.0007977187633514404, -0.0007545351982116699, -0.0007113516330718994, -0.0006681680679321289, -0.0006249845027923584, -0.0005818009376525879, -0.0005386173725128174, -0.0004954338073730469, -0.00045225024223327637, -0.00040906667709350586, -0.00036588311195373535, -0.00032269954681396484, -0.00027951598167419434, -0.00023633241653442383, -0.00019314885139465332, -0.0001499652862548828, -0.0001067817211151123, -6.35981559753418e-05, -2.041459083557129e-05, 2.276897430419922e-05, 6.595253944396973e-05, 0.00010913610458374023, 0.00015231966972351074, 0.00019550323486328125, 0.00023868680000305176, 0.00028187036514282227, 0.0003250539302825928, 0.0003682374954223633, 0.0004114210605621338, 0.0004546046257019043, 0.0004977881908416748, 0.0005409717559814453, 0.0005841553211212158, 0.0006273388862609863, 0.0006705224514007568, 0.0007137060165405273, 0.0007568895816802979, 0.0008000731468200684, 0.0008432567119598389, 0.0008864402770996094, 0.0009296238422393799, 0.0009728074073791504, 0.001015990972518921, 0.0010591745376586914, 0.001102358102798462, 0.0011455416679382324, 0.001188725233078003, 0.0012319087982177734, 0.001275092363357544, 0.0013182759284973145, 0.001361459493637085, 0.0014046430587768555, 0.001447826623916626, 0.0014910101890563965, 0.001534193754196167, 0.0015773773193359375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 10.0, 15.0, 15.0, 17.0, 27.0, 34.0, 50.0, 68.0, 88.0, 110.0, 163.0, 247.0, 394.0, 569.0, 932.0, 1527.0, 2720.0, 5403.0, 12294.0, 37752.0, 223061.0, 658021.0, 69424.0, 19214.0, 7604.0, 3613.0, 1942.0, 1089.0, 658.0, 424.0, 312.0, 199.0, 143.0, 110.0, 70.0, 57.0, 38.0, 24.0, 23.0, 16.0, 11.0, 20.0, 9.0, 5.0, 5.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-42.6875, -41.3623046875, -40.037109375, -38.7119140625, -37.38671875, -36.0615234375, -34.736328125, -33.4111328125, -32.0859375, -30.7607421875, -29.435546875, -28.1103515625, -26.78515625, -25.4599609375, -24.134765625, -22.8095703125, -21.484375, -20.1591796875, -18.833984375, -17.5087890625, -16.18359375, -14.8583984375, -13.533203125, -12.2080078125, -10.8828125, -9.5576171875, -8.232421875, -6.9072265625, -5.58203125, -4.2568359375, -2.931640625, -1.6064453125, -0.28125, 1.0439453125, 2.369140625, 3.6943359375, 5.01953125, 6.3447265625, 7.669921875, 8.9951171875, 10.3203125, 11.6455078125, 12.970703125, 14.2958984375, 15.62109375, 16.9462890625, 18.271484375, 19.5966796875, 20.921875, 22.2470703125, 23.572265625, 24.8974609375, 26.22265625, 27.5478515625, 28.873046875, 30.1982421875, 31.5234375, 32.8486328125, 34.173828125, 35.4990234375, 36.82421875, 38.1494140625, 39.474609375, 40.7998046875, 42.125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 17.0, 26.0, 45.0, 74.0, 103.0, 126.0, 146.0, 108.0, 102.0, 72.0, 36.0, 31.0, 23.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8046875, -8.4927978515625, -8.180908203125, -7.8690185546875, -7.55712890625, -7.2452392578125, -6.933349609375, -6.6214599609375, -6.3095703125, -5.9976806640625, -5.685791015625, -5.3739013671875, -5.06201171875, -4.7501220703125, -4.438232421875, -4.1263427734375, -3.814453125, -3.5025634765625, -3.190673828125, -2.8787841796875, -2.56689453125, -2.2550048828125, -1.943115234375, -1.6312255859375, -1.3193359375, -1.0074462890625, -0.695556640625, -0.3836669921875, -0.07177734375, 0.2401123046875, 0.552001953125, 0.8638916015625, 1.17578125, 1.4876708984375, 1.799560546875, 2.1114501953125, 2.42333984375, 2.7352294921875, 3.047119140625, 3.3590087890625, 3.6708984375, 3.9827880859375, 4.294677734375, 4.6065673828125, 4.91845703125, 5.2303466796875, 5.542236328125, 5.8541259765625, 6.166015625, 6.4779052734375, 6.789794921875, 7.1016845703125, 7.41357421875, 7.7254638671875, 8.037353515625, 8.3492431640625, 8.6611328125, 8.9730224609375, 9.284912109375, 9.5968017578125, 9.90869140625, 10.2205810546875, 10.532470703125, 10.8443603515625, 11.15625]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 7.0, 6.0, 10.0, 30.0, 51.0, 95.0, 151.0, 252.0, 146.0, 79.0, 53.0, 28.0, 20.0, 17.0, 11.0, 12.0, 7.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.832868576049805, -18.856258392333984, -17.879648208618164, -16.903038024902344, -15.926427841186523, -14.949817657470703, -13.9732084274292, -12.996598243713379, -12.019988059997559, -11.043377876281738, -10.066767692565918, -9.090158462524414, -8.113548278808594, -7.136937618255615, -6.160327911376953, -5.183717727661133, -4.2071075439453125, -3.230497360229492, -2.253887414932251, -1.2772774696350098, -0.30066728591918945, 0.6759428977966309, 1.652552604675293, 2.6291627883911133, 3.6057729721069336, 4.582383155822754, 5.558993339538574, 6.535603046417236, 7.512213230133057, 8.488822937011719, 9.465433120727539, 10.44204330444336, 11.418651580810547, 12.395261764526367, 13.371871948242188, 14.348482131958008, 15.325092315673828, 16.30170249938965, 17.27831268310547, 18.254920959472656, 19.23153305053711, 20.20814323425293, 21.18475341796875, 22.16136360168457, 23.13797378540039, 24.11458396911621, 25.09119415283203, 26.06780242919922, 27.04441261291504, 28.02102279663086, 28.99763298034668, 29.9742431640625, 30.95085334777832, 31.92746353149414, 32.90407180786133, 33.88068389892578, 34.85729217529297, 35.833900451660156, 36.81051254272461, 37.7871208190918, 38.76373291015625, 39.74034118652344, 40.71695327758789, 41.69356155395508, 42.67017364501953]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 2.0, 4.0, 4.0, 11.0, 9.0, 22.0, 13.0, 21.0, 24.0, 21.0, 16.0, 27.0, 20.0, 32.0, 37.0, 31.0, 32.0, 45.0, 37.0, 37.0, 46.0, 41.0, 39.0, 48.0, 33.0, 34.0, 40.0, 33.0, 28.0, 29.0, 17.0, 28.0, 18.0, 20.0, 18.0, 10.0, 17.0, 7.0, 16.0, 8.0, 4.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.943132400512695, -9.624908447265625, -9.306684494018555, -8.988460540771484, -8.670236587524414, -8.352012634277344, -8.033788681030273, -7.715564250946045, -7.397340297698975, -7.079116344451904, -6.760892391204834, -6.442668437957764, -6.124444007873535, -5.806220054626465, -5.4879961013793945, -5.169772148132324, -4.851548194885254, -4.533324241638184, -4.215100288391113, -3.896876096725464, -3.5786521434783936, -3.2604281902313232, -2.942203998565674, -2.6239800453186035, -2.305756092071533, -1.987532138824463, -1.669308066368103, -1.3510839939117432, -1.0328600406646729, -0.7146360874176025, -0.3964120149612427, -0.07818794250488281, 0.2400369644165039, 0.558260977268219, 0.8764849901199341, 1.194709062576294, 1.5129330158233643, 1.8311569690704346, 2.149381160736084, 2.4676051139831543, 2.7858290672302246, 3.104053020477295, 3.4222769737243652, 3.7405011653900146, 4.058725357055664, 4.376949310302734, 4.695173263549805, 5.013397216796875, 5.331621170043945, 5.649845123291016, 5.968069076538086, 6.286293029785156, 6.604516983032227, 6.922740936279297, 7.240965366363525, 7.559189319610596, 7.877413272857666, 8.195637702941895, 8.513861656188965, 8.832085609436035, 9.150309562683105, 9.468533515930176, 9.786757469177246, 10.104981422424316, 10.423205375671387]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 25.0, 25.0, 40.0, 66.0, 84.0, 145.0, 252.0, 361.0, 521.0, 821.0, 1260.0, 2031.0, 2996.0, 4596.0, 7522.0, 12416.0, 21371.0, 39895.0, 79237.0, 179758.0, 609342.0, 2079330.0, 755067.0, 205157.0, 87872.0, 43628.0, 23415.0, 13371.0, 8288.0, 5105.0, 3459.0, 2131.0, 1504.0, 1032.0, 658.0, 443.0, 325.0, 206.0, 145.0, 107.0, 92.0, 52.0, 45.0, 18.0, 13.0, 13.0, 6.0, 11.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.390625, -13.86865234375, -13.3466796875, -12.82470703125, -12.302734375, -11.78076171875, -11.2587890625, -10.73681640625, -10.21484375, -9.69287109375, -9.1708984375, -8.64892578125, -8.126953125, -7.60498046875, -7.0830078125, -6.56103515625, -6.0390625, -5.51708984375, -4.9951171875, -4.47314453125, -3.951171875, -3.42919921875, -2.9072265625, -2.38525390625, -1.86328125, -1.34130859375, -0.8193359375, -0.29736328125, 0.224609375, 0.74658203125, 1.2685546875, 1.79052734375, 2.3125, 2.83447265625, 3.3564453125, 3.87841796875, 4.400390625, 4.92236328125, 5.4443359375, 5.96630859375, 6.48828125, 7.01025390625, 7.5322265625, 8.05419921875, 8.576171875, 9.09814453125, 9.6201171875, 10.14208984375, 10.6640625, 11.18603515625, 11.7080078125, 12.22998046875, 12.751953125, 13.27392578125, 13.7958984375, 14.31787109375, 14.83984375, 15.36181640625, 15.8837890625, 16.40576171875, 16.927734375, 17.44970703125, 17.9716796875, 18.49365234375, 19.015625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 10.0, 5.0, 8.0, 15.0, 12.0, 19.0, 12.0, 27.0, 36.0, 23.0, 17.0, 30.0, 26.0, 41.0, 33.0, 54.0, 44.0, 46.0, 65.0, 51.0, 36.0, 36.0, 35.0, 42.0, 36.0, 37.0, 31.0, 27.0, 23.0, 20.0, 13.0, 12.0, 19.0, 10.0, 8.0, 11.0, 11.0, 5.0, 3.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.58203125, -5.38720703125, -5.1923828125, -4.99755859375, -4.802734375, -4.60791015625, -4.4130859375, -4.21826171875, -4.0234375, -3.82861328125, -3.6337890625, -3.43896484375, -3.244140625, -3.04931640625, -2.8544921875, -2.65966796875, -2.46484375, -2.27001953125, -2.0751953125, -1.88037109375, -1.685546875, -1.49072265625, -1.2958984375, -1.10107421875, -0.90625, -0.71142578125, -0.5166015625, -0.32177734375, -0.126953125, 0.06787109375, 0.2626953125, 0.45751953125, 0.65234375, 0.84716796875, 1.0419921875, 1.23681640625, 1.431640625, 1.62646484375, 1.8212890625, 2.01611328125, 2.2109375, 2.40576171875, 2.6005859375, 2.79541015625, 2.990234375, 3.18505859375, 3.3798828125, 3.57470703125, 3.76953125, 3.96435546875, 4.1591796875, 4.35400390625, 4.548828125, 4.74365234375, 4.9384765625, 5.13330078125, 5.328125, 5.52294921875, 5.7177734375, 5.91259765625, 6.107421875, 6.30224609375, 6.4970703125, 6.69189453125, 6.88671875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 11.0, 11.0, 10.0, 9.0, 23.0, 21.0, 44.0, 48.0, 82.0, 107.0, 179.0, 238.0, 399.0, 493.0, 786.0, 1263.0, 1722.0, 3006.0, 4725.0, 7690.0, 13209.0, 23375.0, 43683.0, 90008.0, 213553.0, 634261.0, 1931264.0, 765849.0, 246246.0, 101044.0, 48710.0, 25515.0, 14184.0, 8490.0, 5105.0, 3036.0, 2033.0, 1230.0, 858.0, 598.0, 350.0, 291.0, 166.0, 115.0, 76.0, 42.0, 45.0, 26.0, 14.0, 17.0, 11.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0546875, -12.627685546875, -12.20068359375, -11.773681640625, -11.3466796875, -10.919677734375, -10.49267578125, -10.065673828125, -9.638671875, -9.211669921875, -8.78466796875, -8.357666015625, -7.9306640625, -7.503662109375, -7.07666015625, -6.649658203125, -6.22265625, -5.795654296875, -5.36865234375, -4.941650390625, -4.5146484375, -4.087646484375, -3.66064453125, -3.233642578125, -2.806640625, -2.379638671875, -1.95263671875, -1.525634765625, -1.0986328125, -0.671630859375, -0.24462890625, 0.182373046875, 0.609375, 1.036376953125, 1.46337890625, 1.890380859375, 2.3173828125, 2.744384765625, 3.17138671875, 3.598388671875, 4.025390625, 4.452392578125, 4.87939453125, 5.306396484375, 5.7333984375, 6.160400390625, 6.58740234375, 7.014404296875, 7.44140625, 7.868408203125, 8.29541015625, 8.722412109375, 9.1494140625, 9.576416015625, 10.00341796875, 10.430419921875, 10.857421875, 11.284423828125, 11.71142578125, 12.138427734375, 12.5654296875, 12.992431640625, 13.41943359375, 13.846435546875, 14.2734375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 17.0, 13.0, 20.0, 39.0, 32.0, 45.0, 45.0, 69.0, 98.0, 106.0, 126.0, 163.0, 201.0, 229.0, 280.0, 319.0, 385.0, 314.0, 299.0, 229.0, 200.0, 139.0, 109.0, 110.0, 78.0, 83.0, 56.0, 53.0, 36.0, 39.0, 18.0, 24.0, 16.0, 14.0, 10.0, 4.0, 5.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.48046875, -3.373748779296875, -3.26702880859375, -3.160308837890625, -3.0535888671875, -2.946868896484375, -2.84014892578125, -2.733428955078125, -2.626708984375, -2.519989013671875, -2.41326904296875, -2.306549072265625, -2.1998291015625, -2.093109130859375, -1.98638916015625, -1.879669189453125, -1.77294921875, -1.666229248046875, -1.55950927734375, -1.452789306640625, -1.3460693359375, -1.239349365234375, -1.13262939453125, -1.025909423828125, -0.919189453125, -0.812469482421875, -0.70574951171875, -0.599029541015625, -0.4923095703125, -0.385589599609375, -0.27886962890625, -0.172149658203125, -0.0654296875, 0.041290283203125, 0.14801025390625, 0.254730224609375, 0.3614501953125, 0.468170166015625, 0.57489013671875, 0.681610107421875, 0.788330078125, 0.895050048828125, 1.00177001953125, 1.108489990234375, 1.2152099609375, 1.321929931640625, 1.42864990234375, 1.535369873046875, 1.64208984375, 1.748809814453125, 1.85552978515625, 1.962249755859375, 2.0689697265625, 2.175689697265625, 2.28240966796875, 2.389129638671875, 2.495849609375, 2.602569580078125, 2.70928955078125, 2.816009521484375, 2.9227294921875, 3.029449462890625, 3.13616943359375, 3.242889404296875, 3.349609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 11.0, 11.0, 13.0, 14.0, 16.0, 32.0, 31.0, 41.0, 71.0, 91.0, 151.0, 143.0, 105.0, 72.0, 42.0, 47.0, 31.0, 16.0, 12.0, 7.0, 5.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.33967399597168, -9.929840087890625, -9.52000617980957, -9.110173225402832, -8.700339317321777, -8.290505409240723, -7.880671501159668, -7.4708380699157715, -7.061004638671875, -6.65117073059082, -6.241337299346924, -5.831503391265869, -5.421669960021973, -5.011836051940918, -4.602002143859863, -4.192168712615967, -3.782334804534912, -3.3725011348724365, -2.962667465209961, -2.5528335571289062, -2.1430001258850098, -1.733166217803955, -1.3233325481414795, -0.9134988784790039, -0.5036652088165283, -0.09383150935173035, 0.3160021901130676, 0.725835919380188, 1.1356695890426636, 1.5455033779144287, 1.9553370475769043, 2.36517071723938, 2.7750043869018555, 3.184838056564331, 3.5946717262268066, 4.004505634307861, 4.414339065551758, 4.8241729736328125, 5.234006881713867, 5.643840312957764, 6.05367374420166, 6.463507652282715, 6.873341083526611, 7.283174991607666, 7.6930084228515625, 8.102842330932617, 8.512676239013672, 8.922510147094727, 9.332344055175781, 9.742177963256836, 10.15201187133789, 10.561844825744629, 10.971678733825684, 11.381512641906738, 11.791346549987793, 12.201179504394531, 12.611013412475586, 13.02084732055664, 13.430681228637695, 13.840514183044434, 14.250348091125488, 14.660181999206543, 15.070015907287598, 15.479848861694336, 15.88968276977539]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 5.0, 13.0, 13.0, 14.0, 19.0, 26.0, 30.0, 26.0, 35.0, 25.0, 48.0, 47.0, 36.0, 36.0, 45.0, 51.0, 39.0, 43.0, 42.0, 51.0, 51.0, 32.0, 39.0, 37.0, 22.0, 32.0, 20.0, 21.0, 19.0, 17.0, 13.0, 8.0, 13.0, 8.0, 2.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.224446773529053, -6.994480133056641, -6.7645134925842285, -6.534546852111816, -6.304580211639404, -6.074613571166992, -5.84464693069458, -5.614680290222168, -5.384713649749756, -5.154747009277344, -4.924780368804932, -4.6948137283325195, -4.464847087860107, -4.234880447387695, -4.004913806915283, -3.774947166442871, -3.544980525970459, -3.315013885498047, -3.0850472450256348, -2.8550806045532227, -2.6251139640808105, -2.3951473236083984, -2.1651806831359863, -1.9352140426635742, -1.705247402191162, -1.47528076171875, -1.245314121246338, -1.0153474807739258, -0.7853808403015137, -0.5554141998291016, -0.32544755935668945, -0.09548091888427734, 0.13448524475097656, 0.36445188522338867, 0.5944185256958008, 0.8243851661682129, 1.054351806640625, 1.284318447113037, 1.5142850875854492, 1.7442517280578613, 1.9742183685302734, 2.2041850090026855, 2.4341516494750977, 2.6641182899475098, 2.894084930419922, 3.124051570892334, 3.354018211364746, 3.583984851837158, 3.8139514923095703, 4.043918132781982, 4.2738847732543945, 4.503851413726807, 4.733818054199219, 4.963784694671631, 5.193751335144043, 5.423717975616455, 5.653684616088867, 5.883651256561279, 6.113617897033691, 6.3435845375061035, 6.573551177978516, 6.803517818450928, 7.03348445892334, 7.263451099395752, 7.493417739868164]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 8.0, 8.0, 15.0, 22.0, 31.0, 42.0, 54.0, 75.0, 118.0, 160.0, 197.0, 295.0, 484.0, 649.0, 990.0, 1435.0, 2305.0, 3680.0, 5982.0, 10098.0, 18823.0, 37817.0, 87605.0, 293486.0, 386140.0, 104457.0, 43158.0, 21200.0, 11294.0, 6487.0, 3961.0, 2484.0, 1661.0, 1010.0, 699.0, 468.0, 332.0, 236.0, 161.0, 121.0, 92.0, 58.0, 38.0, 34.0, 18.0, 14.0, 9.0, 9.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-11.2890625, -10.937255859375, -10.58544921875, -10.233642578125, -9.8818359375, -9.530029296875, -9.17822265625, -8.826416015625, -8.474609375, -8.122802734375, -7.77099609375, -7.419189453125, -7.0673828125, -6.715576171875, -6.36376953125, -6.011962890625, -5.66015625, -5.308349609375, -4.95654296875, -4.604736328125, -4.2529296875, -3.901123046875, -3.54931640625, -3.197509765625, -2.845703125, -2.493896484375, -2.14208984375, -1.790283203125, -1.4384765625, -1.086669921875, -0.73486328125, -0.383056640625, -0.03125, 0.320556640625, 0.67236328125, 1.024169921875, 1.3759765625, 1.727783203125, 2.07958984375, 2.431396484375, 2.783203125, 3.135009765625, 3.48681640625, 3.838623046875, 4.1904296875, 4.542236328125, 4.89404296875, 5.245849609375, 5.59765625, 5.949462890625, 6.30126953125, 6.653076171875, 7.0048828125, 7.356689453125, 7.70849609375, 8.060302734375, 8.412109375, 8.763916015625, 9.11572265625, 9.467529296875, 9.8193359375, 10.171142578125, 10.52294921875, 10.874755859375, 11.2265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 4.0, 10.0, 6.0, 7.0, 15.0, 21.0, 18.0, 19.0, 27.0, 28.0, 24.0, 37.0, 40.0, 40.0, 41.0, 35.0, 46.0, 39.0, 39.0, 41.0, 44.0, 45.0, 48.0, 44.0, 34.0, 34.0, 30.0, 22.0, 24.0, 13.0, 26.0, 18.0, 14.0, 14.0, 10.0, 13.0, 10.0, 8.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-7.62890625, -7.41058349609375, -7.1922607421875, -6.97393798828125, -6.755615234375, -6.53729248046875, -6.3189697265625, -6.10064697265625, -5.88232421875, -5.66400146484375, -5.4456787109375, -5.22735595703125, -5.009033203125, -4.79071044921875, -4.5723876953125, -4.35406494140625, -4.1357421875, -3.91741943359375, -3.6990966796875, -3.48077392578125, -3.262451171875, -3.04412841796875, -2.8258056640625, -2.60748291015625, -2.38916015625, -2.17083740234375, -1.9525146484375, -1.73419189453125, -1.515869140625, -1.29754638671875, -1.0792236328125, -0.86090087890625, -0.642578125, -0.42425537109375, -0.2059326171875, 0.01239013671875, 0.230712890625, 0.44903564453125, 0.6673583984375, 0.88568115234375, 1.10400390625, 1.32232666015625, 1.5406494140625, 1.75897216796875, 1.977294921875, 2.19561767578125, 2.4139404296875, 2.63226318359375, 2.8505859375, 3.06890869140625, 3.2872314453125, 3.50555419921875, 3.723876953125, 3.94219970703125, 4.1605224609375, 4.37884521484375, 4.59716796875, 4.81549072265625, 5.0338134765625, 5.25213623046875, 5.470458984375, 5.68878173828125, 5.9071044921875, 6.12542724609375, 6.34375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 17.0, 15.0, 11.0, 21.0, 27.0, 42.0, 51.0, 76.0, 119.0, 151.0, 214.0, 317.0, 418.0, 723.0, 1034.0, 1720.0, 2860.0, 5598.0, 11496.0, 31428.0, 279446.0, 645453.0, 39282.0, 13173.0, 6137.0, 3307.0, 1830.0, 1206.0, 709.0, 490.0, 342.0, 236.0, 160.0, 134.0, 99.0, 40.0, 41.0, 43.0, 25.0, 15.0, 16.0, 11.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.296875, -23.5625, -22.828125, -22.09375, -21.359375, -20.625, -19.890625, -19.15625, -18.421875, -17.6875, -16.953125, -16.21875, -15.484375, -14.75, -14.015625, -13.28125, -12.546875, -11.8125, -11.078125, -10.34375, -9.609375, -8.875, -8.140625, -7.40625, -6.671875, -5.9375, -5.203125, -4.46875, -3.734375, -3.0, -2.265625, -1.53125, -0.796875, -0.0625, 0.671875, 1.40625, 2.140625, 2.875, 3.609375, 4.34375, 5.078125, 5.8125, 6.546875, 7.28125, 8.015625, 8.75, 9.484375, 10.21875, 10.953125, 11.6875, 12.421875, 13.15625, 13.890625, 14.625, 15.359375, 16.09375, 16.828125, 17.5625, 18.296875, 19.03125, 19.765625, 20.5, 21.234375, 21.96875, 22.703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 5.0, 2.0, 16.0, 17.0, 8.0, 20.0, 20.0, 30.0, 32.0, 36.0, 42.0, 51.0, 63.0, 48.0, 50.0, 54.0, 61.0, 54.0, 74.0, 44.0, 41.0, 45.0, 35.0, 20.0, 26.0, 15.0, 15.0, 14.0, 15.0, 12.0, 10.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.01953125, -6.81781005859375, -6.6160888671875, -6.41436767578125, -6.212646484375, -6.01092529296875, -5.8092041015625, -5.60748291015625, -5.40576171875, -5.20404052734375, -5.0023193359375, -4.80059814453125, -4.598876953125, -4.39715576171875, -4.1954345703125, -3.99371337890625, -3.7919921875, -3.59027099609375, -3.3885498046875, -3.18682861328125, -2.985107421875, -2.78338623046875, -2.5816650390625, -2.37994384765625, -2.17822265625, -1.97650146484375, -1.7747802734375, -1.57305908203125, -1.371337890625, -1.16961669921875, -0.9678955078125, -0.76617431640625, -0.564453125, -0.36273193359375, -0.1610107421875, 0.04071044921875, 0.242431640625, 0.44415283203125, 0.6458740234375, 0.84759521484375, 1.04931640625, 1.25103759765625, 1.4527587890625, 1.65447998046875, 1.856201171875, 2.05792236328125, 2.2596435546875, 2.46136474609375, 2.6630859375, 2.86480712890625, 3.0665283203125, 3.26824951171875, 3.469970703125, 3.67169189453125, 3.8734130859375, 4.07513427734375, 4.27685546875, 4.47857666015625, 4.6802978515625, 4.88201904296875, 5.083740234375, 5.28546142578125, 5.4871826171875, 5.68890380859375, 5.890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 9.0, 7.0, 13.0, 15.0, 15.0, 27.0, 34.0, 40.0, 71.0, 70.0, 133.0, 146.0, 230.0, 351.0, 438.0, 618.0, 886.0, 1212.0, 1741.0, 2670.0, 4253.0, 6984.0, 12766.0, 25435.0, 68367.0, 590181.0, 235765.0, 47886.0, 20418.0, 10543.0, 5883.0, 3644.0, 2310.0, 1573.0, 1111.0, 745.0, 556.0, 398.0, 249.0, 212.0, 169.0, 130.0, 70.0, 51.0, 50.0, 35.0, 19.0, 9.0, 5.0, 3.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.96484375, -3.8363037109375, -3.707763671875, -3.5792236328125, -3.45068359375, -3.3221435546875, -3.193603515625, -3.0650634765625, -2.9365234375, -2.8079833984375, -2.679443359375, -2.5509033203125, -2.42236328125, -2.2938232421875, -2.165283203125, -2.0367431640625, -1.908203125, -1.7796630859375, -1.651123046875, -1.5225830078125, -1.39404296875, -1.2655029296875, -1.136962890625, -1.0084228515625, -0.8798828125, -0.7513427734375, -0.622802734375, -0.4942626953125, -0.36572265625, -0.2371826171875, -0.108642578125, 0.0198974609375, 0.1484375, 0.2769775390625, 0.405517578125, 0.5340576171875, 0.66259765625, 0.7911376953125, 0.919677734375, 1.0482177734375, 1.1767578125, 1.3052978515625, 1.433837890625, 1.5623779296875, 1.69091796875, 1.8194580078125, 1.947998046875, 2.0765380859375, 2.205078125, 2.3336181640625, 2.462158203125, 2.5906982421875, 2.71923828125, 2.8477783203125, 2.976318359375, 3.1048583984375, 3.2333984375, 3.3619384765625, 3.490478515625, 3.6190185546875, 3.74755859375, 3.8760986328125, 4.004638671875, 4.1331787109375, 4.26171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 5.0, 9.0, 7.0, 6.0, 14.0, 16.0, 21.0, 31.0, 26.0, 54.0, 64.0, 119.0, 105.0, 120.0, 84.0, 70.0, 71.0, 43.0, 35.0, 17.0, 20.0, 9.0, 12.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00014591217041015625, -0.0001408495008945465, -0.00013578683137893677, -0.00013072416186332703, -0.00012566149234771729, -0.00012059882283210754, -0.0001155361533164978, -0.00011047348380088806, -0.00010541081428527832, -0.00010034814476966858, -9.528547525405884e-05, -9.02228057384491e-05, -8.516013622283936e-05, -8.009746670722961e-05, -7.503479719161987e-05, -6.997212767601013e-05, -6.490945816040039e-05, -5.984678864479065e-05, -5.478411912918091e-05, -4.972144961357117e-05, -4.4658780097961426e-05, -3.9596110582351685e-05, -3.453344106674194e-05, -2.9470771551132202e-05, -2.440810203552246e-05, -1.934543251991272e-05, -1.4282763004302979e-05, -9.220093488693237e-06, -4.157423973083496e-06, 9.052455425262451e-07, 5.967915058135986e-06, 1.1030584573745728e-05, 1.609325408935547e-05, 2.115592360496521e-05, 2.621859312057495e-05, 3.128126263618469e-05, 3.6343932151794434e-05, 4.1406601667404175e-05, 4.6469271183013916e-05, 5.153194069862366e-05, 5.65946102142334e-05, 6.165727972984314e-05, 6.671994924545288e-05, 7.178261876106262e-05, 7.684528827667236e-05, 8.19079577922821e-05, 8.697062730789185e-05, 9.203329682350159e-05, 9.709596633911133e-05, 0.00010215863585472107, 0.00010722130537033081, 0.00011228397488594055, 0.00011734664440155029, 0.00012240931391716003, 0.00012747198343276978, 0.00013253465294837952, 0.00013759732246398926, 0.000142659991979599, 0.00014772266149520874, 0.00015278533101081848, 0.00015784800052642822, 0.00016291067004203796, 0.0001679733395576477, 0.00017303600907325745, 0.0001780986785888672]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 14.0, 18.0, 29.0, 39.0, 62.0, 94.0, 166.0, 254.0, 398.0, 649.0, 1065.0, 1696.0, 3011.0, 5824.0, 12082.0, 28608.0, 92836.0, 623794.0, 198155.0, 45032.0, 17015.0, 7999.0, 4180.0, 2185.0, 1230.0, 793.0, 458.0, 307.0, 187.0, 120.0, 67.0, 52.0, 38.0, 25.0, 20.0, 14.0, 11.0, 6.0, 4.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3359375, -5.1728515625, -5.009765625, -4.8466796875, -4.68359375, -4.5205078125, -4.357421875, -4.1943359375, -4.03125, -3.8681640625, -3.705078125, -3.5419921875, -3.37890625, -3.2158203125, -3.052734375, -2.8896484375, -2.7265625, -2.5634765625, -2.400390625, -2.2373046875, -2.07421875, -1.9111328125, -1.748046875, -1.5849609375, -1.421875, -1.2587890625, -1.095703125, -0.9326171875, -0.76953125, -0.6064453125, -0.443359375, -0.2802734375, -0.1171875, 0.0458984375, 0.208984375, 0.3720703125, 0.53515625, 0.6982421875, 0.861328125, 1.0244140625, 1.1875, 1.3505859375, 1.513671875, 1.6767578125, 1.83984375, 2.0029296875, 2.166015625, 2.3291015625, 2.4921875, 2.6552734375, 2.818359375, 2.9814453125, 3.14453125, 3.3076171875, 3.470703125, 3.6337890625, 3.796875, 3.9599609375, 4.123046875, 4.2861328125, 4.44921875, 4.6123046875, 4.775390625, 4.9384765625, 5.1015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 3.0, 7.0, 2.0, 2.0, 6.0, 7.0, 23.0, 28.0, 32.0, 56.0, 74.0, 128.0, 170.0, 154.0, 102.0, 59.0, 29.0, 27.0, 17.0, 12.0, 18.0, 8.0, 11.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.1720428466796875, -1.135101318359375, -1.0981597900390625, -1.06121826171875, -1.0242767333984375, -0.987335205078125, -0.9503936767578125, -0.9134521484375, -0.8765106201171875, -0.839569091796875, -0.8026275634765625, -0.76568603515625, -0.7287445068359375, -0.691802978515625, -0.6548614501953125, -0.617919921875, -0.5809783935546875, -0.544036865234375, -0.5070953369140625, -0.47015380859375, -0.4332122802734375, -0.396270751953125, -0.3593292236328125, -0.3223876953125, -0.2854461669921875, -0.248504638671875, -0.2115631103515625, -0.17462158203125, -0.1376800537109375, -0.100738525390625, -0.0637969970703125, -0.02685546875, 0.0100860595703125, 0.047027587890625, 0.0839691162109375, 0.12091064453125, 0.1578521728515625, 0.194793701171875, 0.2317352294921875, 0.2686767578125, 0.3056182861328125, 0.342559814453125, 0.3795013427734375, 0.41644287109375, 0.4533843994140625, 0.490325927734375, 0.5272674560546875, 0.564208984375, 0.6011505126953125, 0.638092041015625, 0.6750335693359375, 0.71197509765625, 0.7489166259765625, 0.785858154296875, 0.8227996826171875, 0.8597412109375, 0.8966827392578125, 0.933624267578125, 0.9705657958984375, 1.00750732421875, 1.0444488525390625, 1.081390380859375, 1.1183319091796875, 1.1552734375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 15.0, 7.0, 17.0, 20.0, 27.0, 31.0, 51.0, 84.0, 113.0, 166.0, 136.0, 80.0, 75.0, 48.0, 27.0, 25.0, 14.0, 12.0, 16.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.902300834655762, -8.493037223815918, -8.083773612976074, -7.674509525299072, -7.2652459144592285, -6.855982303619385, -6.446718215942383, -6.037454605102539, -5.628190994262695, -5.218927383422852, -4.809663772583008, -4.400399684906006, -3.991136074066162, -3.5818724632263184, -3.1726086139678955, -2.7633447647094727, -2.354081153869629, -1.9448174238204956, -1.5355536937713623, -1.126289963722229, -0.7170262336730957, -0.30776262283325195, 0.1015012264251709, 0.5107650756835938, 0.9200286865234375, 1.3292924165725708, 1.738556146621704, 2.147819995880127, 2.5570836067199707, 2.9663472175598145, 3.3756110668182373, 3.78487491607666, 4.1941375732421875, 4.603401184082031, 5.012664794921875, 5.421928882598877, 5.831192493438721, 6.2404561042785645, 6.649720191955566, 7.05898380279541, 7.468247413635254, 7.877511024475098, 8.286774635314941, 8.696038246154785, 9.105302810668945, 9.514566421508789, 9.923830032348633, 10.333093643188477, 10.74235725402832, 11.151620864868164, 11.560884475708008, 11.970148086547852, 12.379411697387695, 12.788675308227539, 13.1979398727417, 13.607203483581543, 14.016467094421387, 14.42573070526123, 14.834994316101074, 15.244257926940918, 15.653522491455078, 16.062786102294922, 16.472049713134766, 16.88131332397461, 17.290576934814453]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 7.0, 18.0, 14.0, 17.0, 27.0, 26.0, 28.0, 45.0, 28.0, 45.0, 51.0, 31.0, 42.0, 43.0, 52.0, 40.0, 41.0, 44.0, 51.0, 39.0, 40.0, 38.0, 30.0, 36.0, 21.0, 18.0, 24.0, 16.0, 19.0, 10.0, 8.0, 9.0, 8.0, 2.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.872030258178711, -6.651519298553467, -6.4310078620910645, -6.21049690246582, -5.989985466003418, -5.769474506378174, -5.54896354675293, -5.328452110290527, -5.107941150665283, -4.887430191040039, -4.666918754577637, -4.446407794952393, -4.225896835327148, -4.005385398864746, -3.784874439239502, -3.5643632411956787, -3.3438520431518555, -3.1233408451080322, -2.902829647064209, -2.682318687438965, -2.4618074893951416, -2.2412962913513184, -2.020785331726074, -1.800274133682251, -1.5797629356384277, -1.3592517375946045, -1.1387406587600708, -0.9182295203208923, -0.6977183818817139, -0.4772071838378906, -0.25669610500335693, -0.03618502616882324, 0.1843266487121582, 0.40483778715133667, 0.6253489255905151, 0.8458600640296936, 1.066371202468872, 1.2868824005126953, 1.507393479347229, 1.7279045581817627, 1.948415756225586, 2.168926954269409, 2.3894381523132324, 2.6099491119384766, 2.8304603099823, 3.050971508026123, 3.271482467651367, 3.4919936656951904, 3.7125048637390137, 3.933016061782837, 4.15352725982666, 4.374038219451904, 4.594549179077148, 4.815060615539551, 5.035571575164795, 5.256082534790039, 5.476593971252441, 5.6971049308776855, 5.917616367340088, 6.138127326965332, 6.358638763427734, 6.5791497230529785, 6.799660682678223, 7.020172119140625, 7.240683078765869]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 8.0, 17.0, 15.0, 23.0, 39.0, 55.0, 74.0, 123.0, 141.0, 236.0, 329.0, 485.0, 696.0, 1045.0, 1679.0, 2440.0, 3942.0, 6431.0, 10530.0, 18086.0, 31305.0, 56133.0, 103250.0, 199925.0, 267994.0, 154507.0, 80975.0, 44524.0, 25168.0, 14735.0, 8747.0, 5343.0, 3293.0, 2127.0, 1314.0, 901.0, 572.0, 404.0, 286.0, 180.0, 140.0, 104.0, 65.0, 44.0, 32.0, 34.0, 26.0, 13.0, 12.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.7427978515625, -10.399658203125, -10.0565185546875, -9.71337890625, -9.3702392578125, -9.027099609375, -8.6839599609375, -8.3408203125, -7.9976806640625, -7.654541015625, -7.3114013671875, -6.96826171875, -6.6251220703125, -6.281982421875, -5.9388427734375, -5.595703125, -5.2525634765625, -4.909423828125, -4.5662841796875, -4.22314453125, -3.8800048828125, -3.536865234375, -3.1937255859375, -2.8505859375, -2.5074462890625, -2.164306640625, -1.8211669921875, -1.47802734375, -1.1348876953125, -0.791748046875, -0.4486083984375, -0.10546875, 0.2376708984375, 0.580810546875, 0.9239501953125, 1.26708984375, 1.6102294921875, 1.953369140625, 2.2965087890625, 2.6396484375, 2.9827880859375, 3.325927734375, 3.6690673828125, 4.01220703125, 4.3553466796875, 4.698486328125, 5.0416259765625, 5.384765625, 5.7279052734375, 6.071044921875, 6.4141845703125, 6.75732421875, 7.1004638671875, 7.443603515625, 7.7867431640625, 8.1298828125, 8.4730224609375, 8.816162109375, 9.1593017578125, 9.50244140625, 9.8455810546875, 10.188720703125, 10.5318603515625, 10.875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 10.0, 10.0, 10.0, 15.0, 14.0, 20.0, 33.0, 31.0, 30.0, 34.0, 39.0, 33.0, 29.0, 29.0, 41.0, 44.0, 49.0, 38.0, 41.0, 41.0, 36.0, 40.0, 30.0, 28.0, 35.0, 25.0, 30.0, 13.0, 24.0, 21.0, 15.0, 10.0, 14.0, 15.0, 11.0, 10.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-5.1015625, -4.933349609375, -4.76513671875, -4.596923828125, -4.4287109375, -4.260498046875, -4.09228515625, -3.924072265625, -3.755859375, -3.587646484375, -3.41943359375, -3.251220703125, -3.0830078125, -2.914794921875, -2.74658203125, -2.578369140625, -2.41015625, -2.241943359375, -2.07373046875, -1.905517578125, -1.7373046875, -1.569091796875, -1.40087890625, -1.232666015625, -1.064453125, -0.896240234375, -0.72802734375, -0.559814453125, -0.3916015625, -0.223388671875, -0.05517578125, 0.113037109375, 0.28125, 0.449462890625, 0.61767578125, 0.785888671875, 0.9541015625, 1.122314453125, 1.29052734375, 1.458740234375, 1.626953125, 1.795166015625, 1.96337890625, 2.131591796875, 2.2998046875, 2.468017578125, 2.63623046875, 2.804443359375, 2.97265625, 3.140869140625, 3.30908203125, 3.477294921875, 3.6455078125, 3.813720703125, 3.98193359375, 4.150146484375, 4.318359375, 4.486572265625, 4.65478515625, 4.822998046875, 4.9912109375, 5.159423828125, 5.32763671875, 5.495849609375, 5.6640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 11.0, 18.0, 14.0, 34.0, 32.0, 41.0, 64.0, 88.0, 129.0, 181.0, 264.0, 364.0, 542.0, 853.0, 1293.0, 1999.0, 3331.0, 5845.0, 10546.0, 18626.0, 36097.0, 71298.0, 155039.0, 300670.0, 227399.0, 104043.0, 50388.0, 25960.0, 13745.0, 7878.0, 4440.0, 2550.0, 1540.0, 1068.0, 665.0, 450.0, 308.0, 211.0, 139.0, 116.0, 73.0, 48.0, 31.0, 22.0, 24.0, 25.0, 16.0, 6.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.1328125, -10.770751953125, -10.40869140625, -10.046630859375, -9.6845703125, -9.322509765625, -8.96044921875, -8.598388671875, -8.236328125, -7.874267578125, -7.51220703125, -7.150146484375, -6.7880859375, -6.426025390625, -6.06396484375, -5.701904296875, -5.33984375, -4.977783203125, -4.61572265625, -4.253662109375, -3.8916015625, -3.529541015625, -3.16748046875, -2.805419921875, -2.443359375, -2.081298828125, -1.71923828125, -1.357177734375, -0.9951171875, -0.633056640625, -0.27099609375, 0.091064453125, 0.453125, 0.815185546875, 1.17724609375, 1.539306640625, 1.9013671875, 2.263427734375, 2.62548828125, 2.987548828125, 3.349609375, 3.711669921875, 4.07373046875, 4.435791015625, 4.7978515625, 5.159912109375, 5.52197265625, 5.884033203125, 6.24609375, 6.608154296875, 6.97021484375, 7.332275390625, 7.6943359375, 8.056396484375, 8.41845703125, 8.780517578125, 9.142578125, 9.504638671875, 9.86669921875, 10.228759765625, 10.5908203125, 10.952880859375, 11.31494140625, 11.677001953125, 12.0390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 13.0, 4.0, 11.0, 4.0, 8.0, 10.0, 12.0, 24.0, 16.0, 22.0, 19.0, 19.0, 23.0, 37.0, 34.0, 38.0, 29.0, 43.0, 42.0, 38.0, 47.0, 46.0, 41.0, 46.0, 31.0, 40.0, 32.0, 50.0, 33.0, 19.0, 30.0, 21.0, 15.0, 21.0, 15.0, 11.0, 10.0, 9.0, 9.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.71484375, -3.597900390625, -3.48095703125, -3.364013671875, -3.2470703125, -3.130126953125, -3.01318359375, -2.896240234375, -2.779296875, -2.662353515625, -2.54541015625, -2.428466796875, -2.3115234375, -2.194580078125, -2.07763671875, -1.960693359375, -1.84375, -1.726806640625, -1.60986328125, -1.492919921875, -1.3759765625, -1.259033203125, -1.14208984375, -1.025146484375, -0.908203125, -0.791259765625, -0.67431640625, -0.557373046875, -0.4404296875, -0.323486328125, -0.20654296875, -0.089599609375, 0.02734375, 0.144287109375, 0.26123046875, 0.378173828125, 0.4951171875, 0.612060546875, 0.72900390625, 0.845947265625, 0.962890625, 1.079833984375, 1.19677734375, 1.313720703125, 1.4306640625, 1.547607421875, 1.66455078125, 1.781494140625, 1.8984375, 2.015380859375, 2.13232421875, 2.249267578125, 2.3662109375, 2.483154296875, 2.60009765625, 2.717041015625, 2.833984375, 2.950927734375, 3.06787109375, 3.184814453125, 3.3017578125, 3.418701171875, 3.53564453125, 3.652587890625, 3.76953125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 13.0, 12.0, 15.0, 20.0, 30.0, 43.0, 73.0, 95.0, 111.0, 166.0, 234.0, 388.0, 507.0, 755.0, 1236.0, 1969.0, 3330.0, 6306.0, 13720.0, 35796.0, 150316.0, 704587.0, 81422.0, 24609.0, 10168.0, 5060.0, 2807.0, 1587.0, 1011.0, 655.0, 441.0, 302.0, 219.0, 147.0, 100.0, 77.0, 58.0, 37.0, 32.0, 25.0, 21.0, 11.0, 3.0, 12.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.25, -17.71826171875, -17.1865234375, -16.65478515625, -16.123046875, -15.59130859375, -15.0595703125, -14.52783203125, -13.99609375, -13.46435546875, -12.9326171875, -12.40087890625, -11.869140625, -11.33740234375, -10.8056640625, -10.27392578125, -9.7421875, -9.21044921875, -8.6787109375, -8.14697265625, -7.615234375, -7.08349609375, -6.5517578125, -6.02001953125, -5.48828125, -4.95654296875, -4.4248046875, -3.89306640625, -3.361328125, -2.82958984375, -2.2978515625, -1.76611328125, -1.234375, -0.70263671875, -0.1708984375, 0.36083984375, 0.892578125, 1.42431640625, 1.9560546875, 2.48779296875, 3.01953125, 3.55126953125, 4.0830078125, 4.61474609375, 5.146484375, 5.67822265625, 6.2099609375, 6.74169921875, 7.2734375, 7.80517578125, 8.3369140625, 8.86865234375, 9.400390625, 9.93212890625, 10.4638671875, 10.99560546875, 11.52734375, 12.05908203125, 12.5908203125, 13.12255859375, 13.654296875, 14.18603515625, 14.7177734375, 15.24951171875, 15.78125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 13.0, 13.0, 9.0, 17.0, 28.0, 28.0, 42.0, 57.0, 88.0, 127.0, 159.0, 110.0, 71.0, 48.0, 39.0, 32.0, 21.0, 19.0, 24.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006008148193359375, -0.0005842819809913635, -0.0005677491426467896, -0.0005512163043022156, -0.0005346834659576416, -0.0005181506276130676, -0.0005016177892684937, -0.0004850849509239197, -0.0004685521125793457, -0.00045201927423477173, -0.00043548643589019775, -0.0004189535975456238, -0.0004024207592010498, -0.00038588792085647583, -0.00036935508251190186, -0.0003528222441673279, -0.0003362894058227539, -0.00031975656747817993, -0.00030322372913360596, -0.000286690890789032, -0.000270158052444458, -0.00025362521409988403, -0.00023709237575531006, -0.00022055953741073608, -0.0002040266990661621, -0.00018749386072158813, -0.00017096102237701416, -0.00015442818403244019, -0.0001378953456878662, -0.00012136250734329224, -0.00010482966899871826, -8.829683065414429e-05, -7.176399230957031e-05, -5.523115396499634e-05, -3.869831562042236e-05, -2.216547727584839e-05, -5.632638931274414e-06, 1.090019941329956e-05, 2.7433037757873535e-05, 4.396587610244751e-05, 6.0498714447021484e-05, 7.703155279159546e-05, 9.356439113616943e-05, 0.00011009722948074341, 0.00012663006782531738, 0.00014316290616989136, 0.00015969574451446533, 0.0001762285828590393, 0.00019276142120361328, 0.00020929425954818726, 0.00022582709789276123, 0.0002423599362373352, 0.0002588927745819092, 0.00027542561292648315, 0.00029195845127105713, 0.0003084912896156311, 0.0003250241279602051, 0.00034155696630477905, 0.00035808980464935303, 0.000374622642993927, 0.000391155481338501, 0.00040768831968307495, 0.0004242211580276489, 0.0004407539963722229, 0.0004572868347167969]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 5.0, 10.0, 17.0, 12.0, 19.0, 37.0, 38.0, 67.0, 84.0, 108.0, 151.0, 244.0, 291.0, 398.0, 618.0, 889.0, 1366.0, 2024.0, 3263.0, 5738.0, 11132.0, 27406.0, 104196.0, 736967.0, 100635.0, 26631.0, 11155.0, 5501.0, 3137.0, 2036.0, 1341.0, 896.0, 610.0, 422.0, 292.0, 214.0, 166.0, 125.0, 77.0, 55.0, 49.0, 35.0, 22.0, 16.0, 16.0, 11.0, 8.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3515625, -12.8988037109375, -12.446044921875, -11.9932861328125, -11.54052734375, -11.0877685546875, -10.635009765625, -10.1822509765625, -9.7294921875, -9.2767333984375, -8.823974609375, -8.3712158203125, -7.91845703125, -7.4656982421875, -7.012939453125, -6.5601806640625, -6.107421875, -5.6546630859375, -5.201904296875, -4.7491455078125, -4.29638671875, -3.8436279296875, -3.390869140625, -2.9381103515625, -2.4853515625, -2.0325927734375, -1.579833984375, -1.1270751953125, -0.67431640625, -0.2215576171875, 0.231201171875, 0.6839599609375, 1.13671875, 1.5894775390625, 2.042236328125, 2.4949951171875, 2.94775390625, 3.4005126953125, 3.853271484375, 4.3060302734375, 4.7587890625, 5.2115478515625, 5.664306640625, 6.1170654296875, 6.56982421875, 7.0225830078125, 7.475341796875, 7.9281005859375, 8.380859375, 8.8336181640625, 9.286376953125, 9.7391357421875, 10.19189453125, 10.6446533203125, 11.097412109375, 11.5501708984375, 12.0029296875, 12.4556884765625, 12.908447265625, 13.3612060546875, 13.81396484375, 14.2667236328125, 14.719482421875, 15.1722412109375, 15.625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 7.0, 10.0, 12.0, 21.0, 25.0, 29.0, 42.0, 59.0, 85.0, 254.0, 145.0, 81.0, 52.0, 43.0, 32.0, 17.0, 17.0, 5.0, 9.0, 6.0, 3.0, 2.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.748046875, -3.640716552734375, -3.53338623046875, -3.426055908203125, -3.3187255859375, -3.211395263671875, -3.10406494140625, -2.996734619140625, -2.889404296875, -2.782073974609375, -2.67474365234375, -2.567413330078125, -2.4600830078125, -2.352752685546875, -2.24542236328125, -2.138092041015625, -2.03076171875, -1.923431396484375, -1.81610107421875, -1.708770751953125, -1.6014404296875, -1.494110107421875, -1.38677978515625, -1.279449462890625, -1.172119140625, -1.064788818359375, -0.95745849609375, -0.850128173828125, -0.7427978515625, -0.635467529296875, -0.52813720703125, -0.420806884765625, -0.3134765625, -0.206146240234375, -0.09881591796875, 0.008514404296875, 0.1158447265625, 0.223175048828125, 0.33050537109375, 0.437835693359375, 0.545166015625, 0.652496337890625, 0.75982666015625, 0.867156982421875, 0.9744873046875, 1.081817626953125, 1.18914794921875, 1.296478271484375, 1.40380859375, 1.511138916015625, 1.61846923828125, 1.725799560546875, 1.8331298828125, 1.940460205078125, 2.04779052734375, 2.155120849609375, 2.262451171875, 2.369781494140625, 2.47711181640625, 2.584442138671875, 2.6917724609375, 2.799102783203125, 2.90643310546875, 3.013763427734375, 3.12109375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 2.0, 9.0, 8.0, 9.0, 7.0, 17.0, 25.0, 60.0, 84.0, 102.0, 167.0, 135.0, 97.0, 69.0, 59.0, 40.0, 27.0, 15.0, 13.0, 9.0, 8.0, 5.0, 7.0, 3.0, 2.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.680816650390625, -6.3064093589782715, -5.932002067565918, -5.557595252990723, -5.183187961578369, -4.808780670166016, -4.43437385559082, -4.059966564178467, -3.6855592727661133, -3.3111519813537598, -2.9367449283599854, -2.562337875366211, -2.1879305839538574, -1.8135234117507935, -1.4391162395477295, -1.064709186553955, -0.6903018951416016, -0.3158947229385376, 0.05851244926452637, 0.43291962146759033, 0.8073267936706543, 1.1817339658737183, 1.5561411380767822, 1.9305481910705566, 2.30495548248291, 2.6793627738952637, 3.053769826889038, 3.4281768798828125, 3.802584171295166, 4.1769914627075195, 4.551398277282715, 4.925805568695068, 5.300212860107422, 5.674620151519775, 6.049027442932129, 6.423434257507324, 6.797841548919678, 7.172248840332031, 7.546655654907227, 7.92106294631958, 8.295470237731934, 8.669877052307129, 9.04428482055664, 9.418691635131836, 9.793098449707031, 10.167506217956543, 10.541913032531738, 10.91632080078125, 11.290727615356445, 11.66513442993164, 12.039542198181152, 12.413949012756348, 12.78835678100586, 13.162763595581055, 13.53717041015625, 13.911577224731445, 14.285984992980957, 14.660391807556152, 15.034799575805664, 15.40920639038086, 15.783613204956055, 16.15802001953125, 16.532428741455078, 16.906835556030273, 17.28124237060547]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 9.0, 11.0, 15.0, 17.0, 15.0, 22.0, 26.0, 27.0, 34.0, 35.0, 40.0, 45.0, 49.0, 45.0, 44.0, 54.0, 57.0, 48.0, 43.0, 39.0, 40.0, 39.0, 38.0, 27.0, 29.0, 24.0, 20.0, 16.0, 15.0, 15.0, 3.0, 20.0, 12.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.094730854034424, -6.886653900146484, -6.678576946258545, -6.4704999923706055, -6.262423038482666, -6.054346084594727, -5.846269130706787, -5.638192176818848, -5.430115222930908, -5.222038269042969, -5.013961315155029, -4.80588436126709, -4.59780740737915, -4.389730453491211, -4.1816534996032715, -3.973576545715332, -3.7654998302459717, -3.5574228763580322, -3.3493459224700928, -3.1412689685821533, -2.933192014694214, -2.7251152992248535, -2.517038345336914, -2.3089613914489746, -2.100884437561035, -1.8928074836730957, -1.6847305297851562, -1.4766535758972168, -1.2685766220092773, -1.0604997873306274, -0.852422833442688, -0.6443458795547485, -0.43626880645751953, -0.22819186747074127, -0.020114928483963013, 0.18796199560165405, 0.3960389494895935, 0.6041158437728882, 0.8121927976608276, 1.020269751548767, 1.2283467054367065, 1.436423659324646, 1.6445006132125854, 1.8525774478912354, 2.060654401779175, 2.2687313556671143, 2.4768083095550537, 2.684885263442993, 2.8929622173309326, 3.101039171218872, 3.3091161251068115, 3.517193078994751, 3.7252700328826904, 3.933346748352051, 4.14142370223999, 4.34950065612793, 4.557577610015869, 4.765654563903809, 4.973731517791748, 5.1818084716796875, 5.389885425567627, 5.597962379455566, 5.806039333343506, 6.014116287231445, 6.222193241119385]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 18.0, 18.0, 22.0, 36.0, 47.0, 68.0, 113.0, 156.0, 234.0, 318.0, 475.0, 589.0, 905.0, 1310.0, 1800.0, 2619.0, 3698.0, 5136.0, 7947.0, 12060.0, 19170.0, 31702.0, 57005.0, 111665.0, 269215.0, 1007126.0, 1769679.0, 520359.0, 172109.0, 81100.0, 43905.0, 26109.0, 16199.0, 10289.0, 6686.0, 4425.0, 3107.0, 2141.0, 1422.0, 1019.0, 749.0, 506.0, 360.0, 233.0, 149.0, 111.0, 66.0, 42.0, 22.0, 18.0, 6.0, 4.0, 5.0, 3.0, 1.0], "bins": [-8.984375, -8.72967529296875, -8.4749755859375, -8.22027587890625, -7.965576171875, -7.71087646484375, -7.4561767578125, -7.20147705078125, -6.94677734375, -6.69207763671875, -6.4373779296875, -6.18267822265625, -5.927978515625, -5.67327880859375, -5.4185791015625, -5.16387939453125, -4.9091796875, -4.65447998046875, -4.3997802734375, -4.14508056640625, -3.890380859375, -3.63568115234375, -3.3809814453125, -3.12628173828125, -2.87158203125, -2.61688232421875, -2.3621826171875, -2.10748291015625, -1.852783203125, -1.59808349609375, -1.3433837890625, -1.08868408203125, -0.833984375, -0.57928466796875, -0.3245849609375, -0.06988525390625, 0.184814453125, 0.43951416015625, 0.6942138671875, 0.94891357421875, 1.20361328125, 1.45831298828125, 1.7130126953125, 1.96771240234375, 2.222412109375, 2.47711181640625, 2.7318115234375, 2.98651123046875, 3.2412109375, 3.49591064453125, 3.7506103515625, 4.00531005859375, 4.260009765625, 4.51470947265625, 4.7694091796875, 5.02410888671875, 5.27880859375, 5.53350830078125, 5.7882080078125, 6.04290771484375, 6.297607421875, 6.55230712890625, 6.8070068359375, 7.06170654296875, 7.31640625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 7.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 10.0, 17.0, 10.0, 10.0, 17.0, 20.0, 16.0, 34.0, 24.0, 46.0, 33.0, 48.0, 48.0, 34.0, 51.0, 47.0, 39.0, 55.0, 38.0, 48.0, 47.0, 39.0, 32.0, 29.0, 23.0, 24.0, 22.0, 18.0, 20.0, 15.0, 16.0, 10.0, 12.0, 6.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.203125, -4.087738037109375, -3.97235107421875, -3.856964111328125, -3.7415771484375, -3.626190185546875, -3.51080322265625, -3.395416259765625, -3.280029296875, -3.164642333984375, -3.04925537109375, -2.933868408203125, -2.8184814453125, -2.703094482421875, -2.58770751953125, -2.472320556640625, -2.35693359375, -2.241546630859375, -2.12615966796875, -2.010772705078125, -1.8953857421875, -1.779998779296875, -1.66461181640625, -1.549224853515625, -1.433837890625, -1.318450927734375, -1.20306396484375, -1.087677001953125, -0.9722900390625, -0.856903076171875, -0.74151611328125, -0.626129150390625, -0.5107421875, -0.395355224609375, -0.27996826171875, -0.164581298828125, -0.0491943359375, 0.066192626953125, 0.18157958984375, 0.296966552734375, 0.412353515625, 0.527740478515625, 0.64312744140625, 0.758514404296875, 0.8739013671875, 0.989288330078125, 1.10467529296875, 1.220062255859375, 1.33544921875, 1.450836181640625, 1.56622314453125, 1.681610107421875, 1.7969970703125, 1.912384033203125, 2.02777099609375, 2.143157958984375, 2.258544921875, 2.373931884765625, 2.48931884765625, 2.604705810546875, 2.7200927734375, 2.835479736328125, 2.95086669921875, 3.066253662109375, 3.181640625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 9.0, 14.0, 16.0, 17.0, 30.0, 42.0, 62.0, 87.0, 126.0, 154.0, 237.0, 332.0, 475.0, 722.0, 1010.0, 1487.0, 2286.0, 3540.0, 5790.0, 9070.0, 15136.0, 27225.0, 51256.0, 103669.0, 232490.0, 633073.0, 1755765.0, 811744.0, 282608.0, 121337.0, 58596.0, 30550.0, 17224.0, 10142.0, 6193.0, 3906.0, 2528.0, 1706.0, 1108.0, 746.0, 554.0, 369.0, 251.0, 171.0, 126.0, 91.0, 67.0, 50.0, 29.0, 27.0, 8.0, 14.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0], "bins": [-7.58203125, -7.3494873046875, -7.116943359375, -6.8843994140625, -6.65185546875, -6.4193115234375, -6.186767578125, -5.9542236328125, -5.7216796875, -5.4891357421875, -5.256591796875, -5.0240478515625, -4.79150390625, -4.5589599609375, -4.326416015625, -4.0938720703125, -3.861328125, -3.6287841796875, -3.396240234375, -3.1636962890625, -2.93115234375, -2.6986083984375, -2.466064453125, -2.2335205078125, -2.0009765625, -1.7684326171875, -1.535888671875, -1.3033447265625, -1.07080078125, -0.8382568359375, -0.605712890625, -0.3731689453125, -0.140625, 0.0919189453125, 0.324462890625, 0.5570068359375, 0.78955078125, 1.0220947265625, 1.254638671875, 1.4871826171875, 1.7197265625, 1.9522705078125, 2.184814453125, 2.4173583984375, 2.64990234375, 2.8824462890625, 3.114990234375, 3.3475341796875, 3.580078125, 3.8126220703125, 4.045166015625, 4.2777099609375, 4.51025390625, 4.7427978515625, 4.975341796875, 5.2078857421875, 5.4404296875, 5.6729736328125, 5.905517578125, 6.1380615234375, 6.37060546875, 6.6031494140625, 6.835693359375, 7.0682373046875, 7.30078125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 9.0, 14.0, 10.0, 16.0, 21.0, 25.0, 51.0, 57.0, 37.0, 62.0, 83.0, 110.0, 125.0, 120.0, 165.0, 234.0, 217.0, 277.0, 285.0, 328.0, 310.0, 260.0, 223.0, 185.0, 155.0, 127.0, 86.0, 86.0, 68.0, 58.0, 47.0, 39.0, 37.0, 19.0, 23.0, 22.0, 10.0, 9.0, 10.0, 13.0, 13.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.875, -1.81561279296875, -1.7562255859375, -1.69683837890625, -1.637451171875, -1.57806396484375, -1.5186767578125, -1.45928955078125, -1.39990234375, -1.34051513671875, -1.2811279296875, -1.22174072265625, -1.162353515625, -1.10296630859375, -1.0435791015625, -0.98419189453125, -0.9248046875, -0.86541748046875, -0.8060302734375, -0.74664306640625, -0.687255859375, -0.62786865234375, -0.5684814453125, -0.50909423828125, -0.44970703125, -0.39031982421875, -0.3309326171875, -0.27154541015625, -0.212158203125, -0.15277099609375, -0.0933837890625, -0.03399658203125, 0.025390625, 0.08477783203125, 0.1441650390625, 0.20355224609375, 0.262939453125, 0.32232666015625, 0.3817138671875, 0.44110107421875, 0.50048828125, 0.55987548828125, 0.6192626953125, 0.67864990234375, 0.738037109375, 0.79742431640625, 0.8568115234375, 0.91619873046875, 0.9755859375, 1.03497314453125, 1.0943603515625, 1.15374755859375, 1.213134765625, 1.27252197265625, 1.3319091796875, 1.39129638671875, 1.45068359375, 1.51007080078125, 1.5694580078125, 1.62884521484375, 1.688232421875, 1.74761962890625, 1.8070068359375, 1.86639404296875, 1.92578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 7.0, 7.0, 11.0, 16.0, 16.0, 25.0, 54.0, 72.0, 110.0, 129.0, 161.0, 129.0, 76.0, 51.0, 50.0, 21.0, 15.0, 10.0, 5.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.27719783782959, -5.997032642364502, -5.716867923736572, -5.436702728271484, -5.156538009643555, -4.876372814178467, -4.596207618713379, -4.316042900085449, -4.0358781814575195, -3.7557132244110107, -3.475548267364502, -3.195383071899414, -2.9152183532714844, -2.6350531578063965, -2.3548882007598877, -2.074723243713379, -1.794558048248291, -1.5143930912017822, -1.2342281341552734, -0.9540630578994751, -0.6738981008529663, -0.3937331438064575, -0.11356806755065918, 0.1665968894958496, 0.4467618465423584, 0.7269268035888672, 1.007091760635376, 1.2872568368911743, 1.567421793937683, 1.847586750984192, 2.1277518272399902, 2.407916784286499, 2.688081741333008, 2.9682466983795166, 3.2484116554260254, 3.5285768508911133, 3.808741569519043, 4.088906764984131, 4.369071960449219, 4.649236679077148, 4.929401397705078, 5.209566593170166, 5.489731311798096, 5.769896507263184, 6.050061225891113, 6.330226421356201, 6.610391616821289, 6.890556335449219, 7.170721530914307, 7.4508867263793945, 7.731051445007324, 8.011216163635254, 8.2913818359375, 8.57154655456543, 8.85171127319336, 9.131875991821289, 9.412041664123535, 9.692206382751465, 9.972372055053711, 10.25253677368164, 10.53270149230957, 10.8128662109375, 11.093031883239746, 11.373196601867676, 11.653361320495605]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 8.0, 10.0, 6.0, 6.0, 13.0, 9.0, 12.0, 23.0, 21.0, 31.0, 26.0, 28.0, 35.0, 33.0, 41.0, 37.0, 38.0, 48.0, 33.0, 30.0, 36.0, 61.0, 32.0, 34.0, 37.0, 33.0, 38.0, 24.0, 28.0, 28.0, 17.0, 20.0, 13.0, 21.0, 16.0, 9.0, 13.0, 10.0, 3.0, 11.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.869497537612915, -3.750976085662842, -3.6324548721313477, -3.5139334201812744, -3.395411968231201, -3.276890754699707, -3.158369302749634, -3.0398478507995605, -2.9213266372680664, -2.802805185317993, -2.684283971786499, -2.565762519836426, -2.4472413063049316, -2.3287198543548584, -2.210198402404785, -2.091677188873291, -1.9731557369232178, -1.854634404182434, -1.7361130714416504, -1.6175916194915771, -1.4990702867507935, -1.3805489540100098, -1.2620275020599365, -1.1435061693191528, -1.0249848365783691, -0.9064635038375854, -0.787942111492157, -0.6694207191467285, -0.5508993864059448, -0.43237805366516113, -0.31385666131973267, -0.1953352689743042, -0.07681393623352051, 0.04170742630958557, 0.16022878885269165, 0.27875015139579773, 0.3972715139389038, 0.5157928466796875, 0.634314239025116, 0.7528356313705444, 0.8713569641113281, 0.9898782968521118, 1.1083996295928955, 1.2269210815429688, 1.3454424142837524, 1.4639637470245361, 1.5824851989746094, 1.701006531715393, 1.8195278644561768, 1.9380491971969604, 2.056570529937744, 2.1750919818878174, 2.2936134338378906, 2.4121346473693848, 2.530656099319458, 2.6491775512695312, 2.7676987648010254, 2.8862202167510986, 3.0047414302825928, 3.123262882232666, 3.24178409576416, 3.3603055477142334, 3.4788269996643066, 3.597348213195801, 3.715869665145874]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 4.0, 3.0, 9.0, 15.0, 15.0, 24.0, 34.0, 40.0, 51.0, 87.0, 85.0, 119.0, 164.0, 220.0, 308.0, 416.0, 529.0, 777.0, 1052.0, 1618.0, 2125.0, 3176.0, 4784.0, 7396.0, 11812.0, 19333.0, 34665.0, 69995.0, 199289.0, 433435.0, 129065.0, 53467.0, 28075.0, 16231.0, 9943.0, 6369.0, 4070.0, 2823.0, 1956.0, 1403.0, 990.0, 708.0, 488.0, 368.0, 248.0, 181.0, 131.0, 136.0, 82.0, 62.0, 56.0, 41.0, 29.0, 22.0, 9.0, 10.0, 10.0, 4.0, 1.0, 6.0, 2.0], "bins": [-4.65625, -4.51220703125, -4.3681640625, -4.22412109375, -4.080078125, -3.93603515625, -3.7919921875, -3.64794921875, -3.50390625, -3.35986328125, -3.2158203125, -3.07177734375, -2.927734375, -2.78369140625, -2.6396484375, -2.49560546875, -2.3515625, -2.20751953125, -2.0634765625, -1.91943359375, -1.775390625, -1.63134765625, -1.4873046875, -1.34326171875, -1.19921875, -1.05517578125, -0.9111328125, -0.76708984375, -0.623046875, -0.47900390625, -0.3349609375, -0.19091796875, -0.046875, 0.09716796875, 0.2412109375, 0.38525390625, 0.529296875, 0.67333984375, 0.8173828125, 0.96142578125, 1.10546875, 1.24951171875, 1.3935546875, 1.53759765625, 1.681640625, 1.82568359375, 1.9697265625, 2.11376953125, 2.2578125, 2.40185546875, 2.5458984375, 2.68994140625, 2.833984375, 2.97802734375, 3.1220703125, 3.26611328125, 3.41015625, 3.55419921875, 3.6982421875, 3.84228515625, 3.986328125, 4.13037109375, 4.2744140625, 4.41845703125, 4.5625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 13.0, 8.0, 12.0, 18.0, 26.0, 19.0, 23.0, 22.0, 28.0, 40.0, 36.0, 41.0, 36.0, 57.0, 45.0, 33.0, 38.0, 44.0, 53.0, 40.0, 36.0, 37.0, 40.0, 21.0, 29.0, 25.0, 21.0, 18.0, 17.0, 15.0, 15.0, 22.0, 4.0, 12.0, 7.0, 3.0, 2.0, 5.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-4.55859375, -4.4288330078125, -4.299072265625, -4.1693115234375, -4.03955078125, -3.9097900390625, -3.780029296875, -3.6502685546875, -3.5205078125, -3.3907470703125, -3.260986328125, -3.1312255859375, -3.00146484375, -2.8717041015625, -2.741943359375, -2.6121826171875, -2.482421875, -2.3526611328125, -2.222900390625, -2.0931396484375, -1.96337890625, -1.8336181640625, -1.703857421875, -1.5740966796875, -1.4443359375, -1.3145751953125, -1.184814453125, -1.0550537109375, -0.92529296875, -0.7955322265625, -0.665771484375, -0.5360107421875, -0.40625, -0.2764892578125, -0.146728515625, -0.0169677734375, 0.11279296875, 0.2425537109375, 0.372314453125, 0.5020751953125, 0.6318359375, 0.7615966796875, 0.891357421875, 1.0211181640625, 1.15087890625, 1.2806396484375, 1.410400390625, 1.5401611328125, 1.669921875, 1.7996826171875, 1.929443359375, 2.0592041015625, 2.18896484375, 2.3187255859375, 2.448486328125, 2.5782470703125, 2.7080078125, 2.8377685546875, 2.967529296875, 3.0972900390625, 3.22705078125, 3.3568115234375, 3.486572265625, 3.6163330078125, 3.74609375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 12.0, 18.0, 27.0, 22.0, 52.0, 56.0, 92.0, 115.0, 198.0, 288.0, 386.0, 577.0, 807.0, 1215.0, 2005.0, 3149.0, 5792.0, 11552.0, 28233.0, 161965.0, 741420.0, 53675.0, 17173.0, 8051.0, 4357.0, 2571.0, 1568.0, 1018.0, 621.0, 476.0, 307.0, 214.0, 158.0, 115.0, 78.0, 59.0, 35.0, 27.0, 15.0, 18.0, 10.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.3515625, -9.0703125, -8.7890625, -8.5078125, -8.2265625, -7.9453125, -7.6640625, -7.3828125, -7.1015625, -6.8203125, -6.5390625, -6.2578125, -5.9765625, -5.6953125, -5.4140625, -5.1328125, -4.8515625, -4.5703125, -4.2890625, -4.0078125, -3.7265625, -3.4453125, -3.1640625, -2.8828125, -2.6015625, -2.3203125, -2.0390625, -1.7578125, -1.4765625, -1.1953125, -0.9140625, -0.6328125, -0.3515625, -0.0703125, 0.2109375, 0.4921875, 0.7734375, 1.0546875, 1.3359375, 1.6171875, 1.8984375, 2.1796875, 2.4609375, 2.7421875, 3.0234375, 3.3046875, 3.5859375, 3.8671875, 4.1484375, 4.4296875, 4.7109375, 4.9921875, 5.2734375, 5.5546875, 5.8359375, 6.1171875, 6.3984375, 6.6796875, 6.9609375, 7.2421875, 7.5234375, 7.8046875, 8.0859375, 8.3671875, 8.6484375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 10.0, 12.0, 9.0, 15.0, 17.0, 26.0, 21.0, 22.0, 33.0, 30.0, 25.0, 45.0, 27.0, 24.0, 44.0, 51.0, 44.0, 40.0, 38.0, 40.0, 39.0, 46.0, 34.0, 34.0, 34.0, 36.0, 23.0, 23.0, 17.0, 23.0, 13.0, 14.0, 13.0, 8.0, 12.0, 7.0, 6.0, 4.0, 7.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.027313232421875, -2.93353271484375, -2.839752197265625, -2.7459716796875, -2.652191162109375, -2.55841064453125, -2.464630126953125, -2.370849609375, -2.277069091796875, -2.18328857421875, -2.089508056640625, -1.9957275390625, -1.901947021484375, -1.80816650390625, -1.714385986328125, -1.62060546875, -1.526824951171875, -1.43304443359375, -1.339263916015625, -1.2454833984375, -1.151702880859375, -1.05792236328125, -0.964141845703125, -0.870361328125, -0.776580810546875, -0.68280029296875, -0.589019775390625, -0.4952392578125, -0.401458740234375, -0.30767822265625, -0.213897705078125, -0.1201171875, -0.026336669921875, 0.06744384765625, 0.161224365234375, 0.2550048828125, 0.348785400390625, 0.44256591796875, 0.536346435546875, 0.630126953125, 0.723907470703125, 0.81768798828125, 0.911468505859375, 1.0052490234375, 1.099029541015625, 1.19281005859375, 1.286590576171875, 1.38037109375, 1.474151611328125, 1.56793212890625, 1.661712646484375, 1.7554931640625, 1.849273681640625, 1.94305419921875, 2.036834716796875, 2.130615234375, 2.224395751953125, 2.31817626953125, 2.411956787109375, 2.5057373046875, 2.599517822265625, 2.69329833984375, 2.787078857421875, 2.880859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 12.0, 14.0, 24.0, 28.0, 59.0, 72.0, 124.0, 190.0, 274.0, 441.0, 792.0, 1355.0, 2533.0, 5299.0, 11792.0, 35875.0, 287800.0, 629035.0, 46289.0, 14141.0, 5843.0, 2765.0, 1500.0, 869.0, 515.0, 340.0, 181.0, 148.0, 75.0, 41.0, 31.0, 21.0, 21.0, 8.0, 4.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.302734375, -3.202911376953125, -3.10308837890625, -3.003265380859375, -2.9034423828125, -2.803619384765625, -2.70379638671875, -2.603973388671875, -2.504150390625, -2.404327392578125, -2.30450439453125, -2.204681396484375, -2.1048583984375, -2.005035400390625, -1.90521240234375, -1.805389404296875, -1.70556640625, -1.605743408203125, -1.50592041015625, -1.406097412109375, -1.3062744140625, -1.206451416015625, -1.10662841796875, -1.006805419921875, -0.906982421875, -0.807159423828125, -0.70733642578125, -0.607513427734375, -0.5076904296875, -0.407867431640625, -0.30804443359375, -0.208221435546875, -0.1083984375, -0.008575439453125, 0.09124755859375, 0.191070556640625, 0.2908935546875, 0.390716552734375, 0.49053955078125, 0.590362548828125, 0.690185546875, 0.790008544921875, 0.88983154296875, 0.989654541015625, 1.0894775390625, 1.189300537109375, 1.28912353515625, 1.388946533203125, 1.48876953125, 1.588592529296875, 1.68841552734375, 1.788238525390625, 1.8880615234375, 1.987884521484375, 2.08770751953125, 2.187530517578125, 2.287353515625, 2.387176513671875, 2.48699951171875, 2.586822509765625, 2.6866455078125, 2.786468505859375, 2.88629150390625, 2.986114501953125, 3.0859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 4.0, 5.0, 5.0, 4.0, 6.0, 11.0, 13.0, 15.0, 12.0, 22.0, 33.0, 45.0, 57.0, 67.0, 72.0, 96.0, 126.0, 79.0, 76.0, 57.0, 42.0, 29.0, 22.0, 29.0, 18.0, 10.0, 11.0, 5.0, 7.0, 2.0, 7.0, 5.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011610984802246094, -0.00011289399117231369, -0.00010967813432216644, -0.0001064622774720192, -0.00010324642062187195, -0.0001000305637717247, -9.681470692157745e-05, -9.35988500714302e-05, -9.038299322128296e-05, -8.716713637113571e-05, -8.395127952098846e-05, -8.073542267084122e-05, -7.751956582069397e-05, -7.430370897054672e-05, -7.108785212039948e-05, -6.787199527025223e-05, -6.465613842010498e-05, -6.144028156995773e-05, -5.8224424719810486e-05, -5.500856786966324e-05, -5.179271101951599e-05, -4.8576854169368744e-05, -4.5360997319221497e-05, -4.214514046907425e-05, -3.8929283618927e-05, -3.5713426768779755e-05, -3.249756991863251e-05, -2.928171306848526e-05, -2.6065856218338013e-05, -2.2849999368190765e-05, -1.9634142518043518e-05, -1.641828566789627e-05, -1.3202428817749023e-05, -9.986571967601776e-06, -6.770715117454529e-06, -3.5548582673072815e-06, -3.390014171600342e-07, 2.876855432987213e-06, 6.0927122831344604e-06, 9.308569133281708e-06, 1.2524425983428955e-05, 1.5740282833576202e-05, 1.895613968372345e-05, 2.2171996533870697e-05, 2.5387853384017944e-05, 2.860371023416519e-05, 3.181956708431244e-05, 3.5035423934459686e-05, 3.8251280784606934e-05, 4.146713763475418e-05, 4.468299448490143e-05, 4.7898851335048676e-05, 5.111470818519592e-05, 5.433056503534317e-05, 5.754642188549042e-05, 6.0762278735637665e-05, 6.397813558578491e-05, 6.719399243593216e-05, 7.04098492860794e-05, 7.362570613622665e-05, 7.68415629863739e-05, 8.005741983652115e-05, 8.32732766866684e-05, 8.648913353681564e-05, 8.970499038696289e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 13.0, 9.0, 18.0, 27.0, 29.0, 46.0, 65.0, 87.0, 108.0, 180.0, 205.0, 304.0, 477.0, 774.0, 1110.0, 1780.0, 2877.0, 4964.0, 8851.0, 17682.0, 42098.0, 137679.0, 569491.0, 168555.0, 48097.0, 19396.0, 9785.0, 5172.0, 3167.0, 1868.0, 1156.0, 728.0, 510.0, 383.0, 241.0, 165.0, 127.0, 101.0, 65.0, 53.0, 30.0, 23.0, 14.0, 11.0, 10.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.87890625, -1.8193817138671875, -1.759857177734375, -1.7003326416015625, -1.64080810546875, -1.5812835693359375, -1.521759033203125, -1.4622344970703125, -1.4027099609375, -1.3431854248046875, -1.283660888671875, -1.2241363525390625, -1.16461181640625, -1.1050872802734375, -1.045562744140625, -0.9860382080078125, -0.926513671875, -0.8669891357421875, -0.807464599609375, -0.7479400634765625, -0.68841552734375, -0.6288909912109375, -0.569366455078125, -0.5098419189453125, -0.4503173828125, -0.3907928466796875, -0.331268310546875, -0.2717437744140625, -0.21221923828125, -0.1526947021484375, -0.093170166015625, -0.0336456298828125, 0.02587890625, 0.0854034423828125, 0.144927978515625, 0.2044525146484375, 0.26397705078125, 0.3235015869140625, 0.383026123046875, 0.4425506591796875, 0.5020751953125, 0.5615997314453125, 0.621124267578125, 0.6806488037109375, 0.74017333984375, 0.7996978759765625, 0.859222412109375, 0.9187469482421875, 0.978271484375, 1.0377960205078125, 1.097320556640625, 1.1568450927734375, 1.21636962890625, 1.2758941650390625, 1.335418701171875, 1.3949432373046875, 1.4544677734375, 1.5139923095703125, 1.573516845703125, 1.6330413818359375, 1.69256591796875, 1.7520904541015625, 1.811614990234375, 1.8711395263671875, 1.9306640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 10.0, 20.0, 26.0, 37.0, 53.0, 55.0, 79.0, 115.0, 134.0, 145.0, 100.0, 66.0, 42.0, 30.0, 22.0, 12.0, 12.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478515625, -0.45975494384765625, -0.4409942626953125, -0.42223358154296875, -0.403472900390625, -0.38471221923828125, -0.3659515380859375, -0.34719085693359375, -0.32843017578125, -0.30966949462890625, -0.2909088134765625, -0.27214813232421875, -0.253387451171875, -0.23462677001953125, -0.2158660888671875, -0.19710540771484375, -0.1783447265625, -0.15958404541015625, -0.1408233642578125, -0.12206268310546875, -0.103302001953125, -0.08454132080078125, -0.0657806396484375, -0.04701995849609375, -0.02825927734375, -0.00949859619140625, 0.0092620849609375, 0.02802276611328125, 0.046783447265625, 0.06554412841796875, 0.0843048095703125, 0.10306549072265625, 0.121826171875, 0.14058685302734375, 0.1593475341796875, 0.17810821533203125, 0.196868896484375, 0.21562957763671875, 0.2343902587890625, 0.25315093994140625, 0.27191162109375, 0.29067230224609375, 0.3094329833984375, 0.32819366455078125, 0.346954345703125, 0.36571502685546875, 0.3844757080078125, 0.40323638916015625, 0.4219970703125, 0.44075775146484375, 0.4595184326171875, 0.47827911376953125, 0.497039794921875, 0.5158004760742188, 0.5345611572265625, 0.5533218383789062, 0.57208251953125, 0.5908432006835938, 0.6096038818359375, 0.6283645629882812, 0.647125244140625, 0.6658859252929688, 0.6846466064453125, 0.7034072875976562, 0.72216796875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 11.0, 14.0, 18.0, 29.0, 29.0, 52.0, 88.0, 126.0, 168.0, 146.0, 109.0, 57.0, 50.0, 37.0, 9.0, 10.0, 11.0, 2.0, 7.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1531829833984375, -5.871450901031494, -5.589718341827393, -5.307986259460449, -5.026253700256348, -4.744521617889404, -4.462789535522461, -4.181056976318359, -3.899324893951416, -3.6175925731658936, -3.335860252380371, -3.0541281700134277, -2.7723958492279053, -2.490663528442383, -2.2089314460754395, -1.927199125289917, -1.6454668045043945, -1.363734483718872, -1.0820022821426392, -0.8002700209617615, -0.5185377597808838, -0.23680543899536133, 0.04492676258087158, 0.3266589641571045, 0.608391284942627, 0.8901235461235046, 1.1718558073043823, 1.4535880088806152, 1.7353203296661377, 2.01705265045166, 2.2987847328186035, 2.580517053604126, 2.8622493743896484, 3.143981695175171, 3.4257140159606934, 3.7074460983276367, 3.989178419113159, 4.270910739898682, 4.552642822265625, 4.834375381469727, 5.11610746383667, 5.397839546203613, 5.679572105407715, 5.961304187774658, 6.243036270141602, 6.524768829345703, 6.8065009117126465, 7.08823299407959, 7.369965553283691, 7.651697635650635, 7.933430194854736, 8.21516227722168, 8.496894836425781, 8.778627395629883, 9.060359001159668, 9.34209156036377, 9.623823165893555, 9.905555725097656, 10.187287330627441, 10.469019889831543, 10.750752449035645, 11.03248405456543, 11.314216613769531, 11.595949172973633, 11.877681732177734]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 5.0, 7.0, 9.0, 6.0, 9.0, 13.0, 11.0, 20.0, 22.0, 22.0, 24.0, 34.0, 27.0, 34.0, 37.0, 40.0, 40.0, 31.0, 51.0, 33.0, 48.0, 36.0, 41.0, 41.0, 39.0, 35.0, 28.0, 36.0, 26.0, 26.0, 25.0, 17.0, 23.0, 12.0, 22.0, 8.0, 12.0, 10.0, 5.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.9159622192382812, -3.7973082065582275, -3.678654193878174, -3.56000018119812, -3.4413461685180664, -3.322692394256592, -3.204038143157959, -3.0853843688964844, -2.9667303562164307, -2.848076343536377, -2.7294223308563232, -2.6107683181762695, -2.492114305496216, -2.373460292816162, -2.2548065185546875, -2.136152505874634, -2.01749849319458, -1.8988444805145264, -1.7801904678344727, -1.661536455154419, -1.5428825616836548, -1.424228549003601, -1.3055745363235474, -1.1869206428527832, -1.0682663917541504, -0.9496123790740967, -0.8309584259986877, -0.712304413318634, -0.5936504602432251, -0.4749964475631714, -0.3563424348831177, -0.23768848180770874, -0.1190345287322998, -0.0003805384039878845, 0.11827345192432404, 0.23692744970321655, 0.3555814325809479, 0.4742354154586792, 0.5928894281387329, 0.7115433812141418, 0.8301973938941956, 0.9488514065742493, 1.0675053596496582, 1.186159372329712, 1.3048133850097656, 1.4234673976898193, 1.542121410369873, 1.6607753038406372, 1.779429316520691, 1.8980833292007446, 2.016737222671509, 2.1353912353515625, 2.254045248031616, 2.37269926071167, 2.4913532733917236, 2.6100072860717773, 2.728661298751831, 2.8473153114318848, 2.9659693241119385, 3.084623336791992, 3.203277349472046, 3.3219313621520996, 3.440585136413574, 3.559239149093628, 3.6778931617736816]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 15.0, 16.0, 30.0, 35.0, 56.0, 75.0, 119.0, 205.0, 271.0, 396.0, 594.0, 985.0, 1498.0, 2469.0, 4057.0, 6583.0, 11452.0, 20324.0, 37080.0, 71739.0, 143297.0, 266133.0, 231355.0, 116925.0, 59355.0, 31428.0, 17229.0, 9816.0, 5680.0, 3289.0, 2181.0, 1350.0, 864.0, 529.0, 363.0, 229.0, 168.0, 116.0, 74.0, 59.0, 33.0, 21.0, 20.0, 12.0, 2.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0, -7.75653076171875, -7.5130615234375, -7.26959228515625, -7.026123046875, -6.78265380859375, -6.5391845703125, -6.29571533203125, -6.05224609375, -5.80877685546875, -5.5653076171875, -5.32183837890625, -5.078369140625, -4.83489990234375, -4.5914306640625, -4.34796142578125, -4.1044921875, -3.86102294921875, -3.6175537109375, -3.37408447265625, -3.130615234375, -2.88714599609375, -2.6436767578125, -2.40020751953125, -2.15673828125, -1.91326904296875, -1.6697998046875, -1.42633056640625, -1.182861328125, -0.93939208984375, -0.6959228515625, -0.45245361328125, -0.208984375, 0.03448486328125, 0.2779541015625, 0.52142333984375, 0.764892578125, 1.00836181640625, 1.2518310546875, 1.49530029296875, 1.73876953125, 1.98223876953125, 2.2257080078125, 2.46917724609375, 2.712646484375, 2.95611572265625, 3.1995849609375, 3.44305419921875, 3.6865234375, 3.92999267578125, 4.1734619140625, 4.41693115234375, 4.660400390625, 4.90386962890625, 5.1473388671875, 5.39080810546875, 5.63427734375, 5.87774658203125, 6.1212158203125, 6.36468505859375, 6.608154296875, 6.85162353515625, 7.0950927734375, 7.33856201171875, 7.58203125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 4.0, 9.0, 5.0, 6.0, 10.0, 9.0, 12.0, 26.0, 29.0, 25.0, 35.0, 30.0, 43.0, 43.0, 43.0, 52.0, 47.0, 53.0, 39.0, 42.0, 46.0, 43.0, 50.0, 43.0, 41.0, 27.0, 37.0, 22.0, 10.0, 19.0, 17.0, 14.0, 16.0, 12.0, 11.0, 4.0, 1.0, 2.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0], "bins": [-4.296875, -4.178436279296875, -4.05999755859375, -3.941558837890625, -3.8231201171875, -3.704681396484375, -3.58624267578125, -3.467803955078125, -3.349365234375, -3.230926513671875, -3.11248779296875, -2.994049072265625, -2.8756103515625, -2.757171630859375, -2.63873291015625, -2.520294189453125, -2.40185546875, -2.283416748046875, -2.16497802734375, -2.046539306640625, -1.9281005859375, -1.809661865234375, -1.69122314453125, -1.572784423828125, -1.454345703125, -1.335906982421875, -1.21746826171875, -1.099029541015625, -0.9805908203125, -0.862152099609375, -0.74371337890625, -0.625274658203125, -0.5068359375, -0.388397216796875, -0.26995849609375, -0.151519775390625, -0.0330810546875, 0.085357666015625, 0.20379638671875, 0.322235107421875, 0.440673828125, 0.559112548828125, 0.67755126953125, 0.795989990234375, 0.9144287109375, 1.032867431640625, 1.15130615234375, 1.269744873046875, 1.38818359375, 1.506622314453125, 1.62506103515625, 1.743499755859375, 1.8619384765625, 1.980377197265625, 2.09881591796875, 2.217254638671875, 2.335693359375, 2.454132080078125, 2.57257080078125, 2.691009521484375, 2.8094482421875, 2.927886962890625, 3.04632568359375, 3.164764404296875, 3.283203125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 8.0, 5.0, 8.0, 17.0, 30.0, 34.0, 44.0, 62.0, 109.0, 168.0, 244.0, 374.0, 626.0, 1060.0, 1752.0, 3157.0, 5828.0, 10776.0, 20750.0, 41289.0, 83778.0, 172074.0, 295555.0, 207243.0, 100964.0, 49337.0, 24931.0, 12751.0, 6744.0, 3587.0, 2037.0, 1231.0, 717.0, 436.0, 299.0, 159.0, 128.0, 74.0, 57.0, 38.0, 28.0, 10.0, 18.0, 6.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.796875, -7.55792236328125, -7.3189697265625, -7.08001708984375, -6.841064453125, -6.60211181640625, -6.3631591796875, -6.12420654296875, -5.88525390625, -5.64630126953125, -5.4073486328125, -5.16839599609375, -4.929443359375, -4.69049072265625, -4.4515380859375, -4.21258544921875, -3.9736328125, -3.73468017578125, -3.4957275390625, -3.25677490234375, -3.017822265625, -2.77886962890625, -2.5399169921875, -2.30096435546875, -2.06201171875, -1.82305908203125, -1.5841064453125, -1.34515380859375, -1.106201171875, -0.86724853515625, -0.6282958984375, -0.38934326171875, -0.150390625, 0.08856201171875, 0.3275146484375, 0.56646728515625, 0.805419921875, 1.04437255859375, 1.2833251953125, 1.52227783203125, 1.76123046875, 2.00018310546875, 2.2391357421875, 2.47808837890625, 2.717041015625, 2.95599365234375, 3.1949462890625, 3.43389892578125, 3.6728515625, 3.91180419921875, 4.1507568359375, 4.38970947265625, 4.628662109375, 4.86761474609375, 5.1065673828125, 5.34552001953125, 5.58447265625, 5.82342529296875, 6.0623779296875, 6.30133056640625, 6.540283203125, 6.77923583984375, 7.0181884765625, 7.25714111328125, 7.49609375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 4.0, 9.0, 12.0, 15.0, 12.0, 24.0, 15.0, 23.0, 22.0, 21.0, 21.0, 23.0, 27.0, 33.0, 22.0, 36.0, 39.0, 28.0, 41.0, 51.0, 34.0, 38.0, 35.0, 33.0, 40.0, 23.0, 44.0, 32.0, 28.0, 21.0, 30.0, 31.0, 25.0, 16.0, 13.0, 9.0, 11.0, 9.0, 7.0, 8.0, 4.0, 5.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0], "bins": [-2.244140625, -2.1786956787109375, -2.113250732421875, -2.0478057861328125, -1.98236083984375, -1.9169158935546875, -1.851470947265625, -1.7860260009765625, -1.7205810546875, -1.6551361083984375, -1.589691162109375, -1.5242462158203125, -1.45880126953125, -1.3933563232421875, -1.327911376953125, -1.2624664306640625, -1.197021484375, -1.1315765380859375, -1.066131591796875, -1.0006866455078125, -0.93524169921875, -0.8697967529296875, -0.804351806640625, -0.7389068603515625, -0.6734619140625, -0.6080169677734375, -0.542572021484375, -0.4771270751953125, -0.41168212890625, -0.3462371826171875, -0.280792236328125, -0.2153472900390625, -0.14990234375, -0.0844573974609375, -0.019012451171875, 0.0464324951171875, 0.11187744140625, 0.1773223876953125, 0.242767333984375, 0.3082122802734375, 0.3736572265625, 0.4391021728515625, 0.504547119140625, 0.5699920654296875, 0.63543701171875, 0.7008819580078125, 0.766326904296875, 0.8317718505859375, 0.897216796875, 0.9626617431640625, 1.028106689453125, 1.0935516357421875, 1.15899658203125, 1.2244415283203125, 1.289886474609375, 1.3553314208984375, 1.4207763671875, 1.4862213134765625, 1.551666259765625, 1.6171112060546875, 1.68255615234375, 1.7480010986328125, 1.813446044921875, 1.8788909912109375, 1.9443359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 18.0, 32.0, 50.0, 56.0, 77.0, 133.0, 176.0, 252.0, 415.0, 592.0, 990.0, 1731.0, 3117.0, 6455.0, 16356.0, 60275.0, 777765.0, 133915.0, 26922.0, 9362.0, 4223.0, 2152.0, 1227.0, 749.0, 493.0, 303.0, 202.0, 154.0, 89.0, 72.0, 55.0, 28.0, 25.0, 17.0, 15.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.1029052734375, -10.729248046875, -10.3555908203125, -9.98193359375, -9.6082763671875, -9.234619140625, -8.8609619140625, -8.4873046875, -8.1136474609375, -7.739990234375, -7.3663330078125, -6.99267578125, -6.6190185546875, -6.245361328125, -5.8717041015625, -5.498046875, -5.1243896484375, -4.750732421875, -4.3770751953125, -4.00341796875, -3.6297607421875, -3.256103515625, -2.8824462890625, -2.5087890625, -2.1351318359375, -1.761474609375, -1.3878173828125, -1.01416015625, -0.6405029296875, -0.266845703125, 0.1068115234375, 0.48046875, 0.8541259765625, 1.227783203125, 1.6014404296875, 1.97509765625, 2.3487548828125, 2.722412109375, 3.0960693359375, 3.4697265625, 3.8433837890625, 4.217041015625, 4.5906982421875, 4.96435546875, 5.3380126953125, 5.711669921875, 6.0853271484375, 6.458984375, 6.8326416015625, 7.206298828125, 7.5799560546875, 7.95361328125, 8.3272705078125, 8.700927734375, 9.0745849609375, 9.4482421875, 9.8218994140625, 10.195556640625, 10.5692138671875, 10.94287109375, 11.3165283203125, 11.690185546875, 12.0638427734375, 12.4375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 7.0, 9.0, 15.0, 24.0, 35.0, 56.0, 121.0, 305.0, 178.0, 100.0, 54.0, 24.0, 26.0, 16.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.0002958327531814575, -0.0002855360507965088, -0.00027523934841156006, -0.00026494264602661133, -0.0002546459436416626, -0.00024434924125671387, -0.00023405253887176514, -0.0002237558364868164, -0.00021345913410186768, -0.00020316243171691895, -0.00019286572933197021, -0.00018256902694702148, -0.00017227232456207275, -0.00016197562217712402, -0.0001516789197921753, -0.00014138221740722656, -0.00013108551502227783, -0.0001207888126373291, -0.00011049211025238037, -0.00010019540786743164, -8.989870548248291e-05, -7.960200309753418e-05, -6.930530071258545e-05, -5.900859832763672e-05, -4.871189594268799e-05, -3.841519355773926e-05, -2.8118491172790527e-05, -1.7821788787841797e-05, -7.525086402893066e-06, 2.771615982055664e-06, 1.3068318367004395e-05, 2.3365020751953125e-05, 3.3661723136901855e-05, 4.3958425521850586e-05, 5.4255127906799316e-05, 6.455183029174805e-05, 7.484853267669678e-05, 8.514523506164551e-05, 9.544193744659424e-05, 0.00010573863983154297, 0.0001160353422164917, 0.00012633204460144043, 0.00013662874698638916, 0.0001469254493713379, 0.00015722215175628662, 0.00016751885414123535, 0.00017781555652618408, 0.0001881122589111328, 0.00019840896129608154, 0.00020870566368103027, 0.000219002366065979, 0.00022929906845092773, 0.00023959577083587646, 0.0002498924732208252, 0.0002601891756057739, 0.00027048587799072266, 0.0002807825803756714, 0.0002910792827606201, 0.00030137598514556885, 0.0003116726875305176, 0.0003219693899154663, 0.00033226609230041504, 0.00034256279468536377, 0.0003528594970703125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 5.0, 6.0, 10.0, 11.0, 17.0, 16.0, 21.0, 36.0, 41.0, 67.0, 90.0, 121.0, 171.0, 265.0, 360.0, 540.0, 854.0, 1313.0, 2226.0, 4006.0, 8235.0, 21063.0, 84566.0, 804702.0, 81216.0, 20488.0, 8088.0, 3926.0, 2159.0, 1303.0, 841.0, 551.0, 359.0, 265.0, 172.0, 114.0, 93.0, 68.0, 43.0, 39.0, 26.0, 23.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-11.1640625, -10.8204345703125, -10.476806640625, -10.1331787109375, -9.78955078125, -9.4459228515625, -9.102294921875, -8.7586669921875, -8.4150390625, -8.0714111328125, -7.727783203125, -7.3841552734375, -7.04052734375, -6.6968994140625, -6.353271484375, -6.0096435546875, -5.666015625, -5.3223876953125, -4.978759765625, -4.6351318359375, -4.29150390625, -3.9478759765625, -3.604248046875, -3.2606201171875, -2.9169921875, -2.5733642578125, -2.229736328125, -1.8861083984375, -1.54248046875, -1.1988525390625, -0.855224609375, -0.5115966796875, -0.16796875, 0.1756591796875, 0.519287109375, 0.8629150390625, 1.20654296875, 1.5501708984375, 1.893798828125, 2.2374267578125, 2.5810546875, 2.9246826171875, 3.268310546875, 3.6119384765625, 3.95556640625, 4.2991943359375, 4.642822265625, 4.9864501953125, 5.330078125, 5.6737060546875, 6.017333984375, 6.3609619140625, 6.70458984375, 7.0482177734375, 7.391845703125, 7.7354736328125, 8.0791015625, 8.4227294921875, 8.766357421875, 9.1099853515625, 9.45361328125, 9.7972412109375, 10.140869140625, 10.4844970703125, 10.828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 1.0, 3.0, 4.0, 6.0, 9.0, 12.0, 17.0, 23.0, 26.0, 36.0, 81.0, 122.0, 359.0, 99.0, 56.0, 40.0, 27.0, 23.0, 13.0, 10.0, 7.0, 2.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.533203125, -2.4521484375, -2.37109375, -2.2900390625, -2.208984375, -2.1279296875, -2.046875, -1.9658203125, -1.884765625, -1.8037109375, -1.72265625, -1.6416015625, -1.560546875, -1.4794921875, -1.3984375, -1.3173828125, -1.236328125, -1.1552734375, -1.07421875, -0.9931640625, -0.912109375, -0.8310546875, -0.75, -0.6689453125, -0.587890625, -0.5068359375, -0.42578125, -0.3447265625, -0.263671875, -0.1826171875, -0.1015625, -0.0205078125, 0.060546875, 0.1416015625, 0.22265625, 0.3037109375, 0.384765625, 0.4658203125, 0.546875, 0.6279296875, 0.708984375, 0.7900390625, 0.87109375, 0.9521484375, 1.033203125, 1.1142578125, 1.1953125, 1.2763671875, 1.357421875, 1.4384765625, 1.51953125, 1.6005859375, 1.681640625, 1.7626953125, 1.84375, 1.9248046875, 2.005859375, 2.0869140625, 2.16796875, 2.2490234375, 2.330078125, 2.4111328125, 2.4921875, 2.5732421875, 2.654296875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 13.0, 22.0, 41.0, 60.0, 120.0, 159.0, 186.0, 137.0, 72.0, 59.0, 33.0, 27.0, 20.0, 7.0, 9.0, 4.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.377165794372559, -5.079503059387207, -4.7818403244018555, -4.484177589416504, -4.186514854431152, -3.888852119445801, -3.591189384460449, -3.2935266494750977, -2.995863914489746, -2.6982011795043945, -2.400538444519043, -2.1028757095336914, -1.8052129745483398, -1.5075502395629883, -1.2098875045776367, -0.9122247695922852, -0.6145620346069336, -0.31689929962158203, -0.01923656463623047, 0.2784261703491211, 0.5760889053344727, 0.8737516403198242, 1.1714143753051758, 1.4690771102905273, 1.766739845275879, 2.0644025802612305, 2.362065315246582, 2.6597280502319336, 2.957390785217285, 3.2550535202026367, 3.5527162551879883, 3.85037899017334, 4.148042678833008, 4.445705413818359, 4.743368148803711, 5.0410308837890625, 5.338693618774414, 5.636356353759766, 5.934019088745117, 6.231681823730469, 6.52934455871582, 6.827007293701172, 7.124670028686523, 7.422332763671875, 7.719995498657227, 8.017658233642578, 8.31532096862793, 8.612983703613281, 8.910646438598633, 9.208309173583984, 9.505971908569336, 9.803634643554688, 10.101297378540039, 10.39896011352539, 10.696622848510742, 10.994285583496094, 11.291948318481445, 11.589611053466797, 11.887273788452148, 12.1849365234375, 12.482599258422852, 12.780261993408203, 13.077924728393555, 13.375587463378906, 13.673250198364258]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 2.0, 7.0, 5.0, 7.0, 14.0, 13.0, 15.0, 16.0, 14.0, 32.0, 19.0, 20.0, 30.0, 29.0, 35.0, 41.0, 34.0, 47.0, 34.0, 40.0, 40.0, 51.0, 39.0, 51.0, 43.0, 40.0, 38.0, 31.0, 38.0, 25.0, 27.0, 27.0, 12.0, 9.0, 12.0, 14.0, 14.0, 1.0, 7.0, 5.0, 8.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.248772621154785, -3.1344285011291504, -3.0200846195220947, -2.905740737915039, -2.7913966178894043, -2.6770524978637695, -2.562708616256714, -2.448364734649658, -2.3340206146240234, -2.2196764945983887, -2.105332612991333, -1.9909886121749878, -1.8766446113586426, -1.7623006105422974, -1.6479566097259521, -1.533612608909607, -1.4192686080932617, -1.3049246072769165, -1.1905806064605713, -1.076236605644226, -0.9618926048278809, -0.8475486040115356, -0.7332046031951904, -0.6188606023788452, -0.5045166015625, -0.3901726007461548, -0.27582859992980957, -0.16148459911346436, -0.04714059829711914, 0.06720340251922607, 0.1815474033355713, 0.2958914041519165, 0.4102354049682617, 0.5245794057846069, 0.6389234066009521, 0.7532674074172974, 0.8676114082336426, 0.9819554090499878, 1.096299409866333, 1.2106434106826782, 1.3249874114990234, 1.4393314123153687, 1.5536754131317139, 1.668019413948059, 1.7823634147644043, 1.8967074155807495, 2.0110514163970947, 2.1253952980041504, 2.239739418029785, 2.35408353805542, 2.4684274196624756, 2.5827713012695312, 2.697115421295166, 2.811459541320801, 2.9258034229278564, 3.040147304534912, 3.154491424560547, 3.2688355445861816, 3.3831794261932373, 3.497523307800293, 3.6118674278259277, 3.7262115478515625, 3.840555429458618, 3.954899311065674, 4.069243431091309]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 8.0, 15.0, 17.0, 33.0, 41.0, 63.0, 88.0, 139.0, 202.0, 316.0, 411.0, 713.0, 1027.0, 1658.0, 2669.0, 4215.0, 6921.0, 11487.0, 20376.0, 36816.0, 74607.0, 175661.0, 632498.0, 2116664.0, 742092.0, 196056.0, 80664.0, 38875.0, 20490.0, 11620.0, 6658.0, 4135.0, 2502.0, 1623.0, 1016.0, 643.0, 389.0, 301.0, 193.0, 128.0, 77.0, 54.0, 38.0, 31.0, 22.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.6953125, -6.50146484375, -6.3076171875, -6.11376953125, -5.919921875, -5.72607421875, -5.5322265625, -5.33837890625, -5.14453125, -4.95068359375, -4.7568359375, -4.56298828125, -4.369140625, -4.17529296875, -3.9814453125, -3.78759765625, -3.59375, -3.39990234375, -3.2060546875, -3.01220703125, -2.818359375, -2.62451171875, -2.4306640625, -2.23681640625, -2.04296875, -1.84912109375, -1.6552734375, -1.46142578125, -1.267578125, -1.07373046875, -0.8798828125, -0.68603515625, -0.4921875, -0.29833984375, -0.1044921875, 0.08935546875, 0.283203125, 0.47705078125, 0.6708984375, 0.86474609375, 1.05859375, 1.25244140625, 1.4462890625, 1.64013671875, 1.833984375, 2.02783203125, 2.2216796875, 2.41552734375, 2.609375, 2.80322265625, 2.9970703125, 3.19091796875, 3.384765625, 3.57861328125, 3.7724609375, 3.96630859375, 4.16015625, 4.35400390625, 4.5478515625, 4.74169921875, 4.935546875, 5.12939453125, 5.3232421875, 5.51708984375, 5.7109375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 5.0, 14.0, 22.0, 17.0, 17.0, 23.0, 30.0, 23.0, 31.0, 41.0, 40.0, 35.0, 41.0, 52.0, 49.0, 39.0, 53.0, 46.0, 44.0, 43.0, 37.0, 50.0, 29.0, 25.0, 30.0, 27.0, 24.0, 17.0, 11.0, 11.0, 10.0, 7.0, 7.0, 2.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.67578125, -2.600341796875, -2.52490234375, -2.449462890625, -2.3740234375, -2.298583984375, -2.22314453125, -2.147705078125, -2.072265625, -1.996826171875, -1.92138671875, -1.845947265625, -1.7705078125, -1.695068359375, -1.61962890625, -1.544189453125, -1.46875, -1.393310546875, -1.31787109375, -1.242431640625, -1.1669921875, -1.091552734375, -1.01611328125, -0.940673828125, -0.865234375, -0.789794921875, -0.71435546875, -0.638916015625, -0.5634765625, -0.488037109375, -0.41259765625, -0.337158203125, -0.26171875, -0.186279296875, -0.11083984375, -0.035400390625, 0.0400390625, 0.115478515625, 0.19091796875, 0.266357421875, 0.341796875, 0.417236328125, 0.49267578125, 0.568115234375, 0.6435546875, 0.718994140625, 0.79443359375, 0.869873046875, 0.9453125, 1.020751953125, 1.09619140625, 1.171630859375, 1.2470703125, 1.322509765625, 1.39794921875, 1.473388671875, 1.548828125, 1.624267578125, 1.69970703125, 1.775146484375, 1.8505859375, 1.926025390625, 2.00146484375, 2.076904296875, 2.15234375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 12.0, 14.0, 18.0, 34.0, 40.0, 58.0, 91.0, 110.0, 194.0, 238.0, 436.0, 604.0, 897.0, 1510.0, 2200.0, 3573.0, 5762.0, 9699.0, 16913.0, 30061.0, 57047.0, 117297.0, 266404.0, 745635.0, 1747531.0, 697479.0, 253853.0, 111934.0, 54600.0, 28903.0, 16219.0, 9496.0, 5660.0, 3467.0, 2155.0, 1440.0, 852.0, 639.0, 399.0, 254.0, 166.0, 113.0, 71.0, 68.0, 39.0, 30.0, 17.0, 17.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0], "bins": [-4.93359375, -4.78619384765625, -4.6387939453125, -4.49139404296875, -4.343994140625, -4.19659423828125, -4.0491943359375, -3.90179443359375, -3.75439453125, -3.60699462890625, -3.4595947265625, -3.31219482421875, -3.164794921875, -3.01739501953125, -2.8699951171875, -2.72259521484375, -2.5751953125, -2.42779541015625, -2.2803955078125, -2.13299560546875, -1.985595703125, -1.83819580078125, -1.6907958984375, -1.54339599609375, -1.39599609375, -1.24859619140625, -1.1011962890625, -0.95379638671875, -0.806396484375, -0.65899658203125, -0.5115966796875, -0.36419677734375, -0.216796875, -0.06939697265625, 0.0780029296875, 0.22540283203125, 0.372802734375, 0.52020263671875, 0.6676025390625, 0.81500244140625, 0.96240234375, 1.10980224609375, 1.2572021484375, 1.40460205078125, 1.552001953125, 1.69940185546875, 1.8468017578125, 1.99420166015625, 2.1416015625, 2.28900146484375, 2.4364013671875, 2.58380126953125, 2.731201171875, 2.87860107421875, 3.0260009765625, 3.17340087890625, 3.32080078125, 3.46820068359375, 3.6156005859375, 3.76300048828125, 3.910400390625, 4.05780029296875, 4.2052001953125, 4.35260009765625, 4.5]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 6.0, 8.0, 12.0, 11.0, 15.0, 21.0, 27.0, 25.0, 57.0, 64.0, 77.0, 86.0, 112.0, 131.0, 152.0, 194.0, 215.0, 235.0, 304.0, 317.0, 344.0, 329.0, 250.0, 198.0, 150.0, 153.0, 103.0, 84.0, 76.0, 68.0, 45.0, 34.0, 45.0, 31.0, 16.0, 17.0, 7.0, 13.0, 9.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.11248779296875, -1.0726318359375, -1.03277587890625, -0.992919921875, -0.95306396484375, -0.9132080078125, -0.87335205078125, -0.83349609375, -0.79364013671875, -0.7537841796875, -0.71392822265625, -0.674072265625, -0.63421630859375, -0.5943603515625, -0.55450439453125, -0.5146484375, -0.47479248046875, -0.4349365234375, -0.39508056640625, -0.355224609375, -0.31536865234375, -0.2755126953125, -0.23565673828125, -0.19580078125, -0.15594482421875, -0.1160888671875, -0.07623291015625, -0.036376953125, 0.00347900390625, 0.0433349609375, 0.08319091796875, 0.123046875, 0.16290283203125, 0.2027587890625, 0.24261474609375, 0.282470703125, 0.32232666015625, 0.3621826171875, 0.40203857421875, 0.44189453125, 0.48175048828125, 0.5216064453125, 0.56146240234375, 0.601318359375, 0.64117431640625, 0.6810302734375, 0.72088623046875, 0.7607421875, 0.80059814453125, 0.8404541015625, 0.88031005859375, 0.920166015625, 0.96002197265625, 0.9998779296875, 1.03973388671875, 1.07958984375, 1.11944580078125, 1.1593017578125, 1.19915771484375, 1.239013671875, 1.27886962890625, 1.3187255859375, 1.35858154296875, 1.3984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 10.0, 8.0, 12.0, 25.0, 34.0, 53.0, 77.0, 124.0, 158.0, 149.0, 114.0, 75.0, 45.0, 31.0, 24.0, 21.0, 10.0, 10.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.053717136383057, -6.863794803619385, -6.673872947692871, -6.483950614929199, -6.2940287590026855, -6.104106426239014, -5.9141845703125, -5.724262237548828, -5.534339904785156, -5.344417572021484, -5.154495716094971, -4.964573383331299, -4.774651527404785, -4.584729194641113, -4.394806861877441, -4.204885005950928, -4.014963150024414, -3.8250410556793213, -3.6351189613342285, -3.4451966285705566, -3.255274772644043, -3.065352439880371, -2.8754303455352783, -2.6855082511901855, -2.4955861568450928, -2.3056640625, -2.1157419681549072, -1.925819754600525, -1.7358976602554321, -1.5459755659103394, -1.356053352355957, -1.1661312580108643, -0.9762091636657715, -0.7862870693206787, -0.5963649153709412, -0.4064427614212036, -0.21652066707611084, -0.026598572731018066, 0.16332364082336426, 0.35324573516845703, 0.5431678295135498, 0.7330899238586426, 0.9230120778083801, 1.1129342317581177, 1.3028563261032104, 1.4927784204483032, 1.6827006340026855, 1.8726227283477783, 2.062544822692871, 2.252466917037964, 2.4423890113830566, 2.6323113441467285, 2.822233200073242, 3.012155532836914, 3.202077627182007, 3.3919997215270996, 3.5819218158721924, 3.771843910217285, 3.961766004562378, 4.151688098907471, 4.341610431671143, 4.531532287597656, 4.721454620361328, 4.911376953125, 5.101298809051514]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 15.0, 8.0, 8.0, 14.0, 17.0, 13.0, 19.0, 28.0, 30.0, 26.0, 28.0, 30.0, 35.0, 27.0, 38.0, 44.0, 33.0, 36.0, 45.0, 46.0, 43.0, 39.0, 40.0, 38.0, 29.0, 40.0, 34.0, 25.0, 29.0, 21.0, 21.0, 12.0, 12.0, 12.0, 4.0, 15.0, 7.0, 4.0, 3.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31754469871521, -2.241307258605957, -2.165070056915283, -2.0888326168060303, -2.0125951766967773, -1.9363579750061035, -1.8601205348968506, -1.7838832139968872, -1.7076458930969238, -1.6314085721969604, -1.555171251296997, -1.4789338111877441, -1.4026964902877808, -1.3264591693878174, -1.2502217292785645, -1.173984408378601, -1.0977470874786377, -1.0215097665786743, -0.9452723860740662, -0.869035005569458, -0.7927976846694946, -0.7165603637695312, -0.6403229832649231, -0.5640856027603149, -0.48784828186035156, -0.4116109311580658, -0.33537358045578003, -0.25913622975349426, -0.1828988790512085, -0.10666152834892273, -0.030424177646636963, 0.04581320285797119, 0.12205052375793457, 0.19828787446022034, 0.2745252251625061, 0.35076257586479187, 0.42699992656707764, 0.503237247467041, 0.5794746279716492, 0.6557120084762573, 0.7319493293762207, 0.8081866502761841, 0.8844240307807922, 0.9606614112854004, 1.0368987321853638, 1.1131360530853271, 1.18937349319458, 1.2656108140945435, 1.3418481349945068, 1.4180854558944702, 1.4943227767944336, 1.5705602169036865, 1.64679753780365, 1.7230348587036133, 1.7992722988128662, 1.8755096197128296, 1.951746940612793, 2.027984380722046, 2.1042215824127197, 2.1804590225219727, 2.2566962242126465, 2.3329336643218994, 2.4091711044311523, 2.485408306121826, 2.561645746231079]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 11.0, 16.0, 19.0, 24.0, 44.0, 58.0, 77.0, 92.0, 152.0, 250.0, 339.0, 549.0, 779.0, 1351.0, 1980.0, 3221.0, 5475.0, 9138.0, 16416.0, 31873.0, 72559.0, 262830.0, 451730.0, 101038.0, 40548.0, 20026.0, 11031.0, 6502.0, 3812.0, 2358.0, 1447.0, 926.0, 601.0, 396.0, 277.0, 187.0, 130.0, 88.0, 60.0, 47.0, 24.0, 13.0, 20.0, 6.0, 5.0, 6.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0], "bins": [-3.888671875, -3.77484130859375, -3.6610107421875, -3.54718017578125, -3.433349609375, -3.31951904296875, -3.2056884765625, -3.09185791015625, -2.97802734375, -2.86419677734375, -2.7503662109375, -2.63653564453125, -2.522705078125, -2.40887451171875, -2.2950439453125, -2.18121337890625, -2.0673828125, -1.95355224609375, -1.8397216796875, -1.72589111328125, -1.612060546875, -1.49822998046875, -1.3843994140625, -1.27056884765625, -1.15673828125, -1.04290771484375, -0.9290771484375, -0.81524658203125, -0.701416015625, -0.58758544921875, -0.4737548828125, -0.35992431640625, -0.24609375, -0.13226318359375, -0.0184326171875, 0.09539794921875, 0.209228515625, 0.32305908203125, 0.4368896484375, 0.55072021484375, 0.66455078125, 0.77838134765625, 0.8922119140625, 1.00604248046875, 1.119873046875, 1.23370361328125, 1.3475341796875, 1.46136474609375, 1.5751953125, 1.68902587890625, 1.8028564453125, 1.91668701171875, 2.030517578125, 2.14434814453125, 2.2581787109375, 2.37200927734375, 2.48583984375, 2.59967041015625, 2.7135009765625, 2.82733154296875, 2.941162109375, 3.05499267578125, 3.1688232421875, 3.28265380859375, 3.396484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 5.0, 8.0, 8.0, 15.0, 12.0, 17.0, 14.0, 22.0, 26.0, 22.0, 23.0, 36.0, 38.0, 35.0, 32.0, 45.0, 47.0, 46.0, 55.0, 39.0, 42.0, 43.0, 45.0, 40.0, 40.0, 41.0, 35.0, 30.0, 18.0, 18.0, 13.0, 13.0, 17.0, 11.0, 7.0, 6.0, 5.0, 3.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.642578125, -2.5592041015625, -2.475830078125, -2.3924560546875, -2.30908203125, -2.2257080078125, -2.142333984375, -2.0589599609375, -1.9755859375, -1.8922119140625, -1.808837890625, -1.7254638671875, -1.64208984375, -1.5587158203125, -1.475341796875, -1.3919677734375, -1.30859375, -1.2252197265625, -1.141845703125, -1.0584716796875, -0.97509765625, -0.8917236328125, -0.808349609375, -0.7249755859375, -0.6416015625, -0.5582275390625, -0.474853515625, -0.3914794921875, -0.30810546875, -0.2247314453125, -0.141357421875, -0.0579833984375, 0.025390625, 0.1087646484375, 0.192138671875, 0.2755126953125, 0.35888671875, 0.4422607421875, 0.525634765625, 0.6090087890625, 0.6923828125, 0.7757568359375, 0.859130859375, 0.9425048828125, 1.02587890625, 1.1092529296875, 1.192626953125, 1.2760009765625, 1.359375, 1.4427490234375, 1.526123046875, 1.6094970703125, 1.69287109375, 1.7762451171875, 1.859619140625, 1.9429931640625, 2.0263671875, 2.1097412109375, 2.193115234375, 2.2764892578125, 2.35986328125, 2.4432373046875, 2.526611328125, 2.6099853515625, 2.693359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 15.0, 5.0, 15.0, 14.0, 14.0, 36.0, 52.0, 49.0, 72.0, 109.0, 145.0, 171.0, 299.0, 395.0, 569.0, 842.0, 1129.0, 1825.0, 2834.0, 4808.0, 8978.0, 18834.0, 58930.0, 739252.0, 150877.0, 29333.0, 12249.0, 6250.0, 3568.0, 2200.0, 1387.0, 973.0, 635.0, 467.0, 377.0, 205.0, 176.0, 139.0, 91.0, 59.0, 42.0, 47.0, 29.0, 17.0, 8.0, 10.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-5.86328125, -5.678466796875, -5.49365234375, -5.308837890625, -5.1240234375, -4.939208984375, -4.75439453125, -4.569580078125, -4.384765625, -4.199951171875, -4.01513671875, -3.830322265625, -3.6455078125, -3.460693359375, -3.27587890625, -3.091064453125, -2.90625, -2.721435546875, -2.53662109375, -2.351806640625, -2.1669921875, -1.982177734375, -1.79736328125, -1.612548828125, -1.427734375, -1.242919921875, -1.05810546875, -0.873291015625, -0.6884765625, -0.503662109375, -0.31884765625, -0.134033203125, 0.05078125, 0.235595703125, 0.42041015625, 0.605224609375, 0.7900390625, 0.974853515625, 1.15966796875, 1.344482421875, 1.529296875, 1.714111328125, 1.89892578125, 2.083740234375, 2.2685546875, 2.453369140625, 2.63818359375, 2.822998046875, 3.0078125, 3.192626953125, 3.37744140625, 3.562255859375, 3.7470703125, 3.931884765625, 4.11669921875, 4.301513671875, 4.486328125, 4.671142578125, 4.85595703125, 5.040771484375, 5.2255859375, 5.410400390625, 5.59521484375, 5.780029296875, 5.96484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 14.0, 8.0, 14.0, 12.0, 20.0, 16.0, 32.0, 25.0, 18.0, 28.0, 27.0, 44.0, 33.0, 38.0, 37.0, 38.0, 32.0, 45.0, 49.0, 37.0, 29.0, 38.0, 33.0, 34.0, 32.0, 23.0, 23.0, 29.0, 36.0, 23.0, 19.0, 12.0, 12.0, 13.0, 12.0, 12.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5732421875, -1.5205841064453125, -1.467926025390625, -1.4152679443359375, -1.36260986328125, -1.3099517822265625, -1.257293701171875, -1.2046356201171875, -1.1519775390625, -1.0993194580078125, -1.046661376953125, -0.9940032958984375, -0.94134521484375, -0.8886871337890625, -0.836029052734375, -0.7833709716796875, -0.730712890625, -0.6780548095703125, -0.625396728515625, -0.5727386474609375, -0.52008056640625, -0.4674224853515625, -0.414764404296875, -0.3621063232421875, -0.3094482421875, -0.2567901611328125, -0.204132080078125, -0.1514739990234375, -0.09881591796875, -0.0461578369140625, 0.006500244140625, 0.0591583251953125, 0.11181640625, 0.1644744873046875, 0.217132568359375, 0.2697906494140625, 0.32244873046875, 0.3751068115234375, 0.427764892578125, 0.4804229736328125, 0.5330810546875, 0.5857391357421875, 0.638397216796875, 0.6910552978515625, 0.74371337890625, 0.7963714599609375, 0.849029541015625, 0.9016876220703125, 0.954345703125, 1.0070037841796875, 1.059661865234375, 1.1123199462890625, 1.16497802734375, 1.2176361083984375, 1.270294189453125, 1.3229522705078125, 1.3756103515625, 1.4282684326171875, 1.480926513671875, 1.5335845947265625, 1.58624267578125, 1.6389007568359375, 1.691558837890625, 1.7442169189453125, 1.796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 6.0, 1.0, 5.0, 6.0, 17.0, 19.0, 14.0, 26.0, 49.0, 61.0, 67.0, 129.0, 150.0, 201.0, 288.0, 439.0, 644.0, 1005.0, 1618.0, 2803.0, 5081.0, 10755.0, 27764.0, 132835.0, 755937.0, 70173.0, 19665.0, 8215.0, 4175.0, 2313.0, 1359.0, 862.0, 569.0, 359.0, 259.0, 170.0, 134.0, 102.0, 59.0, 56.0, 55.0, 26.0, 16.0, 18.0, 14.0, 20.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.328125, -1.2882843017578125, -1.248443603515625, -1.2086029052734375, -1.16876220703125, -1.1289215087890625, -1.089080810546875, -1.0492401123046875, -1.0093994140625, -0.9695587158203125, -0.929718017578125, -0.8898773193359375, -0.85003662109375, -0.8101959228515625, -0.770355224609375, -0.7305145263671875, -0.690673828125, -0.6508331298828125, -0.610992431640625, -0.5711517333984375, -0.53131103515625, -0.4914703369140625, -0.451629638671875, -0.4117889404296875, -0.3719482421875, -0.3321075439453125, -0.292266845703125, -0.2524261474609375, -0.21258544921875, -0.1727447509765625, -0.132904052734375, -0.0930633544921875, -0.05322265625, -0.0133819580078125, 0.026458740234375, 0.0662994384765625, 0.10614013671875, 0.1459808349609375, 0.185821533203125, 0.2256622314453125, 0.2655029296875, 0.3053436279296875, 0.345184326171875, 0.3850250244140625, 0.42486572265625, 0.4647064208984375, 0.504547119140625, 0.5443878173828125, 0.584228515625, 0.6240692138671875, 0.663909912109375, 0.7037506103515625, 0.74359130859375, 0.7834320068359375, 0.823272705078125, 0.8631134033203125, 0.9029541015625, 0.9427947998046875, 0.982635498046875, 1.0224761962890625, 1.06231689453125, 1.1021575927734375, 1.141998291015625, 1.1818389892578125, 1.2216796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 7.0, 4.0, 15.0, 11.0, 13.0, 18.0, 28.0, 59.0, 69.0, 102.0, 128.0, 174.0, 138.0, 85.0, 42.0, 32.0, 27.0, 24.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-05, -4.260055720806122e-05, -4.049763083457947e-05, -3.839470446109772e-05, -3.629177808761597e-05, -3.4188851714134216e-05, -3.2085925340652466e-05, -2.9982998967170715e-05, -2.7880072593688965e-05, -2.5777146220207214e-05, -2.3674219846725464e-05, -2.1571293473243713e-05, -1.9468367099761963e-05, -1.7365440726280212e-05, -1.5262514352798462e-05, -1.3159587979316711e-05, -1.1056661605834961e-05, -8.95373523235321e-06, -6.85080885887146e-06, -4.7478824853897095e-06, -2.644956111907959e-06, -5.420297384262085e-07, 1.560896635055542e-06, 3.6638230085372925e-06, 5.766749382019043e-06, 7.869675755500793e-06, 9.972602128982544e-06, 1.2075528502464294e-05, 1.4178454875946045e-05, 1.6281381249427795e-05, 1.8384307622909546e-05, 2.0487233996391296e-05, 2.2590160369873047e-05, 2.4693086743354797e-05, 2.6796013116836548e-05, 2.88989394903183e-05, 3.100186586380005e-05, 3.31047922372818e-05, 3.520771861076355e-05, 3.73106449842453e-05, 3.941357135772705e-05, 4.15164977312088e-05, 4.361942410469055e-05, 4.57223504781723e-05, 4.782527685165405e-05, 4.99282032251358e-05, 5.2031129598617554e-05, 5.4134055972099304e-05, 5.6236982345581055e-05, 5.8339908719062805e-05, 6.0442835092544556e-05, 6.25457614660263e-05, 6.464868783950806e-05, 6.675161421298981e-05, 6.885454058647156e-05, 7.095746695995331e-05, 7.306039333343506e-05, 7.516331970691681e-05, 7.726624608039856e-05, 7.936917245388031e-05, 8.147209882736206e-05, 8.357502520084381e-05, 8.567795157432556e-05, 8.778087794780731e-05, 8.988380432128906e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 12.0, 12.0, 18.0, 37.0, 48.0, 56.0, 104.0, 128.0, 181.0, 309.0, 400.0, 615.0, 1037.0, 1663.0, 2752.0, 5009.0, 9841.0, 21180.0, 54558.0, 208490.0, 569720.0, 105692.0, 34855.0, 14618.0, 7335.0, 3790.0, 2238.0, 1331.0, 868.0, 543.0, 359.0, 244.0, 146.0, 94.0, 85.0, 49.0, 41.0, 33.0, 20.0, 12.0, 4.0, 6.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.16796875, -1.1338958740234375, -1.099822998046875, -1.0657501220703125, -1.03167724609375, -0.9976043701171875, -0.963531494140625, -0.9294586181640625, -0.8953857421875, -0.8613128662109375, -0.827239990234375, -0.7931671142578125, -0.75909423828125, -0.7250213623046875, -0.690948486328125, -0.6568756103515625, -0.622802734375, -0.5887298583984375, -0.554656982421875, -0.5205841064453125, -0.48651123046875, -0.4524383544921875, -0.418365478515625, -0.3842926025390625, -0.3502197265625, -0.3161468505859375, -0.282073974609375, -0.2480010986328125, -0.21392822265625, -0.1798553466796875, -0.145782470703125, -0.1117095947265625, -0.07763671875, -0.0435638427734375, -0.009490966796875, 0.0245819091796875, 0.05865478515625, 0.0927276611328125, 0.126800537109375, 0.1608734130859375, 0.1949462890625, 0.2290191650390625, 0.263092041015625, 0.2971649169921875, 0.33123779296875, 0.3653106689453125, 0.399383544921875, 0.4334564208984375, 0.467529296875, 0.5016021728515625, 0.535675048828125, 0.5697479248046875, 0.60382080078125, 0.6378936767578125, 0.671966552734375, 0.7060394287109375, 0.7401123046875, 0.7741851806640625, 0.808258056640625, 0.8423309326171875, 0.87640380859375, 0.9104766845703125, 0.944549560546875, 0.9786224365234375, 1.0126953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 5.0, 11.0, 21.0, 17.0, 33.0, 42.0, 54.0, 70.0, 90.0, 122.0, 118.0, 114.0, 78.0, 50.0, 41.0, 29.0, 22.0, 9.0, 11.0, 9.0, 11.0, 5.0, 5.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.237060546875, -0.22910308837890625, -0.2211456298828125, -0.21318817138671875, -0.205230712890625, -0.19727325439453125, -0.1893157958984375, -0.18135833740234375, -0.17340087890625, -0.16544342041015625, -0.1574859619140625, -0.14952850341796875, -0.141571044921875, -0.13361358642578125, -0.1256561279296875, -0.11769866943359375, -0.1097412109375, -0.10178375244140625, -0.0938262939453125, -0.08586883544921875, -0.077911376953125, -0.06995391845703125, -0.0619964599609375, -0.05403900146484375, -0.04608154296875, -0.03812408447265625, -0.0301666259765625, -0.02220916748046875, -0.014251708984375, -0.00629425048828125, 0.0016632080078125, 0.00962066650390625, 0.017578125, 0.02553558349609375, 0.0334930419921875, 0.04145050048828125, 0.049407958984375, 0.05736541748046875, 0.0653228759765625, 0.07328033447265625, 0.08123779296875, 0.08919525146484375, 0.0971527099609375, 0.10511016845703125, 0.113067626953125, 0.12102508544921875, 0.1289825439453125, 0.13694000244140625, 0.1448974609375, 0.15285491943359375, 0.1608123779296875, 0.16876983642578125, 0.176727294921875, 0.18468475341796875, 0.1926422119140625, 0.20059967041015625, 0.20855712890625, 0.21651458740234375, 0.2244720458984375, 0.23242950439453125, 0.240386962890625, 0.24834442138671875, 0.2563018798828125, 0.26425933837890625, 0.272216796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 11.0, 13.0, 14.0, 28.0, 30.0, 48.0, 69.0, 119.0, 151.0, 138.0, 119.0, 80.0, 41.0, 40.0, 26.0, 18.0, 15.0, 14.0, 12.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.450377464294434, -6.27675724029541, -6.103137016296387, -5.9295172691345215, -5.755897045135498, -5.582276821136475, -5.408657073974609, -5.235036849975586, -5.0614166259765625, -4.887796401977539, -4.714176177978516, -4.54055643081665, -4.366936206817627, -4.1933159828186035, -4.019696235656738, -3.846076011657715, -3.6724557876586914, -3.498835563659668, -3.3252155780792236, -3.1515955924987793, -2.977975368499756, -2.8043551445007324, -2.630735158920288, -2.4571151733398438, -2.2834949493408203, -2.109874725341797, -1.9362547397613525, -1.7626346349716187, -1.5890145301818848, -1.4153944253921509, -1.241774320602417, -1.068154215812683, -0.8945345878601074, -0.7209144830703735, -0.5472943782806396, -0.37367427349090576, -0.20005416870117188, -0.02643406391143799, 0.1471860408782959, 0.3208061456680298, 0.49442625045776367, 0.6680463552474976, 0.8416664600372314, 1.0152865648269653, 1.1889066696166992, 1.362526774406433, 1.536146879196167, 1.7097669839859009, 1.8833870887756348, 2.057007312774658, 2.2306272983551025, 2.404247283935547, 2.5778675079345703, 2.7514877319335938, 2.925107717514038, 3.0987277030944824, 3.272347927093506, 3.4459681510925293, 3.6195881366729736, 3.793208122253418, 3.9668283462524414, 4.140448570251465, 4.314068794250488, 4.4876885414123535, 4.661308765411377]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 3.0, 5.0, 12.0, 8.0, 9.0, 12.0, 17.0, 15.0, 18.0, 24.0, 27.0, 32.0, 28.0, 29.0, 33.0, 34.0, 40.0, 31.0, 41.0, 34.0, 44.0, 37.0, 54.0, 39.0, 34.0, 39.0, 33.0, 32.0, 41.0, 24.0, 35.0, 23.0, 11.0, 12.0, 20.0, 8.0, 10.0, 10.0, 6.0, 5.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28342342376709, -2.2087173461914062, -2.1340110301971436, -2.05930495262146, -1.9845988750457764, -1.9098926782608032, -1.83518648147583, -1.7604804039001465, -1.6857742071151733, -1.6110680103302002, -1.5363619327545166, -1.4616557359695435, -1.3869495391845703, -1.3122434616088867, -1.2375372648239136, -1.1628310680389404, -1.0881249904632568, -1.0134187936782837, -0.9387127161026001, -0.864006519317627, -0.7893003821372986, -0.7145942449569702, -0.6398880481719971, -0.5651819109916687, -0.49047577381134033, -0.41576963663101196, -0.3410634696483612, -0.26635730266571045, -0.19165116548538208, -0.11694502830505371, -0.042238861322402954, 0.0324673056602478, 0.10717320442199707, 0.18187935650348663, 0.2565855085849762, 0.33129167556762695, 0.4059978127479553, 0.4807039499282837, 0.5554101467132568, 0.6301162838935852, 0.7048224210739136, 0.7795285582542419, 0.8542346954345703, 0.9289408922195435, 1.0036470890045166, 1.0783531665802002, 1.1530593633651733, 1.2277655601501465, 1.30247163772583, 1.3771778345108032, 1.4518839120864868, 1.52659010887146, 1.6012961864471436, 1.6760023832321167, 1.7507085800170898, 1.8254146575927734, 1.9001208543777466, 1.9748270511627197, 2.0495331287384033, 2.124239206314087, 2.1989455223083496, 2.273651599884033, 2.348357677459717, 2.4230639934539795, 2.497770071029663]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 6.0, 2.0, 9.0, 7.0, 23.0, 24.0, 36.0, 55.0, 56.0, 77.0, 129.0, 185.0, 271.0, 354.0, 523.0, 770.0, 1065.0, 1584.0, 2437.0, 3689.0, 5731.0, 8922.0, 14402.0, 22952.0, 38425.0, 65665.0, 113985.0, 192815.0, 223383.0, 143831.0, 81873.0, 47973.0, 28683.0, 17495.0, 10898.0, 6904.0, 4476.0, 2861.0, 1923.0, 1282.0, 811.0, 569.0, 414.0, 287.0, 194.0, 144.0, 101.0, 94.0, 46.0, 34.0, 24.0, 21.0, 13.0, 10.0, 8.0, 2.0, 6.0, 6.0, 1.0, 1.0], "bins": [-3.921875, -3.80010986328125, -3.6783447265625, -3.55657958984375, -3.434814453125, -3.31304931640625, -3.1912841796875, -3.06951904296875, -2.94775390625, -2.82598876953125, -2.7042236328125, -2.58245849609375, -2.460693359375, -2.33892822265625, -2.2171630859375, -2.09539794921875, -1.9736328125, -1.85186767578125, -1.7301025390625, -1.60833740234375, -1.486572265625, -1.36480712890625, -1.2430419921875, -1.12127685546875, -0.99951171875, -0.87774658203125, -0.7559814453125, -0.63421630859375, -0.512451171875, -0.39068603515625, -0.2689208984375, -0.14715576171875, -0.025390625, 0.09637451171875, 0.2181396484375, 0.33990478515625, 0.461669921875, 0.58343505859375, 0.7052001953125, 0.82696533203125, 0.94873046875, 1.07049560546875, 1.1922607421875, 1.31402587890625, 1.435791015625, 1.55755615234375, 1.6793212890625, 1.80108642578125, 1.9228515625, 2.04461669921875, 2.1663818359375, 2.28814697265625, 2.409912109375, 2.53167724609375, 2.6534423828125, 2.77520751953125, 2.89697265625, 3.01873779296875, 3.1405029296875, 3.26226806640625, 3.384033203125, 3.50579833984375, 3.6275634765625, 3.74932861328125, 3.87109375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 8.0, 9.0, 11.0, 11.0, 17.0, 20.0, 25.0, 23.0, 28.0, 36.0, 41.0, 36.0, 34.0, 35.0, 38.0, 44.0, 32.0, 41.0, 47.0, 44.0, 32.0, 49.0, 52.0, 34.0, 38.0, 26.0, 29.0, 22.0, 16.0, 12.0, 18.0, 11.0, 8.0, 8.0, 10.0, 10.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.23828125, -2.168792724609375, -2.09930419921875, -2.029815673828125, -1.9603271484375, -1.890838623046875, -1.82135009765625, -1.751861572265625, -1.682373046875, -1.612884521484375, -1.54339599609375, -1.473907470703125, -1.4044189453125, -1.334930419921875, -1.26544189453125, -1.195953369140625, -1.12646484375, -1.056976318359375, -0.98748779296875, -0.917999267578125, -0.8485107421875, -0.779022216796875, -0.70953369140625, -0.640045166015625, -0.570556640625, -0.501068115234375, -0.43157958984375, -0.362091064453125, -0.2926025390625, -0.223114013671875, -0.15362548828125, -0.084136962890625, -0.0146484375, 0.054840087890625, 0.12432861328125, 0.193817138671875, 0.2633056640625, 0.332794189453125, 0.40228271484375, 0.471771240234375, 0.541259765625, 0.610748291015625, 0.68023681640625, 0.749725341796875, 0.8192138671875, 0.888702392578125, 0.95819091796875, 1.027679443359375, 1.09716796875, 1.166656494140625, 1.23614501953125, 1.305633544921875, 1.3751220703125, 1.444610595703125, 1.51409912109375, 1.583587646484375, 1.653076171875, 1.722564697265625, 1.79205322265625, 1.861541748046875, 1.9310302734375, 2.000518798828125, 2.07000732421875, 2.139495849609375, 2.208984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 11.0, 9.0, 16.0, 17.0, 25.0, 36.0, 54.0, 65.0, 102.0, 175.0, 247.0, 393.0, 618.0, 936.0, 1416.0, 2538.0, 4031.0, 6802.0, 12251.0, 21592.0, 38907.0, 71254.0, 130336.0, 231435.0, 231674.0, 131157.0, 71723.0, 39217.0, 21757.0, 12080.0, 6931.0, 4150.0, 2465.0, 1532.0, 898.0, 587.0, 353.0, 254.0, 158.0, 120.0, 80.0, 50.0, 35.0, 14.0, 22.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-4.5234375, -4.390411376953125, -4.25738525390625, -4.124359130859375, -3.9913330078125, -3.858306884765625, -3.72528076171875, -3.592254638671875, -3.459228515625, -3.326202392578125, -3.19317626953125, -3.060150146484375, -2.9271240234375, -2.794097900390625, -2.66107177734375, -2.528045654296875, -2.39501953125, -2.261993408203125, -2.12896728515625, -1.995941162109375, -1.8629150390625, -1.729888916015625, -1.59686279296875, -1.463836669921875, -1.330810546875, -1.197784423828125, -1.06475830078125, -0.931732177734375, -0.7987060546875, -0.665679931640625, -0.53265380859375, -0.399627685546875, -0.2666015625, -0.133575439453125, -0.00054931640625, 0.132476806640625, 0.2655029296875, 0.398529052734375, 0.53155517578125, 0.664581298828125, 0.797607421875, 0.930633544921875, 1.06365966796875, 1.196685791015625, 1.3297119140625, 1.462738037109375, 1.59576416015625, 1.728790283203125, 1.86181640625, 1.994842529296875, 2.12786865234375, 2.260894775390625, 2.3939208984375, 2.526947021484375, 2.65997314453125, 2.792999267578125, 2.926025390625, 3.059051513671875, 3.19207763671875, 3.325103759765625, 3.4581298828125, 3.591156005859375, 3.72418212890625, 3.857208251953125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 12.0, 13.0, 14.0, 10.0, 20.0, 21.0, 20.0, 26.0, 31.0, 25.0, 30.0, 28.0, 47.0, 41.0, 47.0, 59.0, 42.0, 43.0, 36.0, 52.0, 40.0, 52.0, 36.0, 32.0, 31.0, 31.0, 30.0, 19.0, 23.0, 15.0, 16.0, 6.0, 9.0, 9.0, 6.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-1.826171875, -1.7763519287109375, -1.726531982421875, -1.6767120361328125, -1.62689208984375, -1.5770721435546875, -1.527252197265625, -1.4774322509765625, -1.4276123046875, -1.3777923583984375, -1.327972412109375, -1.2781524658203125, -1.22833251953125, -1.1785125732421875, -1.128692626953125, -1.0788726806640625, -1.029052734375, -0.9792327880859375, -0.929412841796875, -0.8795928955078125, -0.82977294921875, -0.7799530029296875, -0.730133056640625, -0.6803131103515625, -0.6304931640625, -0.5806732177734375, -0.530853271484375, -0.4810333251953125, -0.43121337890625, -0.3813934326171875, -0.331573486328125, -0.2817535400390625, -0.23193359375, -0.1821136474609375, -0.132293701171875, -0.0824737548828125, -0.03265380859375, 0.0171661376953125, 0.066986083984375, 0.1168060302734375, 0.1666259765625, 0.2164459228515625, 0.266265869140625, 0.3160858154296875, 0.36590576171875, 0.4157257080078125, 0.465545654296875, 0.5153656005859375, 0.565185546875, 0.6150054931640625, 0.664825439453125, 0.7146453857421875, 0.76446533203125, 0.8142852783203125, 0.864105224609375, 0.9139251708984375, 0.9637451171875, 1.0135650634765625, 1.063385009765625, 1.1132049560546875, 1.16302490234375, 1.2128448486328125, 1.262664794921875, 1.3124847412109375, 1.3623046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 9.0, 7.0, 9.0, 8.0, 11.0, 26.0, 31.0, 46.0, 53.0, 92.0, 143.0, 188.0, 307.0, 487.0, 743.0, 1299.0, 2405.0, 4842.0, 11627.0, 34040.0, 197593.0, 713796.0, 51936.0, 15547.0, 6292.0, 3019.0, 1568.0, 855.0, 518.0, 346.0, 233.0, 125.0, 109.0, 82.0, 60.0, 34.0, 20.0, 17.0, 13.0, 11.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.00921630859375, -5.7957763671875, -5.58233642578125, -5.368896484375, -5.15545654296875, -4.9420166015625, -4.72857666015625, -4.51513671875, -4.30169677734375, -4.0882568359375, -3.87481689453125, -3.661376953125, -3.44793701171875, -3.2344970703125, -3.02105712890625, -2.8076171875, -2.59417724609375, -2.3807373046875, -2.16729736328125, -1.953857421875, -1.74041748046875, -1.5269775390625, -1.31353759765625, -1.10009765625, -0.88665771484375, -0.6732177734375, -0.45977783203125, -0.246337890625, -0.03289794921875, 0.1805419921875, 0.39398193359375, 0.607421875, 0.82086181640625, 1.0343017578125, 1.24774169921875, 1.461181640625, 1.67462158203125, 1.8880615234375, 2.10150146484375, 2.31494140625, 2.52838134765625, 2.7418212890625, 2.95526123046875, 3.168701171875, 3.38214111328125, 3.5955810546875, 3.80902099609375, 4.0224609375, 4.23590087890625, 4.4493408203125, 4.66278076171875, 4.876220703125, 5.08966064453125, 5.3031005859375, 5.51654052734375, 5.72998046875, 5.94342041015625, 6.1568603515625, 6.37030029296875, 6.583740234375, 6.79718017578125, 7.0106201171875, 7.22406005859375, 7.4375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 1.0, 4.0, 5.0, 8.0, 8.0, 6.0, 20.0, 29.0, 25.0, 37.0, 59.0, 87.0, 153.0, 201.0, 96.0, 69.0, 49.0, 27.0, 28.0, 15.0, 15.0, 12.0, 3.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00012969970703125, -0.00012590736150741577, -0.00012211501598358154, -0.00011832267045974731, -0.00011453032493591309, -0.00011073797941207886, -0.00010694563388824463, -0.0001031532883644104, -9.936094284057617e-05, -9.556859731674194e-05, -9.177625179290771e-05, -8.798390626907349e-05, -8.419156074523926e-05, -8.039921522140503e-05, -7.66068696975708e-05, -7.281452417373657e-05, -6.902217864990234e-05, -6.522983312606812e-05, -6.143748760223389e-05, -5.764514207839966e-05, -5.385279655456543e-05, -5.00604510307312e-05, -4.626810550689697e-05, -4.2475759983062744e-05, -3.8683414459228516e-05, -3.489106893539429e-05, -3.109872341156006e-05, -2.730637788772583e-05, -2.35140323638916e-05, -1.9721686840057373e-05, -1.5929341316223145e-05, -1.2136995792388916e-05, -8.344650268554688e-06, -4.552304744720459e-06, -7.599592208862305e-07, 3.032386302947998e-06, 6.8247318267822266e-06, 1.0617077350616455e-05, 1.4409422874450684e-05, 1.8201768398284912e-05, 2.199411392211914e-05, 2.578645944595337e-05, 2.9578804969787598e-05, 3.3371150493621826e-05, 3.7163496017456055e-05, 4.095584154129028e-05, 4.474818706512451e-05, 4.854053258895874e-05, 5.233287811279297e-05, 5.61252236366272e-05, 5.9917569160461426e-05, 6.370991468429565e-05, 6.750226020812988e-05, 7.129460573196411e-05, 7.508695125579834e-05, 7.887929677963257e-05, 8.26716423034668e-05, 8.646398782730103e-05, 9.025633335113525e-05, 9.404867887496948e-05, 9.784102439880371e-05, 0.00010163336992263794, 0.00010542571544647217, 0.0001092180609703064, 0.00011301040649414062]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 8.0, 9.0, 13.0, 21.0, 48.0, 57.0, 73.0, 102.0, 148.0, 190.0, 251.0, 442.0, 629.0, 903.0, 1363.0, 2213.0, 4142.0, 7915.0, 18161.0, 52601.0, 622348.0, 259927.0, 43917.0, 15979.0, 7158.0, 3776.0, 2086.0, 1249.0, 867.0, 577.0, 402.0, 277.0, 208.0, 143.0, 92.0, 70.0, 42.0, 37.0, 22.0, 13.0, 16.0, 12.0, 5.0, 6.0, 8.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.9833984375, -4.822265625, -4.6611328125, -4.5, -4.3388671875, -4.177734375, -4.0166015625, -3.85546875, -3.6943359375, -3.533203125, -3.3720703125, -3.2109375, -3.0498046875, -2.888671875, -2.7275390625, -2.56640625, -2.4052734375, -2.244140625, -2.0830078125, -1.921875, -1.7607421875, -1.599609375, -1.4384765625, -1.27734375, -1.1162109375, -0.955078125, -0.7939453125, -0.6328125, -0.4716796875, -0.310546875, -0.1494140625, 0.01171875, 0.1728515625, 0.333984375, 0.4951171875, 0.65625, 0.8173828125, 0.978515625, 1.1396484375, 1.30078125, 1.4619140625, 1.623046875, 1.7841796875, 1.9453125, 2.1064453125, 2.267578125, 2.4287109375, 2.58984375, 2.7509765625, 2.912109375, 3.0732421875, 3.234375, 3.3955078125, 3.556640625, 3.7177734375, 3.87890625, 4.0400390625, 4.201171875, 4.3623046875, 4.5234375, 4.6845703125, 4.845703125, 5.0068359375, 5.16796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 4.0, 10.0, 7.0, 5.0, 25.0, 23.0, 22.0, 39.0, 50.0, 76.0, 222.0, 208.0, 82.0, 44.0, 51.0, 25.0, 16.0, 19.0, 15.0, 12.0, 12.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.25, -1.21209716796875, -1.1741943359375, -1.13629150390625, -1.098388671875, -1.06048583984375, -1.0225830078125, -0.98468017578125, -0.94677734375, -0.90887451171875, -0.8709716796875, -0.83306884765625, -0.795166015625, -0.75726318359375, -0.7193603515625, -0.68145751953125, -0.6435546875, -0.60565185546875, -0.5677490234375, -0.52984619140625, -0.491943359375, -0.45404052734375, -0.4161376953125, -0.37823486328125, -0.34033203125, -0.30242919921875, -0.2645263671875, -0.22662353515625, -0.188720703125, -0.15081787109375, -0.1129150390625, -0.07501220703125, -0.037109375, 0.00079345703125, 0.0386962890625, 0.07659912109375, 0.114501953125, 0.15240478515625, 0.1903076171875, 0.22821044921875, 0.26611328125, 0.30401611328125, 0.3419189453125, 0.37982177734375, 0.417724609375, 0.45562744140625, 0.4935302734375, 0.53143310546875, 0.5693359375, 0.60723876953125, 0.6451416015625, 0.68304443359375, 0.720947265625, 0.75885009765625, 0.7967529296875, 0.83465576171875, 0.87255859375, 0.91046142578125, 0.9483642578125, 0.98626708984375, 1.024169921875, 1.06207275390625, 1.0999755859375, 1.13787841796875, 1.17578125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 21.0, 22.0, 29.0, 45.0, 74.0, 118.0, 150.0, 162.0, 89.0, 74.0, 63.0, 33.0, 24.0, 21.0, 16.0, 10.0, 7.0, 6.0, 7.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.855809688568115, -5.697134017944336, -5.538457870483398, -5.379782199859619, -5.22110652923584, -5.062430381774902, -4.903754711151123, -4.745079040527344, -4.586402893066406, -4.427727222442627, -4.2690510749816895, -4.11037540435791, -3.951699733734131, -3.7930238246917725, -3.634347915649414, -3.4756722450256348, -3.3169965744018555, -3.158320665359497, -2.9996449947357178, -2.8409690856933594, -2.68229341506958, -2.5236175060272217, -2.3649415969848633, -2.206265926361084, -2.0475900173187256, -1.8889142274856567, -1.730238437652588, -1.5715625286102295, -1.4128867387771606, -1.2542109489440918, -1.0955350399017334, -0.9368592500686646, -0.7781839370727539, -0.6195081472396851, -0.46083229780197144, -0.3021564781665802, -0.14348065853118896, 0.015195131301879883, 0.1738709807395935, 0.33254683017730713, 0.491222620010376, 0.6498984098434448, 0.8085742592811584, 0.9672501087188721, 1.125925898551941, 1.2846016883850098, 1.4432775974273682, 1.601953387260437, 1.7606291770935059, 1.9193049669265747, 2.0779807567596436, 2.236656665802002, 2.3953323364257812, 2.5540082454681396, 2.712684154510498, 2.8713598251342773, 3.0300357341766357, 3.188711643218994, 3.3473873138427734, 3.506063222885132, 3.6647391319274902, 3.8234148025512695, 3.982090711593628, 4.140766620635986, 4.299442291259766]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 10.0, 12.0, 11.0, 10.0, 16.0, 8.0, 14.0, 17.0, 21.0, 17.0, 27.0, 28.0, 18.0, 27.0, 34.0, 43.0, 31.0, 32.0, 45.0, 34.0, 39.0, 46.0, 44.0, 60.0, 41.0, 36.0, 29.0, 26.0, 28.0, 27.0, 18.0, 20.0, 22.0, 24.0, 12.0, 8.0, 10.0, 11.0, 10.0, 6.0, 3.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.091533660888672, -2.0223774909973145, -1.953221321105957, -1.8840651512145996, -1.8149088621139526, -1.7457526922225952, -1.6765965223312378, -1.6074403524398804, -1.5382840633392334, -1.469127893447876, -1.3999717235565186, -1.3308155536651611, -1.2616592645645142, -1.1925030946731567, -1.1233469247817993, -1.054190754890442, -0.9850345849990845, -0.915878415107727, -0.8467221856117249, -0.7775660157203674, -0.7084097862243652, -0.6392536163330078, -0.5700974464416504, -0.500941276550293, -0.43178504705429077, -0.36262884736061096, -0.29347264766693115, -0.22431647777557373, -0.15516027808189392, -0.08600407838821411, -0.01684790849685669, 0.05230829119682312, 0.12146449089050293, 0.19062069058418274, 0.25977689027786255, 0.32893306016921997, 0.3980892598628998, 0.4672454595565796, 0.536401629447937, 0.6055577993392944, 0.6747140288352966, 0.743870198726654, 0.8130264282226562, 0.8821825981140137, 0.9513387680053711, 1.0204949378967285, 1.089651107788086, 1.158807396888733, 1.2279635667800903, 1.2971197366714478, 1.3662759065628052, 1.4354321956634521, 1.5045883655548096, 1.573744535446167, 1.6429007053375244, 1.7120568752288818, 1.7812130451202393, 1.8503692150115967, 1.919525384902954, 1.9886815547943115, 2.057837724685669, 2.1269941329956055, 2.196150302886963, 2.2653064727783203, 2.3344626426696777]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 11.0, 4.0, 11.0, 14.0, 21.0, 18.0, 36.0, 40.0, 58.0, 77.0, 120.0, 124.0, 212.0, 278.0, 410.0, 539.0, 820.0, 1127.0, 1679.0, 2339.0, 3434.0, 5059.0, 7926.0, 12991.0, 21369.0, 37033.0, 67765.0, 137476.0, 355342.0, 1358594.0, 1470784.0, 387265.0, 145768.0, 72231.0, 39923.0, 23173.0, 14109.0, 8924.0, 5622.0, 3753.0, 2535.0, 1697.0, 1161.0, 776.0, 519.0, 368.0, 269.0, 155.0, 114.0, 76.0, 53.0, 34.0, 20.0, 10.0, 9.0, 3.0, 5.0, 4.0], "bins": [-3.826171875, -3.720001220703125, -3.61383056640625, -3.507659912109375, -3.4014892578125, -3.295318603515625, -3.18914794921875, -3.082977294921875, -2.976806640625, -2.870635986328125, -2.76446533203125, -2.658294677734375, -2.5521240234375, -2.445953369140625, -2.33978271484375, -2.233612060546875, -2.12744140625, -2.021270751953125, -1.91510009765625, -1.808929443359375, -1.7027587890625, -1.596588134765625, -1.49041748046875, -1.384246826171875, -1.278076171875, -1.171905517578125, -1.06573486328125, -0.959564208984375, -0.8533935546875, -0.747222900390625, -0.64105224609375, -0.534881591796875, -0.4287109375, -0.322540283203125, -0.21636962890625, -0.110198974609375, -0.0040283203125, 0.102142333984375, 0.20831298828125, 0.314483642578125, 0.420654296875, 0.526824951171875, 0.63299560546875, 0.739166259765625, 0.8453369140625, 0.951507568359375, 1.05767822265625, 1.163848876953125, 1.27001953125, 1.376190185546875, 1.48236083984375, 1.588531494140625, 1.6947021484375, 1.800872802734375, 1.90704345703125, 2.013214111328125, 2.119384765625, 2.225555419921875, 2.33172607421875, 2.437896728515625, 2.5440673828125, 2.650238037109375, 2.75640869140625, 2.862579345703125, 2.96875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 8.0, 9.0, 9.0, 20.0, 14.0, 18.0, 16.0, 18.0, 26.0, 26.0, 28.0, 28.0, 29.0, 41.0, 31.0, 36.0, 47.0, 41.0, 40.0, 50.0, 54.0, 47.0, 33.0, 46.0, 34.0, 24.0, 21.0, 39.0, 19.0, 20.0, 13.0, 18.0, 12.0, 14.0, 9.0, 8.0, 7.0, 8.0, 1.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.47265625, -1.4268341064453125, -1.381011962890625, -1.3351898193359375, -1.28936767578125, -1.2435455322265625, -1.197723388671875, -1.1519012451171875, -1.1060791015625, -1.0602569580078125, -1.014434814453125, -0.9686126708984375, -0.92279052734375, -0.8769683837890625, -0.831146240234375, -0.7853240966796875, -0.739501953125, -0.6936798095703125, -0.647857666015625, -0.6020355224609375, -0.55621337890625, -0.5103912353515625, -0.464569091796875, -0.4187469482421875, -0.3729248046875, -0.3271026611328125, -0.281280517578125, -0.2354583740234375, -0.18963623046875, -0.1438140869140625, -0.097991943359375, -0.0521697998046875, -0.00634765625, 0.0394744873046875, 0.085296630859375, 0.1311187744140625, 0.17694091796875, 0.2227630615234375, 0.268585205078125, 0.3144073486328125, 0.3602294921875, 0.4060516357421875, 0.451873779296875, 0.4976959228515625, 0.54351806640625, 0.5893402099609375, 0.635162353515625, 0.6809844970703125, 0.726806640625, 0.7726287841796875, 0.818450927734375, 0.8642730712890625, 0.91009521484375, 0.9559173583984375, 1.001739501953125, 1.0475616455078125, 1.0933837890625, 1.1392059326171875, 1.185028076171875, 1.2308502197265625, 1.27667236328125, 1.3224945068359375, 1.368316650390625, 1.4141387939453125, 1.4599609375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 14.0, 14.0, 18.0, 32.0, 49.0, 63.0, 96.0, 140.0, 216.0, 371.0, 525.0, 883.0, 1396.0, 2330.0, 4045.0, 7282.0, 12672.0, 24123.0, 47973.0, 102663.0, 244287.0, 704440.0, 1837808.0, 738313.0, 253524.0, 105628.0, 49453.0, 24760.0, 13334.0, 7223.0, 4244.0, 2438.0, 1472.0, 840.0, 596.0, 345.0, 244.0, 141.0, 98.0, 60.0, 33.0, 32.0, 22.0, 12.0, 9.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.31854248046875, -3.2132568359375, -3.10797119140625, -3.002685546875, -2.89739990234375, -2.7921142578125, -2.68682861328125, -2.58154296875, -2.47625732421875, -2.3709716796875, -2.26568603515625, -2.160400390625, -2.05511474609375, -1.9498291015625, -1.84454345703125, -1.7392578125, -1.63397216796875, -1.5286865234375, -1.42340087890625, -1.318115234375, -1.21282958984375, -1.1075439453125, -1.00225830078125, -0.89697265625, -0.79168701171875, -0.6864013671875, -0.58111572265625, -0.475830078125, -0.37054443359375, -0.2652587890625, -0.15997314453125, -0.0546875, 0.05059814453125, 0.1558837890625, 0.26116943359375, 0.366455078125, 0.47174072265625, 0.5770263671875, 0.68231201171875, 0.78759765625, 0.89288330078125, 0.9981689453125, 1.10345458984375, 1.208740234375, 1.31402587890625, 1.4193115234375, 1.52459716796875, 1.6298828125, 1.73516845703125, 1.8404541015625, 1.94573974609375, 2.051025390625, 2.15631103515625, 2.2615966796875, 2.36688232421875, 2.47216796875, 2.57745361328125, 2.6827392578125, 2.78802490234375, 2.893310546875, 2.99859619140625, 3.1038818359375, 3.20916748046875, 3.314453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 3.0, 7.0, 11.0, 10.0, 13.0, 16.0, 23.0, 24.0, 44.0, 50.0, 46.0, 55.0, 70.0, 105.0, 96.0, 141.0, 174.0, 193.0, 219.0, 243.0, 274.0, 258.0, 284.0, 270.0, 239.0, 209.0, 188.0, 142.0, 131.0, 85.0, 104.0, 57.0, 42.0, 44.0, 35.0, 34.0, 35.0, 20.0, 17.0, 14.0, 7.0, 4.0, 15.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.76171875, -0.7371826171875, -0.712646484375, -0.6881103515625, -0.66357421875, -0.6390380859375, -0.614501953125, -0.5899658203125, -0.5654296875, -0.5408935546875, -0.516357421875, -0.4918212890625, -0.46728515625, -0.4427490234375, -0.418212890625, -0.3936767578125, -0.369140625, -0.3446044921875, -0.320068359375, -0.2955322265625, -0.27099609375, -0.2464599609375, -0.221923828125, -0.1973876953125, -0.1728515625, -0.1483154296875, -0.123779296875, -0.0992431640625, -0.07470703125, -0.0501708984375, -0.025634765625, -0.0010986328125, 0.0234375, 0.0479736328125, 0.072509765625, 0.0970458984375, 0.12158203125, 0.1461181640625, 0.170654296875, 0.1951904296875, 0.2197265625, 0.2442626953125, 0.268798828125, 0.2933349609375, 0.31787109375, 0.3424072265625, 0.366943359375, 0.3914794921875, 0.416015625, 0.4405517578125, 0.465087890625, 0.4896240234375, 0.51416015625, 0.5386962890625, 0.563232421875, 0.5877685546875, 0.6123046875, 0.6368408203125, 0.661376953125, 0.6859130859375, 0.71044921875, 0.7349853515625, 0.759521484375, 0.7840576171875, 0.80859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 14.0, 14.0, 25.0, 44.0, 53.0, 90.0, 126.0, 139.0, 146.0, 100.0, 67.0, 44.0, 34.0, 26.0, 15.0, 12.0, 9.0, 5.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.113173961639404, -4.994057655334473, -4.874941349029541, -4.755825042724609, -4.636708736419678, -4.517592430114746, -4.3984761238098145, -4.279359817504883, -4.160243511199951, -4.0411272048950195, -3.922010898590088, -3.8028945922851562, -3.6837782859802246, -3.564661979675293, -3.4455456733703613, -3.3264293670654297, -3.207312822341919, -3.0881965160369873, -2.9690802097320557, -2.849963903427124, -2.7308475971221924, -2.6117312908172607, -2.49261474609375, -2.3734984397888184, -2.2543821334838867, -2.135265827178955, -2.0161495208740234, -1.8970332145690918, -1.7779169082641602, -1.6588006019592285, -1.5396841764450073, -1.4205678701400757, -1.3014514446258545, -1.1823351383209229, -1.0632188320159912, -0.9441024661064148, -0.8249861598014832, -0.7058698534965515, -0.5867534875869751, -0.46763718128204346, -0.3485208749771118, -0.22940455377101898, -0.11028823256492615, 0.00882810354232788, 0.12794440984725952, 0.24706071615219116, 0.3661770820617676, 0.4852933883666992, 0.6044096946716309, 0.7235260009765625, 0.8426423072814941, 0.9617586731910706, 1.0808749198913574, 1.199991226196289, 1.3191076517105103, 1.438223958015442, 1.5573402643203735, 1.6764565706253052, 1.7955728769302368, 1.914689302444458, 2.0338056087493896, 2.1529219150543213, 2.272038221359253, 2.3911545276641846, 2.510270833969116]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 6.0, 13.0, 8.0, 8.0, 11.0, 16.0, 25.0, 24.0, 32.0, 37.0, 24.0, 27.0, 35.0, 31.0, 31.0, 39.0, 40.0, 46.0, 51.0, 36.0, 41.0, 51.0, 49.0, 29.0, 39.0, 37.0, 20.0, 22.0, 28.0, 22.0, 21.0, 11.0, 9.0, 14.0, 12.0, 2.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8106961250305176, -1.757601261138916, -1.7045063972473145, -1.651411533355713, -1.5983166694641113, -1.5452218055725098, -1.4921269416809082, -1.4390320777893066, -1.385937213897705, -1.3328423500061035, -1.279747486114502, -1.2266526222229004, -1.1735577583312988, -1.1204628944396973, -1.0673680305480957, -1.0142731666564941, -0.9611783623695374, -0.9080834984779358, -0.8549886345863342, -0.8018937706947327, -0.7487989068031311, -0.6957041025161743, -0.6426092386245728, -0.5895143747329712, -0.5364195108413696, -0.48332464694976807, -0.4302297830581665, -0.37713491916656494, -0.3240400552749634, -0.2709452211856842, -0.21785035729408264, -0.16475549340248108, -0.11166059970855713, -0.058565739542245865, -0.005470879375934601, 0.047623977065086365, 0.10071884095668793, 0.1538136899471283, 0.20690855383872986, 0.2600034177303314, 0.313098281621933, 0.36619314551353455, 0.4192880094051361, 0.4723828434944153, 0.5254777073860168, 0.5785725712776184, 0.63166743516922, 0.6847622990608215, 0.7378571629524231, 0.7909520268440247, 0.8440468907356262, 0.8971417546272278, 0.9502366185188293, 1.0033314228057861, 1.0564262866973877, 1.1095211505889893, 1.1626160144805908, 1.2157108783721924, 1.268805742263794, 1.3219006061553955, 1.374995470046997, 1.4280903339385986, 1.4811851978302002, 1.5342800617218018, 1.5873749256134033]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 5.0, 5.0, 9.0, 22.0, 24.0, 36.0, 43.0, 81.0, 90.0, 140.0, 226.0, 375.0, 568.0, 889.0, 1390.0, 2364.0, 4237.0, 7481.0, 13942.0, 27910.0, 60446.0, 156995.0, 462461.0, 178298.0, 66327.0, 30106.0, 14973.0, 8037.0, 4472.0, 2561.0, 1479.0, 911.0, 548.0, 334.0, 233.0, 169.0, 106.0, 77.0, 44.0, 42.0, 29.0, 18.0, 7.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98046875, -1.9156494140625, -1.850830078125, -1.7860107421875, -1.72119140625, -1.6563720703125, -1.591552734375, -1.5267333984375, -1.4619140625, -1.3970947265625, -1.332275390625, -1.2674560546875, -1.20263671875, -1.1378173828125, -1.072998046875, -1.0081787109375, -0.943359375, -0.8785400390625, -0.813720703125, -0.7489013671875, -0.68408203125, -0.6192626953125, -0.554443359375, -0.4896240234375, -0.4248046875, -0.3599853515625, -0.295166015625, -0.2303466796875, -0.16552734375, -0.1007080078125, -0.035888671875, 0.0289306640625, 0.09375, 0.1585693359375, 0.223388671875, 0.2882080078125, 0.35302734375, 0.4178466796875, 0.482666015625, 0.5474853515625, 0.6123046875, 0.6771240234375, 0.741943359375, 0.8067626953125, 0.87158203125, 0.9364013671875, 1.001220703125, 1.0660400390625, 1.130859375, 1.1956787109375, 1.260498046875, 1.3253173828125, 1.39013671875, 1.4549560546875, 1.519775390625, 1.5845947265625, 1.6494140625, 1.7142333984375, 1.779052734375, 1.8438720703125, 1.90869140625, 1.9735107421875, 2.038330078125, 2.1031494140625, 2.16796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 7.0, 7.0, 10.0, 12.0, 9.0, 20.0, 23.0, 24.0, 22.0, 27.0, 36.0, 40.0, 34.0, 32.0, 42.0, 41.0, 43.0, 47.0, 38.0, 52.0, 41.0, 41.0, 47.0, 34.0, 44.0, 24.0, 27.0, 24.0, 19.0, 22.0, 16.0, 13.0, 10.0, 10.0, 10.0, 7.0, 8.0, 5.0, 7.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.9609375, -1.9049072265625, -1.848876953125, -1.7928466796875, -1.73681640625, -1.6807861328125, -1.624755859375, -1.5687255859375, -1.5126953125, -1.4566650390625, -1.400634765625, -1.3446044921875, -1.28857421875, -1.2325439453125, -1.176513671875, -1.1204833984375, -1.064453125, -1.0084228515625, -0.952392578125, -0.8963623046875, -0.84033203125, -0.7843017578125, -0.728271484375, -0.6722412109375, -0.6162109375, -0.5601806640625, -0.504150390625, -0.4481201171875, -0.39208984375, -0.3360595703125, -0.280029296875, -0.2239990234375, -0.16796875, -0.1119384765625, -0.055908203125, 0.0001220703125, 0.05615234375, 0.1121826171875, 0.168212890625, 0.2242431640625, 0.2802734375, 0.3363037109375, 0.392333984375, 0.4483642578125, 0.50439453125, 0.5604248046875, 0.616455078125, 0.6724853515625, 0.728515625, 0.7845458984375, 0.840576171875, 0.8966064453125, 0.95263671875, 1.0086669921875, 1.064697265625, 1.1207275390625, 1.1767578125, 1.2327880859375, 1.288818359375, 1.3448486328125, 1.40087890625, 1.4569091796875, 1.512939453125, 1.5689697265625, 1.625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 10.0, 15.0, 16.0, 25.0, 28.0, 38.0, 35.0, 60.0, 81.0, 100.0, 136.0, 200.0, 279.0, 407.0, 622.0, 930.0, 1583.0, 2407.0, 4140.0, 7568.0, 15832.0, 44352.0, 506330.0, 389035.0, 41194.0, 15235.0, 7333.0, 3953.0, 2289.0, 1415.0, 913.0, 595.0, 389.0, 275.0, 185.0, 131.0, 90.0, 82.0, 58.0, 42.0, 32.0, 29.0, 20.0, 18.0, 3.0, 6.0, 9.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0], "bins": [-3.138671875, -3.037322998046875, -2.93597412109375, -2.834625244140625, -2.7332763671875, -2.631927490234375, -2.53057861328125, -2.429229736328125, -2.327880859375, -2.226531982421875, -2.12518310546875, -2.023834228515625, -1.9224853515625, -1.821136474609375, -1.71978759765625, -1.618438720703125, -1.51708984375, -1.415740966796875, -1.31439208984375, -1.213043212890625, -1.1116943359375, -1.010345458984375, -0.90899658203125, -0.807647705078125, -0.706298828125, -0.604949951171875, -0.50360107421875, -0.402252197265625, -0.3009033203125, -0.199554443359375, -0.09820556640625, 0.003143310546875, 0.1044921875, 0.205841064453125, 0.30718994140625, 0.408538818359375, 0.5098876953125, 0.611236572265625, 0.71258544921875, 0.813934326171875, 0.915283203125, 1.016632080078125, 1.11798095703125, 1.219329833984375, 1.3206787109375, 1.422027587890625, 1.52337646484375, 1.624725341796875, 1.72607421875, 1.827423095703125, 1.92877197265625, 2.030120849609375, 2.1314697265625, 2.232818603515625, 2.33416748046875, 2.435516357421875, 2.536865234375, 2.638214111328125, 2.73956298828125, 2.840911865234375, 2.9422607421875, 3.043609619140625, 3.14495849609375, 3.246307373046875, 3.34765625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 12.0, 6.0, 4.0, 4.0, 13.0, 9.0, 21.0, 19.0, 22.0, 27.0, 21.0, 24.0, 26.0, 36.0, 38.0, 42.0, 38.0, 45.0, 35.0, 47.0, 45.0, 60.0, 37.0, 30.0, 40.0, 38.0, 45.0, 27.0, 27.0, 33.0, 22.0, 22.0, 18.0, 25.0, 16.0, 9.0, 8.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.27520751953125, -1.2349853515625, -1.19476318359375, -1.154541015625, -1.11431884765625, -1.0740966796875, -1.03387451171875, -0.99365234375, -0.95343017578125, -0.9132080078125, -0.87298583984375, -0.832763671875, -0.79254150390625, -0.7523193359375, -0.71209716796875, -0.671875, -0.63165283203125, -0.5914306640625, -0.55120849609375, -0.510986328125, -0.47076416015625, -0.4305419921875, -0.39031982421875, -0.35009765625, -0.30987548828125, -0.2696533203125, -0.22943115234375, -0.189208984375, -0.14898681640625, -0.1087646484375, -0.06854248046875, -0.0283203125, 0.01190185546875, 0.0521240234375, 0.09234619140625, 0.132568359375, 0.17279052734375, 0.2130126953125, 0.25323486328125, 0.29345703125, 0.33367919921875, 0.3739013671875, 0.41412353515625, 0.454345703125, 0.49456787109375, 0.5347900390625, 0.57501220703125, 0.615234375, 0.65545654296875, 0.6956787109375, 0.73590087890625, 0.776123046875, 0.81634521484375, 0.8565673828125, 0.89678955078125, 0.93701171875, 0.97723388671875, 1.0174560546875, 1.05767822265625, 1.097900390625, 1.13812255859375, 1.1783447265625, 1.21856689453125, 1.2587890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 4.0, 4.0, 11.0, 18.0, 23.0, 27.0, 42.0, 73.0, 95.0, 124.0, 173.0, 230.0, 344.0, 497.0, 759.0, 1017.0, 1641.0, 2573.0, 4473.0, 8028.0, 16466.0, 41637.0, 173971.0, 644165.0, 93840.0, 29104.0, 12516.0, 6395.0, 3636.0, 2149.0, 1443.0, 918.0, 607.0, 474.0, 313.0, 210.0, 149.0, 111.0, 90.0, 51.0, 41.0, 25.0, 34.0, 11.0, 12.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.44189453125, -0.42822265625, -0.41455078125, -0.40087890625, -0.38720703125, -0.37353515625, -0.35986328125, -0.34619140625, -0.33251953125, -0.31884765625, -0.30517578125, -0.29150390625, -0.27783203125, -0.26416015625, -0.25048828125, -0.23681640625, -0.22314453125, -0.20947265625, -0.19580078125, -0.18212890625, -0.16845703125, -0.15478515625, -0.14111328125, -0.12744140625, -0.11376953125, -0.10009765625, -0.08642578125, -0.07275390625, -0.05908203125, -0.04541015625, -0.03173828125, -0.01806640625, -0.00439453125, 0.00927734375, 0.02294921875, 0.03662109375, 0.05029296875, 0.06396484375, 0.07763671875, 0.09130859375, 0.10498046875, 0.11865234375, 0.13232421875, 0.14599609375, 0.15966796875, 0.17333984375, 0.18701171875, 0.20068359375, 0.21435546875, 0.22802734375, 0.24169921875, 0.25537109375, 0.26904296875, 0.28271484375, 0.29638671875, 0.31005859375, 0.32373046875, 0.33740234375, 0.35107421875, 0.36474609375, 0.37841796875, 0.39208984375, 0.40576171875, 0.41943359375, 0.43310546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 1.0, 6.0, 1.0, 3.0, 12.0, 6.0, 10.0, 8.0, 14.0, 17.0, 28.0, 39.0, 31.0, 43.0, 69.0, 79.0, 90.0, 103.0, 81.0, 91.0, 69.0, 47.0, 28.0, 32.0, 18.0, 15.0, 12.0, 8.0, 10.0, 9.0, 8.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.7894973754882812e-05, -2.7103349566459656e-05, -2.63117253780365e-05, -2.5520101189613342e-05, -2.4728477001190186e-05, -2.393685281276703e-05, -2.3145228624343872e-05, -2.2353604435920715e-05, -2.156198024749756e-05, -2.0770356059074402e-05, -1.9978731870651245e-05, -1.918710768222809e-05, -1.839548349380493e-05, -1.7603859305381775e-05, -1.6812235116958618e-05, -1.602061092853546e-05, -1.5228986740112305e-05, -1.4437362551689148e-05, -1.3645738363265991e-05, -1.2854114174842834e-05, -1.2062489986419678e-05, -1.1270865797996521e-05, -1.0479241609573364e-05, -9.687617421150208e-06, -8.89599323272705e-06, -8.104369044303894e-06, -7.312744855880737e-06, -6.5211206674575806e-06, -5.729496479034424e-06, -4.937872290611267e-06, -4.14624810218811e-06, -3.3546239137649536e-06, -2.562999725341797e-06, -1.7713755369186401e-06, -9.797513484954834e-07, -1.8812716007232666e-07, 6.034970283508301e-07, 1.3951212167739868e-06, 2.1867454051971436e-06, 2.9783695936203003e-06, 3.769993782043457e-06, 4.561617970466614e-06, 5.3532421588897705e-06, 6.144866347312927e-06, 6.936490535736084e-06, 7.72811472415924e-06, 8.519738912582397e-06, 9.311363101005554e-06, 1.0102987289428711e-05, 1.0894611477851868e-05, 1.1686235666275024e-05, 1.2477859854698181e-05, 1.3269484043121338e-05, 1.4061108231544495e-05, 1.4852732419967651e-05, 1.5644356608390808e-05, 1.6435980796813965e-05, 1.722760498523712e-05, 1.801922917366028e-05, 1.8810853362083435e-05, 1.9602477550506592e-05, 2.039410173892975e-05, 2.1185725927352905e-05, 2.1977350115776062e-05, 2.276897430419922e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 8.0, 11.0, 7.0, 8.0, 9.0, 17.0, 26.0, 42.0, 59.0, 77.0, 115.0, 156.0, 228.0, 319.0, 438.0, 694.0, 996.0, 1540.0, 2298.0, 3825.0, 6169.0, 10870.0, 19524.0, 38698.0, 88250.0, 306167.0, 375445.0, 99542.0, 42010.0, 21210.0, 11611.0, 6761.0, 4007.0, 2516.0, 1627.0, 1015.0, 697.0, 444.0, 342.0, 223.0, 159.0, 114.0, 80.0, 45.0, 48.0, 31.0, 25.0, 18.0, 11.0, 7.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.3271484375, -0.3158912658691406, -0.30463409423828125, -0.2933769226074219, -0.2821197509765625, -0.2708625793457031, -0.25960540771484375, -0.24834823608398438, -0.237091064453125, -0.22583389282226562, -0.21457672119140625, -0.20331954956054688, -0.1920623779296875, -0.18080520629882812, -0.16954803466796875, -0.15829086303710938, -0.14703369140625, -0.13577651977539062, -0.12451934814453125, -0.11326217651367188, -0.1020050048828125, -0.09074783325195312, -0.07949066162109375, -0.06823348999023438, -0.056976318359375, -0.045719146728515625, -0.03446197509765625, -0.023204803466796875, -0.0119476318359375, -0.000690460205078125, 0.01056671142578125, 0.021823883056640625, 0.0330810546875, 0.044338226318359375, 0.05559539794921875, 0.06685256958007812, 0.0781097412109375, 0.08936691284179688, 0.10062408447265625, 0.11188125610351562, 0.123138427734375, 0.13439559936523438, 0.14565277099609375, 0.15690994262695312, 0.1681671142578125, 0.17942428588867188, 0.19068145751953125, 0.20193862915039062, 0.21319580078125, 0.22445297241210938, 0.23571014404296875, 0.24696731567382812, 0.2582244873046875, 0.2694816589355469, 0.28073883056640625, 0.2919960021972656, 0.303253173828125, 0.3145103454589844, 0.32576751708984375, 0.3370246887207031, 0.3482818603515625, 0.3595390319824219, 0.37079620361328125, 0.3820533752441406, 0.393310546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 8.0, 3.0, 5.0, 3.0, 8.0, 12.0, 11.0, 14.0, 15.0, 39.0, 29.0, 35.0, 57.0, 75.0, 98.0, 119.0, 103.0, 83.0, 74.0, 44.0, 37.0, 25.0, 18.0, 26.0, 16.0, 8.0, 7.0, 8.0, 6.0, 6.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.08958816528320312, -0.08634185791015625, -0.08309555053710938, -0.0798492431640625, -0.07660293579101562, -0.07335662841796875, -0.07011032104492188, -0.066864013671875, -0.06361770629882812, -0.06037139892578125, -0.057125091552734375, -0.0538787841796875, -0.050632476806640625, -0.04738616943359375, -0.044139862060546875, -0.0408935546875, -0.037647247314453125, -0.03440093994140625, -0.031154632568359375, -0.0279083251953125, -0.024662017822265625, -0.02141571044921875, -0.018169403076171875, -0.014923095703125, -0.011676788330078125, -0.00843048095703125, -0.005184173583984375, -0.0019378662109375, 0.001308441162109375, 0.00455474853515625, 0.007801055908203125, 0.01104736328125, 0.014293670654296875, 0.01753997802734375, 0.020786285400390625, 0.0240325927734375, 0.027278900146484375, 0.03052520751953125, 0.033771514892578125, 0.037017822265625, 0.040264129638671875, 0.04351043701171875, 0.046756744384765625, 0.0500030517578125, 0.053249359130859375, 0.05649566650390625, 0.059741973876953125, 0.06298828125, 0.06623458862304688, 0.06948089599609375, 0.07272720336914062, 0.0759735107421875, 0.07921981811523438, 0.08246612548828125, 0.08571243286132812, 0.088958740234375, 0.09220504760742188, 0.09545135498046875, 0.09869766235351562, 0.1019439697265625, 0.10519027709960938, 0.10843658447265625, 0.11168289184570312, 0.11492919921875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 12.0, 18.0, 20.0, 37.0, 63.0, 84.0, 123.0, 133.0, 144.0, 124.0, 64.0, 31.0, 40.0, 28.0, 21.0, 8.0, 10.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.878830432891846, -4.762570381164551, -4.646309852600098, -4.530049800872803, -4.41378927230835, -4.297529220581055, -4.181268692016602, -4.065008640289307, -3.9487483501434326, -3.8324880599975586, -3.7162277698516846, -3.5999674797058105, -3.4837074279785156, -3.3674468994140625, -3.2511868476867676, -3.1349265575408936, -3.0186662673950195, -2.9024059772491455, -2.7861456871032715, -2.6698853969573975, -2.5536251068115234, -2.4373650550842285, -2.3211047649383545, -2.2048444747924805, -2.0885841846466064, -1.9723238945007324, -1.8560636043548584, -1.739803433418274, -1.6235431432724, -1.5072828531265259, -1.3910226821899414, -1.2747623920440674, -1.1585018634796143, -1.0422415733337402, -0.925981342792511, -0.8097211122512817, -0.6934608221054077, -0.5772005319595337, -0.46094030141830444, -0.3446800708770752, -0.22841978073120117, -0.11215952038764954, 0.0041007399559021, 0.12036100029945374, 0.23662126064300537, 0.3528815507888794, 0.46914178133010864, 0.5854020118713379, 0.7016623020172119, 0.8179225921630859, 0.9341828227043152, 1.0504430532455444, 1.1667033433914185, 1.2829636335372925, 1.399223804473877, 1.515484094619751, 1.631744384765625, 1.748004674911499, 1.864264965057373, 1.9805251359939575, 2.096785545349121, 2.213045597076416, 2.32930588722229, 2.445566177368164, 2.561826467514038]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 13.0, 8.0, 11.0, 9.0, 7.0, 16.0, 14.0, 20.0, 34.0, 33.0, 30.0, 24.0, 36.0, 31.0, 30.0, 29.0, 35.0, 50.0, 48.0, 43.0, 30.0, 42.0, 56.0, 45.0, 34.0, 32.0, 41.0, 23.0, 19.0, 27.0, 23.0, 18.0, 12.0, 9.0, 12.0, 12.0, 6.0, 7.0, 3.0, 6.0, 8.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7791060209274292, -1.7269487380981445, -1.6747915744781494, -1.6226342916488647, -1.5704771280288696, -1.518319845199585, -1.4661626815795898, -1.4140053987503052, -1.36184823513031, -1.3096909523010254, -1.2575337886810303, -1.2053765058517456, -1.1532193422317505, -1.1010620594024658, -1.0489048957824707, -0.996747612953186, -0.9445903897285461, -0.8924331665039062, -0.8402759432792664, -0.7881187200546265, -0.7359614968299866, -0.6838042736053467, -0.631646990776062, -0.5794898271560669, -0.5273325443267822, -0.47517532110214233, -0.42301809787750244, -0.37086087465286255, -0.31870365142822266, -0.2665463984012604, -0.21438917517662048, -0.1622319519519806, -0.11007475852966309, -0.057917531579732895, -0.005760304629802704, 0.046396926045417786, 0.09855414927005768, 0.15071138739585876, 0.20286861062049866, 0.25502583384513855, 0.30718305706977844, 0.35934028029441833, 0.4114975035190582, 0.4636547565460205, 0.5158119797706604, 0.5679692029953003, 0.6201264262199402, 0.6722836494445801, 0.72444087266922, 0.7765980958938599, 0.8287553191184998, 0.8809125423431396, 0.9330697655677795, 0.9852269887924194, 1.037384271621704, 1.0895414352416992, 1.1416987180709839, 1.1938560009002686, 1.2460131645202637, 1.2981704473495483, 1.3503276109695435, 1.4024848937988281, 1.4546420574188232, 1.506799340248108, 1.558956503868103]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 1.0, 7.0, 5.0, 9.0, 26.0, 30.0, 49.0, 70.0, 112.0, 155.0, 244.0, 385.0, 607.0, 994.0, 1725.0, 2833.0, 4928.0, 8526.0, 15054.0, 26876.0, 49975.0, 96584.0, 183327.0, 266711.0, 181691.0, 95515.0, 49909.0, 26680.0, 14879.0, 8526.0, 4904.0, 2894.0, 1649.0, 953.0, 590.0, 400.0, 268.0, 152.0, 104.0, 64.0, 59.0, 25.0, 15.0, 20.0, 6.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.0390625, -2.94256591796875, -2.8460693359375, -2.74957275390625, -2.653076171875, -2.55657958984375, -2.4600830078125, -2.36358642578125, -2.26708984375, -2.17059326171875, -2.0740966796875, -1.97760009765625, -1.881103515625, -1.78460693359375, -1.6881103515625, -1.59161376953125, -1.4951171875, -1.39862060546875, -1.3021240234375, -1.20562744140625, -1.109130859375, -1.01263427734375, -0.9161376953125, -0.81964111328125, -0.72314453125, -0.62664794921875, -0.5301513671875, -0.43365478515625, -0.337158203125, -0.24066162109375, -0.1441650390625, -0.04766845703125, 0.048828125, 0.14532470703125, 0.2418212890625, 0.33831787109375, 0.434814453125, 0.53131103515625, 0.6278076171875, 0.72430419921875, 0.82080078125, 0.91729736328125, 1.0137939453125, 1.11029052734375, 1.206787109375, 1.30328369140625, 1.3997802734375, 1.49627685546875, 1.5927734375, 1.68927001953125, 1.7857666015625, 1.88226318359375, 1.978759765625, 2.07525634765625, 2.1717529296875, 2.26824951171875, 2.36474609375, 2.46124267578125, 2.5577392578125, 2.65423583984375, 2.750732421875, 2.84722900390625, 2.9437255859375, 3.04022216796875, 3.13671875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 10.0, 10.0, 16.0, 23.0, 26.0, 30.0, 17.0, 25.0, 26.0, 32.0, 33.0, 36.0, 38.0, 37.0, 39.0, 35.0, 41.0, 26.0, 51.0, 46.0, 42.0, 38.0, 35.0, 27.0, 26.0, 30.0, 24.0, 25.0, 19.0, 15.0, 11.0, 6.0, 16.0, 11.0, 8.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.5498046875, -1.5045013427734375, -1.459197998046875, -1.4138946533203125, -1.36859130859375, -1.3232879638671875, -1.277984619140625, -1.2326812744140625, -1.1873779296875, -1.1420745849609375, -1.096771240234375, -1.0514678955078125, -1.00616455078125, -0.9608612060546875, -0.915557861328125, -0.8702545166015625, -0.824951171875, -0.7796478271484375, -0.734344482421875, -0.6890411376953125, -0.64373779296875, -0.5984344482421875, -0.553131103515625, -0.5078277587890625, -0.4625244140625, -0.4172210693359375, -0.371917724609375, -0.3266143798828125, -0.28131103515625, -0.2360076904296875, -0.190704345703125, -0.1454010009765625, -0.10009765625, -0.0547943115234375, -0.009490966796875, 0.0358123779296875, 0.08111572265625, 0.1264190673828125, 0.171722412109375, 0.2170257568359375, 0.2623291015625, 0.3076324462890625, 0.352935791015625, 0.3982391357421875, 0.44354248046875, 0.4888458251953125, 0.534149169921875, 0.5794525146484375, 0.624755859375, 0.6700592041015625, 0.715362548828125, 0.7606658935546875, 0.80596923828125, 0.8512725830078125, 0.896575927734375, 0.9418792724609375, 0.9871826171875, 1.0324859619140625, 1.077789306640625, 1.1230926513671875, 1.16839599609375, 1.2136993408203125, 1.259002685546875, 1.3043060302734375, 1.349609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 16.0, 27.0, 31.0, 57.0, 66.0, 102.0, 173.0, 265.0, 389.0, 707.0, 1180.0, 2021.0, 3995.0, 7653.0, 15221.0, 30994.0, 64123.0, 135050.0, 281210.0, 263826.0, 124203.0, 59120.0, 28379.0, 14009.0, 7159.0, 3758.0, 2001.0, 1098.0, 629.0, 378.0, 224.0, 152.0, 101.0, 58.0, 52.0, 42.0, 22.0, 14.0, 13.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40625, -3.29962158203125, -3.1929931640625, -3.08636474609375, -2.979736328125, -2.87310791015625, -2.7664794921875, -2.65985107421875, -2.55322265625, -2.44659423828125, -2.3399658203125, -2.23333740234375, -2.126708984375, -2.02008056640625, -1.9134521484375, -1.80682373046875, -1.7001953125, -1.59356689453125, -1.4869384765625, -1.38031005859375, -1.273681640625, -1.16705322265625, -1.0604248046875, -0.95379638671875, -0.84716796875, -0.74053955078125, -0.6339111328125, -0.52728271484375, -0.420654296875, -0.31402587890625, -0.2073974609375, -0.10076904296875, 0.005859375, 0.11248779296875, 0.2191162109375, 0.32574462890625, 0.432373046875, 0.53900146484375, 0.6456298828125, 0.75225830078125, 0.85888671875, 0.96551513671875, 1.0721435546875, 1.17877197265625, 1.285400390625, 1.39202880859375, 1.4986572265625, 1.60528564453125, 1.7119140625, 1.81854248046875, 1.9251708984375, 2.03179931640625, 2.138427734375, 2.24505615234375, 2.3516845703125, 2.45831298828125, 2.56494140625, 2.67156982421875, 2.7781982421875, 2.88482666015625, 2.991455078125, 3.09808349609375, 3.2047119140625, 3.31134033203125, 3.41796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 8.0, 6.0, 12.0, 12.0, 13.0, 18.0, 27.0, 14.0, 15.0, 22.0, 31.0, 23.0, 31.0, 37.0, 26.0, 34.0, 38.0, 46.0, 32.0, 42.0, 43.0, 51.0, 35.0, 33.0, 39.0, 36.0, 29.0, 22.0, 32.0, 28.0, 18.0, 19.0, 16.0, 15.0, 10.0, 10.0, 13.0, 12.0, 5.0, 11.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7533187866210938, -0.7239227294921875, -0.6945266723632812, -0.665130615234375, -0.6357345581054688, -0.6063385009765625, -0.5769424438476562, -0.54754638671875, -0.5181503295898438, -0.4887542724609375, -0.45935821533203125, -0.429962158203125, -0.40056610107421875, -0.3711700439453125, -0.34177398681640625, -0.3123779296875, -0.28298187255859375, -0.2535858154296875, -0.22418975830078125, -0.194793701171875, -0.16539764404296875, -0.1360015869140625, -0.10660552978515625, -0.07720947265625, -0.04781341552734375, -0.0184173583984375, 0.01097869873046875, 0.040374755859375, 0.06977081298828125, 0.0991668701171875, 0.12856292724609375, 0.157958984375, 0.18735504150390625, 0.2167510986328125, 0.24614715576171875, 0.275543212890625, 0.30493927001953125, 0.3343353271484375, 0.36373138427734375, 0.39312744140625, 0.42252349853515625, 0.4519195556640625, 0.48131561279296875, 0.510711669921875, 0.5401077270507812, 0.5695037841796875, 0.5988998413085938, 0.6282958984375, 0.6576919555664062, 0.6870880126953125, 0.7164840698242188, 0.745880126953125, 0.7752761840820312, 0.8046722412109375, 0.8340682983398438, 0.86346435546875, 0.8928604125976562, 0.9222564697265625, 0.9516525268554688, 0.981048583984375, 1.0104446411132812, 1.0398406982421875, 1.0692367553710938, 1.0986328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 3.0, 5.0, 11.0, 6.0, 22.0, 26.0, 37.0, 35.0, 76.0, 118.0, 175.0, 270.0, 425.0, 724.0, 1250.0, 2347.0, 4629.0, 9614.0, 23002.0, 76211.0, 686442.0, 177519.0, 37922.0, 14067.0, 6295.0, 3131.0, 1781.0, 938.0, 534.0, 296.0, 205.0, 143.0, 85.0, 57.0, 63.0, 22.0, 18.0, 17.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.9378662109375, -3.805419921875, -3.6729736328125, -3.54052734375, -3.4080810546875, -3.275634765625, -3.1431884765625, -3.0107421875, -2.8782958984375, -2.745849609375, -2.6134033203125, -2.48095703125, -2.3485107421875, -2.216064453125, -2.0836181640625, -1.951171875, -1.8187255859375, -1.686279296875, -1.5538330078125, -1.42138671875, -1.2889404296875, -1.156494140625, -1.0240478515625, -0.8916015625, -0.7591552734375, -0.626708984375, -0.4942626953125, -0.36181640625, -0.2293701171875, -0.096923828125, 0.0355224609375, 0.16796875, 0.3004150390625, 0.432861328125, 0.5653076171875, 0.69775390625, 0.8302001953125, 0.962646484375, 1.0950927734375, 1.2275390625, 1.3599853515625, 1.492431640625, 1.6248779296875, 1.75732421875, 1.8897705078125, 2.022216796875, 2.1546630859375, 2.287109375, 2.4195556640625, 2.552001953125, 2.6844482421875, 2.81689453125, 2.9493408203125, 3.081787109375, 3.2142333984375, 3.3466796875, 3.4791259765625, 3.611572265625, 3.7440185546875, 3.87646484375, 4.0089111328125, 4.141357421875, 4.2738037109375, 4.40625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 10.0, 4.0, 9.0, 13.0, 24.0, 43.0, 72.0, 114.0, 185.0, 224.0, 116.0, 74.0, 28.0, 21.0, 19.0, 10.0, 8.0, 7.0, 5.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-05, -8.894316852092743e-05, -8.490309119224548e-05, -8.086301386356354e-05, -7.682293653488159e-05, -7.278285920619965e-05, -6.87427818775177e-05, -6.470270454883575e-05, -6.066262722015381e-05, -5.662254989147186e-05, -5.258247256278992e-05, -4.854239523410797e-05, -4.4502317905426025e-05, -4.046224057674408e-05, -3.6422163248062134e-05, -3.238208591938019e-05, -2.8342008590698242e-05, -2.4301931262016296e-05, -2.026185393333435e-05, -1.6221776604652405e-05, -1.2181699275970459e-05, -8.141621947288513e-06, -4.101544618606567e-06, -6.146728992462158e-08, 3.978610038757324e-06, 8.01868736743927e-06, 1.2058764696121216e-05, 1.609884202480316e-05, 2.0138919353485107e-05, 2.4178996682167053e-05, 2.8219074010849e-05, 3.2259151339530945e-05, 3.629922866821289e-05, 4.0339305996894836e-05, 4.437938332557678e-05, 4.841946065425873e-05, 5.2459537982940674e-05, 5.649961531162262e-05, 6.0539692640304565e-05, 6.457976996898651e-05, 6.861984729766846e-05, 7.26599246263504e-05, 7.670000195503235e-05, 8.07400792837143e-05, 8.478015661239624e-05, 8.882023394107819e-05, 9.286031126976013e-05, 9.690038859844208e-05, 0.00010094046592712402, 0.00010498054325580597, 0.00010902062058448792, 0.00011306069791316986, 0.0001171007752418518, 0.00012114085257053375, 0.0001251809298992157, 0.00012922100722789764, 0.0001332610845565796, 0.00013730116188526154, 0.00014134123921394348, 0.00014538131654262543, 0.00014942139387130737, 0.00015346147119998932, 0.00015750154852867126, 0.0001615416258573532, 0.00016558170318603516]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 8.0, 7.0, 12.0, 17.0, 36.0, 36.0, 46.0, 90.0, 127.0, 162.0, 258.0, 394.0, 633.0, 1064.0, 1786.0, 3401.0, 6783.0, 15688.0, 47846.0, 536597.0, 359615.0, 44559.0, 15034.0, 6506.0, 3265.0, 1731.0, 1020.0, 641.0, 413.0, 240.0, 160.0, 107.0, 72.0, 63.0, 42.0, 21.0, 22.0, 19.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.514404296875, -4.36865234375, -4.222900390625, -4.0771484375, -3.931396484375, -3.78564453125, -3.639892578125, -3.494140625, -3.348388671875, -3.20263671875, -3.056884765625, -2.9111328125, -2.765380859375, -2.61962890625, -2.473876953125, -2.328125, -2.182373046875, -2.03662109375, -1.890869140625, -1.7451171875, -1.599365234375, -1.45361328125, -1.307861328125, -1.162109375, -1.016357421875, -0.87060546875, -0.724853515625, -0.5791015625, -0.433349609375, -0.28759765625, -0.141845703125, 0.00390625, 0.149658203125, 0.29541015625, 0.441162109375, 0.5869140625, 0.732666015625, 0.87841796875, 1.024169921875, 1.169921875, 1.315673828125, 1.46142578125, 1.607177734375, 1.7529296875, 1.898681640625, 2.04443359375, 2.190185546875, 2.3359375, 2.481689453125, 2.62744140625, 2.773193359375, 2.9189453125, 3.064697265625, 3.21044921875, 3.356201171875, 3.501953125, 3.647705078125, 3.79345703125, 3.939208984375, 4.0849609375, 4.230712890625, 4.37646484375, 4.522216796875, 4.66796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 14.0, 19.0, 18.0, 35.0, 35.0, 69.0, 105.0, 233.0, 159.0, 91.0, 56.0, 35.0, 30.0, 18.0, 14.0, 11.0, 6.0, 4.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.06219482421875, -1.0277099609375, -0.99322509765625, -0.958740234375, -0.92425537109375, -0.8897705078125, -0.85528564453125, -0.82080078125, -0.78631591796875, -0.7518310546875, -0.71734619140625, -0.682861328125, -0.64837646484375, -0.6138916015625, -0.57940673828125, -0.544921875, -0.51043701171875, -0.4759521484375, -0.44146728515625, -0.406982421875, -0.37249755859375, -0.3380126953125, -0.30352783203125, -0.26904296875, -0.23455810546875, -0.2000732421875, -0.16558837890625, -0.131103515625, -0.09661865234375, -0.0621337890625, -0.02764892578125, 0.0068359375, 0.04132080078125, 0.0758056640625, 0.11029052734375, 0.144775390625, 0.17926025390625, 0.2137451171875, 0.24822998046875, 0.28271484375, 0.31719970703125, 0.3516845703125, 0.38616943359375, 0.420654296875, 0.45513916015625, 0.4896240234375, 0.52410888671875, 0.55859375, 0.59307861328125, 0.6275634765625, 0.66204833984375, 0.696533203125, 0.73101806640625, 0.7655029296875, 0.79998779296875, 0.83447265625, 0.86895751953125, 0.9034423828125, 0.93792724609375, 0.972412109375, 1.00689697265625, 1.0413818359375, 1.07586669921875, 1.1103515625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 9.0, 10.0, 15.0, 24.0, 40.0, 69.0, 65.0, 104.0, 140.0, 116.0, 118.0, 58.0, 49.0, 28.0, 29.0, 24.0, 21.0, 21.0, 13.0, 11.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3150670528411865, -2.224872589111328, -2.134678363800049, -2.0444841384887695, -1.9542896747589111, -1.8640953302383423, -1.7739009857177734, -1.6837066411972046, -1.5935122966766357, -1.503317952156067, -1.413123607635498, -1.3229292631149292, -1.2327349185943604, -1.1425405740737915, -1.0523462295532227, -0.9621518850326538, -0.871957540512085, -0.7817631959915161, -0.6915688514709473, -0.6013745069503784, -0.5111801624298096, -0.4209858179092407, -0.3307914733886719, -0.24059712886810303, -0.15040278434753418, -0.06020843982696533, 0.029985904693603516, 0.12018024921417236, 0.2103745937347412, 0.30056893825531006, 0.3907632827758789, 0.48095762729644775, 0.5711519718170166, 0.6613463163375854, 0.7515406608581543, 0.8417350053787231, 0.931929349899292, 1.0221236944198608, 1.1123180389404297, 1.2025123834609985, 1.2927067279815674, 1.3829010725021362, 1.473095417022705, 1.563289761543274, 1.6534841060638428, 1.7436784505844116, 1.8338727951049805, 1.9240671396255493, 2.014261484146118, 2.1044559478759766, 2.194650173187256, 2.284844398498535, 2.3750388622283936, 2.465233325958252, 2.5554275512695312, 2.6456217765808105, 2.735816240310669, 2.8260107040405273, 2.9162049293518066, 3.006399154663086, 3.0965936183929443, 3.1867880821228027, 3.276982307434082, 3.3671765327453613, 3.4573709964752197]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 10.0, 10.0, 2.0, 16.0, 15.0, 17.0, 22.0, 36.0, 26.0, 31.0, 27.0, 41.0, 41.0, 46.0, 63.0, 47.0, 44.0, 34.0, 53.0, 36.0, 32.0, 45.0, 38.0, 47.0, 36.0, 29.0, 29.0, 12.0, 21.0, 23.0, 22.0, 12.0, 10.0, 5.0, 3.0, 6.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7765657901763916, -1.7177287340164185, -1.6588915586471558, -1.6000545024871826, -1.5412174463272095, -1.4823803901672363, -1.4235432147979736, -1.3647061586380005, -1.3058691024780273, -1.2470320463180542, -1.1881948709487915, -1.1293578147888184, -1.0705207586288452, -1.011683702468872, -0.9528465270996094, -0.8940094709396362, -0.8351722955703735, -0.7763351798057556, -0.7174981236457825, -0.6586610078811646, -0.5998239517211914, -0.5409868359565735, -0.48214972019195557, -0.42331263422966003, -0.3644755482673645, -0.30563846230506897, -0.24680136144161224, -0.18796426057815552, -0.12912717461585999, -0.07029008865356445, -0.011452972888946533, 0.047384113073349, 0.10622119903564453, 0.16505828499794006, 0.2238953858613968, 0.2827324867248535, 0.34156957268714905, 0.4004066586494446, 0.4592437744140625, 0.5180808305740356, 0.5769179463386536, 0.6357550621032715, 0.6945921182632446, 0.7534292340278625, 0.8122663497924805, 0.8711034059524536, 0.9299405217170715, 0.9887776374816895, 1.0476146936416626, 1.1064517498016357, 1.1652889251708984, 1.2241259813308716, 1.2829630374908447, 1.3418002128601074, 1.4006372690200806, 1.4594743251800537, 1.5183115005493164, 1.5771485567092896, 1.6359857320785522, 1.6948227882385254, 1.7536598443984985, 1.8124969005584717, 1.8713340759277344, 1.9301711320877075, 1.9890081882476807]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 24.0, 20.0, 35.0, 43.0, 66.0, 80.0, 137.0, 159.0, 258.0, 349.0, 480.0, 708.0, 1029.0, 1447.0, 2184.0, 3265.0, 4768.0, 7355.0, 11619.0, 18579.0, 31298.0, 54297.0, 101123.0, 212807.0, 605897.0, 1699719.0, 868172.0, 277942.0, 124215.0, 65780.0, 37662.0, 22165.0, 13866.0, 8837.0, 5629.0, 3728.0, 2621.0, 1725.0, 1258.0, 874.0, 588.0, 421.0, 317.0, 217.0, 148.0, 96.0, 87.0, 60.0, 36.0, 27.0, 18.0, 17.0, 7.0, 8.0, 4.0, 1.0, 2.0], "bins": [-2.22265625, -2.154571533203125, -2.08648681640625, -2.018402099609375, -1.9503173828125, -1.882232666015625, -1.81414794921875, -1.746063232421875, -1.677978515625, -1.609893798828125, -1.54180908203125, -1.473724365234375, -1.4056396484375, -1.337554931640625, -1.26947021484375, -1.201385498046875, -1.13330078125, -1.065216064453125, -0.99713134765625, -0.929046630859375, -0.8609619140625, -0.792877197265625, -0.72479248046875, -0.656707763671875, -0.588623046875, -0.520538330078125, -0.45245361328125, -0.384368896484375, -0.3162841796875, -0.248199462890625, -0.18011474609375, -0.112030029296875, -0.0439453125, 0.024139404296875, 0.09222412109375, 0.160308837890625, 0.2283935546875, 0.296478271484375, 0.36456298828125, 0.432647705078125, 0.500732421875, 0.568817138671875, 0.63690185546875, 0.704986572265625, 0.7730712890625, 0.841156005859375, 0.90924072265625, 0.977325439453125, 1.04541015625, 1.113494873046875, 1.18157958984375, 1.249664306640625, 1.3177490234375, 1.385833740234375, 1.45391845703125, 1.522003173828125, 1.590087890625, 1.658172607421875, 1.72625732421875, 1.794342041015625, 1.8624267578125, 1.930511474609375, 1.99859619140625, 2.066680908203125, 2.134765625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 8.0, 9.0, 14.0, 16.0, 26.0, 25.0, 26.0, 27.0, 41.0, 40.0, 32.0, 49.0, 51.0, 48.0, 55.0, 50.0, 44.0, 55.0, 33.0, 42.0, 43.0, 38.0, 38.0, 22.0, 34.0, 21.0, 19.0, 16.0, 18.0, 15.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.13671875, -1.0979766845703125, -1.059234619140625, -1.0204925537109375, -0.98175048828125, -0.9430084228515625, -0.904266357421875, -0.8655242919921875, -0.8267822265625, -0.7880401611328125, -0.749298095703125, -0.7105560302734375, -0.67181396484375, -0.6330718994140625, -0.594329833984375, -0.5555877685546875, -0.516845703125, -0.4781036376953125, -0.439361572265625, -0.4006195068359375, -0.36187744140625, -0.3231353759765625, -0.284393310546875, -0.2456512451171875, -0.2069091796875, -0.1681671142578125, -0.129425048828125, -0.0906829833984375, -0.05194091796875, -0.0131988525390625, 0.025543212890625, 0.0642852783203125, 0.10302734375, 0.1417694091796875, 0.180511474609375, 0.2192535400390625, 0.25799560546875, 0.2967376708984375, 0.335479736328125, 0.3742218017578125, 0.4129638671875, 0.4517059326171875, 0.490447998046875, 0.5291900634765625, 0.56793212890625, 0.6066741943359375, 0.645416259765625, 0.6841583251953125, 0.722900390625, 0.7616424560546875, 0.800384521484375, 0.8391265869140625, 0.87786865234375, 0.9166107177734375, 0.955352783203125, 0.9940948486328125, 1.0328369140625, 1.0715789794921875, 1.110321044921875, 1.1490631103515625, 1.18780517578125, 1.2265472412109375, 1.265289306640625, 1.3040313720703125, 1.3427734375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 12.0, 25.0, 17.0, 17.0, 46.0, 65.0, 117.0, 162.0, 251.0, 337.0, 578.0, 927.0, 1386.0, 2280.0, 3659.0, 5988.0, 9990.0, 17630.0, 31684.0, 61906.0, 129096.0, 298136.0, 848524.0, 1716353.0, 614133.0, 232143.0, 103846.0, 50775.0, 26718.0, 15022.0, 8732.0, 5195.0, 3181.0, 1829.0, 1255.0, 794.0, 495.0, 338.0, 235.0, 129.0, 75.0, 69.0, 48.0, 28.0, 27.0, 7.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.19921875, -2.131256103515625, -2.06329345703125, -1.995330810546875, -1.9273681640625, -1.859405517578125, -1.79144287109375, -1.723480224609375, -1.655517578125, -1.587554931640625, -1.51959228515625, -1.451629638671875, -1.3836669921875, -1.315704345703125, -1.24774169921875, -1.179779052734375, -1.11181640625, -1.043853759765625, -0.97589111328125, -0.907928466796875, -0.8399658203125, -0.772003173828125, -0.70404052734375, -0.636077880859375, -0.568115234375, -0.500152587890625, -0.43218994140625, -0.364227294921875, -0.2962646484375, -0.228302001953125, -0.16033935546875, -0.092376708984375, -0.0244140625, 0.043548583984375, 0.11151123046875, 0.179473876953125, 0.2474365234375, 0.315399169921875, 0.38336181640625, 0.451324462890625, 0.519287109375, 0.587249755859375, 0.65521240234375, 0.723175048828125, 0.7911376953125, 0.859100341796875, 0.92706298828125, 0.995025634765625, 1.06298828125, 1.130950927734375, 1.19891357421875, 1.266876220703125, 1.3348388671875, 1.402801513671875, 1.47076416015625, 1.538726806640625, 1.606689453125, 1.674652099609375, 1.74261474609375, 1.810577392578125, 1.8785400390625, 1.946502685546875, 2.01446533203125, 2.082427978515625, 2.150390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 10.0, 10.0, 13.0, 10.0, 12.0, 22.0, 21.0, 37.0, 37.0, 46.0, 67.0, 88.0, 79.0, 118.0, 163.0, 182.0, 179.0, 220.0, 252.0, 292.0, 292.0, 285.0, 269.0, 239.0, 198.0, 182.0, 151.0, 127.0, 119.0, 75.0, 57.0, 40.0, 39.0, 25.0, 21.0, 21.0, 8.0, 19.0, 10.0, 10.0, 4.0, 4.0, 12.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6044921875, -0.58612060546875, -0.5677490234375, -0.54937744140625, -0.531005859375, -0.51263427734375, -0.4942626953125, -0.47589111328125, -0.45751953125, -0.43914794921875, -0.4207763671875, -0.40240478515625, -0.384033203125, -0.36566162109375, -0.3472900390625, -0.32891845703125, -0.310546875, -0.29217529296875, -0.2738037109375, -0.25543212890625, -0.237060546875, -0.21868896484375, -0.2003173828125, -0.18194580078125, -0.16357421875, -0.14520263671875, -0.1268310546875, -0.10845947265625, -0.090087890625, -0.07171630859375, -0.0533447265625, -0.03497314453125, -0.0166015625, 0.00177001953125, 0.0201416015625, 0.03851318359375, 0.056884765625, 0.07525634765625, 0.0936279296875, 0.11199951171875, 0.13037109375, 0.14874267578125, 0.1671142578125, 0.18548583984375, 0.203857421875, 0.22222900390625, 0.2406005859375, 0.25897216796875, 0.27734375, 0.29571533203125, 0.3140869140625, 0.33245849609375, 0.350830078125, 0.36920166015625, 0.3875732421875, 0.40594482421875, 0.42431640625, 0.44268798828125, 0.4610595703125, 0.47943115234375, 0.497802734375, 0.51617431640625, 0.5345458984375, 0.55291748046875, 0.5712890625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 5.0, 3.0, 10.0, 9.0, 13.0, 15.0, 28.0, 31.0, 37.0, 84.0, 86.0, 127.0, 143.0, 109.0, 68.0, 56.0, 48.0, 35.0, 22.0, 15.0, 15.0, 12.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5276777744293213, -2.4601409435272217, -2.392603874206543, -2.3250670433044434, -2.2575302124023438, -2.189993143081665, -2.1224563121795654, -2.0549192428588867, -1.987382411956787, -1.919845461845398, -1.8523085117340088, -1.7847716808319092, -1.71723473072052, -1.6496977806091309, -1.5821609497070312, -1.514623999595642, -1.447087049484253, -1.3795500993728638, -1.3120131492614746, -1.244476318359375, -1.1769393682479858, -1.1094024181365967, -1.041865587234497, -0.9743286371231079, -0.9067916870117188, -0.8392547369003296, -0.7717178463935852, -0.7041809558868408, -0.6366440057754517, -0.5691070556640625, -0.5015701651573181, -0.43403324484825134, -0.36649632453918457, -0.2989594042301178, -0.23142248392105103, -0.16388556361198425, -0.09634864330291748, -0.028811722993850708, 0.038725197315216064, 0.10626211762428284, 0.1737990379333496, 0.24133595824241638, 0.30887287855148315, 0.3764097988605499, 0.4439467191696167, 0.5114836692810059, 0.5790205597877502, 0.6465574502944946, 0.7140944004058838, 0.781631350517273, 0.8491682410240173, 0.9167051315307617, 0.9842420816421509, 1.05177903175354, 1.1193158626556396, 1.1868528127670288, 1.254389762878418, 1.3219267129898071, 1.3894636631011963, 1.457000494003296, 1.524537444114685, 1.5920743942260742, 1.6596112251281738, 1.727148175239563, 1.7946851253509521]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 10.0, 4.0, 12.0, 5.0, 16.0, 18.0, 17.0, 28.0, 20.0, 37.0, 28.0, 31.0, 37.0, 37.0, 30.0, 38.0, 41.0, 39.0, 37.0, 45.0, 49.0, 41.0, 40.0, 54.0, 33.0, 35.0, 27.0, 24.0, 29.0, 22.0, 22.0, 16.0, 13.0, 11.0, 11.0, 9.0, 10.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1917500495910645, -1.1529874801635742, -1.114224910736084, -1.0754623413085938, -1.036699652671814, -0.9979370832443237, -0.9591745138168335, -0.9204119443893433, -0.881649374961853, -0.8428868055343628, -0.8041241765022278, -0.7653616070747375, -0.7265990376472473, -0.6878364086151123, -0.6490738391876221, -0.6103112697601318, -0.5715486407279968, -0.5327860713005066, -0.49402347207069397, -0.45526087284088135, -0.4164983034133911, -0.3777357041835785, -0.33897310495376587, -0.30021053552627563, -0.261447936296463, -0.22268535196781158, -0.18392276763916016, -0.14516016840934753, -0.1063975840806961, -0.06763499975204468, -0.028872400522232056, 0.009890168905258179, 0.0486527681350708, 0.08741535246372223, 0.12617793679237366, 0.16494053602218628, 0.2037031203508377, 0.24246570467948914, 0.28122830390930176, 0.319990873336792, 0.3587534725666046, 0.39751607179641724, 0.43627864122390747, 0.4750412404537201, 0.5138038396835327, 0.552566409111023, 0.5913289785385132, 0.6300915479660034, 0.6688541769981384, 0.7076167464256287, 0.7463793754577637, 0.7851419448852539, 0.8239045143127441, 0.8626670837402344, 0.9014297127723694, 0.9401922821998596, 0.9789549112319946, 1.0177174806594849, 1.056480050086975, 1.0952427387237549, 1.1340053081512451, 1.1727678775787354, 1.2115304470062256, 1.2502930164337158, 1.289055585861206]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 8.0, 13.0, 12.0, 15.0, 33.0, 33.0, 56.0, 61.0, 83.0, 137.0, 199.0, 251.0, 371.0, 521.0, 794.0, 1133.0, 1664.0, 2431.0, 3629.0, 5737.0, 9051.0, 14898.0, 26272.0, 50101.0, 106052.0, 292051.0, 303335.0, 109712.0, 51104.0, 26929.0, 15180.0, 9283.0, 5807.0, 3666.0, 2453.0, 1679.0, 1170.0, 797.0, 543.0, 357.0, 276.0, 180.0, 149.0, 104.0, 64.0, 50.0, 43.0, 19.0, 23.0, 12.0, 11.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.86083984375, -0.833953857421875, -0.80706787109375, -0.780181884765625, -0.7532958984375, -0.726409912109375, -0.69952392578125, -0.672637939453125, -0.645751953125, -0.618865966796875, -0.59197998046875, -0.565093994140625, -0.5382080078125, -0.511322021484375, -0.48443603515625, -0.457550048828125, -0.4306640625, -0.403778076171875, -0.37689208984375, -0.350006103515625, -0.3231201171875, -0.296234130859375, -0.26934814453125, -0.242462158203125, -0.215576171875, -0.188690185546875, -0.16180419921875, -0.134918212890625, -0.1080322265625, -0.081146240234375, -0.05426025390625, -0.027374267578125, -0.00048828125, 0.026397705078125, 0.05328369140625, 0.080169677734375, 0.1070556640625, 0.133941650390625, 0.16082763671875, 0.187713623046875, 0.214599609375, 0.241485595703125, 0.26837158203125, 0.295257568359375, 0.3221435546875, 0.349029541015625, 0.37591552734375, 0.402801513671875, 0.4296875, 0.456573486328125, 0.48345947265625, 0.510345458984375, 0.5372314453125, 0.564117431640625, 0.59100341796875, 0.617889404296875, 0.644775390625, 0.671661376953125, 0.69854736328125, 0.725433349609375, 0.7523193359375, 0.779205322265625, 0.80609130859375, 0.832977294921875, 0.85986328125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 9.0, 15.0, 19.0, 21.0, 32.0, 20.0, 35.0, 26.0, 35.0, 34.0, 38.0, 36.0, 36.0, 42.0, 41.0, 37.0, 32.0, 40.0, 47.0, 56.0, 54.0, 32.0, 30.0, 28.0, 20.0, 15.0, 33.0, 21.0, 9.0, 15.0, 15.0, 9.0, 9.0, 5.0, 10.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2783203125, -1.2391815185546875, -1.200042724609375, -1.1609039306640625, -1.12176513671875, -1.0826263427734375, -1.043487548828125, -1.0043487548828125, -0.9652099609375, -0.9260711669921875, -0.886932373046875, -0.8477935791015625, -0.80865478515625, -0.7695159912109375, -0.730377197265625, -0.6912384033203125, -0.652099609375, -0.6129608154296875, -0.573822021484375, -0.5346832275390625, -0.49554443359375, -0.4564056396484375, -0.417266845703125, -0.3781280517578125, -0.3389892578125, -0.2998504638671875, -0.260711669921875, -0.2215728759765625, -0.18243408203125, -0.1432952880859375, -0.104156494140625, -0.0650177001953125, -0.02587890625, 0.0132598876953125, 0.052398681640625, 0.0915374755859375, 0.13067626953125, 0.1698150634765625, 0.208953857421875, 0.2480926513671875, 0.2872314453125, 0.3263702392578125, 0.365509033203125, 0.4046478271484375, 0.44378662109375, 0.4829254150390625, 0.522064208984375, 0.5612030029296875, 0.600341796875, 0.6394805908203125, 0.678619384765625, 0.7177581787109375, 0.75689697265625, 0.7960357666015625, 0.835174560546875, 0.8743133544921875, 0.9134521484375, 0.9525909423828125, 0.991729736328125, 1.0308685302734375, 1.07000732421875, 1.1091461181640625, 1.148284912109375, 1.1874237060546875, 1.2265625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 10.0, 13.0, 9.0, 16.0, 32.0, 27.0, 46.0, 51.0, 86.0, 132.0, 138.0, 198.0, 293.0, 376.0, 504.0, 721.0, 1030.0, 1518.0, 2237.0, 3570.0, 5624.0, 9783.0, 19005.0, 49854.0, 360736.0, 486960.0, 56983.0, 20651.0, 10572.0, 6021.0, 3669.0, 2383.0, 1542.0, 1085.0, 744.0, 508.0, 365.0, 283.0, 201.0, 157.0, 122.0, 81.0, 61.0, 45.0, 31.0, 27.0, 14.0, 11.0, 10.0, 13.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.3671875, -1.3258209228515625, -1.284454345703125, -1.2430877685546875, -1.20172119140625, -1.1603546142578125, -1.118988037109375, -1.0776214599609375, -1.0362548828125, -0.9948883056640625, -0.953521728515625, -0.9121551513671875, -0.87078857421875, -0.8294219970703125, -0.788055419921875, -0.7466888427734375, -0.705322265625, -0.6639556884765625, -0.622589111328125, -0.5812225341796875, -0.53985595703125, -0.4984893798828125, -0.457122802734375, -0.4157562255859375, -0.3743896484375, -0.3330230712890625, -0.291656494140625, -0.2502899169921875, -0.20892333984375, -0.1675567626953125, -0.126190185546875, -0.0848236083984375, -0.04345703125, -0.0020904541015625, 0.039276123046875, 0.0806427001953125, 0.12200927734375, 0.1633758544921875, 0.204742431640625, 0.2461090087890625, 0.2874755859375, 0.3288421630859375, 0.370208740234375, 0.4115753173828125, 0.45294189453125, 0.4943084716796875, 0.535675048828125, 0.5770416259765625, 0.618408203125, 0.6597747802734375, 0.701141357421875, 0.7425079345703125, 0.78387451171875, 0.8252410888671875, 0.866607666015625, 0.9079742431640625, 0.9493408203125, 0.9907073974609375, 1.032073974609375, 1.0734405517578125, 1.11480712890625, 1.1561737060546875, 1.197540283203125, 1.2389068603515625, 1.2802734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 6.0, 11.0, 12.0, 11.0, 17.0, 15.0, 17.0, 17.0, 21.0, 26.0, 35.0, 25.0, 34.0, 40.0, 40.0, 34.0, 47.0, 50.0, 48.0, 52.0, 36.0, 47.0, 39.0, 44.0, 35.0, 27.0, 38.0, 26.0, 25.0, 22.0, 19.0, 11.0, 15.0, 16.0, 5.0, 9.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8162841796875, -0.789306640625, -0.7623291015625, -0.7353515625, -0.7083740234375, -0.681396484375, -0.6544189453125, -0.62744140625, -0.6004638671875, -0.573486328125, -0.5465087890625, -0.51953125, -0.4925537109375, -0.465576171875, -0.4385986328125, -0.41162109375, -0.3846435546875, -0.357666015625, -0.3306884765625, -0.3037109375, -0.2767333984375, -0.249755859375, -0.2227783203125, -0.19580078125, -0.1688232421875, -0.141845703125, -0.1148681640625, -0.087890625, -0.0609130859375, -0.033935546875, -0.0069580078125, 0.02001953125, 0.0469970703125, 0.073974609375, 0.1009521484375, 0.1279296875, 0.1549072265625, 0.181884765625, 0.2088623046875, 0.23583984375, 0.2628173828125, 0.289794921875, 0.3167724609375, 0.34375, 0.3707275390625, 0.397705078125, 0.4246826171875, 0.45166015625, 0.4786376953125, 0.505615234375, 0.5325927734375, 0.5595703125, 0.5865478515625, 0.613525390625, 0.6405029296875, 0.66748046875, 0.6944580078125, 0.721435546875, 0.7484130859375, 0.775390625, 0.8023681640625, 0.829345703125, 0.8563232421875, 0.88330078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 10.0, 7.0, 12.0, 9.0, 22.0, 24.0, 24.0, 25.0, 49.0, 68.0, 69.0, 105.0, 126.0, 161.0, 212.0, 265.0, 414.0, 647.0, 961.0, 1503.0, 2651.0, 4801.0, 9487.0, 23553.0, 86463.0, 696818.0, 159159.0, 33951.0, 12296.0, 5824.0, 3222.0, 1843.0, 1168.0, 754.0, 527.0, 334.0, 239.0, 173.0, 127.0, 115.0, 73.0, 72.0, 57.0, 32.0, 20.0, 25.0, 20.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34716796875, -0.335845947265625, -0.32452392578125, -0.313201904296875, -0.3018798828125, -0.290557861328125, -0.27923583984375, -0.267913818359375, -0.256591796875, -0.245269775390625, -0.23394775390625, -0.222625732421875, -0.2113037109375, -0.199981689453125, -0.18865966796875, -0.177337646484375, -0.166015625, -0.154693603515625, -0.14337158203125, -0.132049560546875, -0.1207275390625, -0.109405517578125, -0.09808349609375, -0.086761474609375, -0.075439453125, -0.064117431640625, -0.05279541015625, -0.041473388671875, -0.0301513671875, -0.018829345703125, -0.00750732421875, 0.003814697265625, 0.01513671875, 0.026458740234375, 0.03778076171875, 0.049102783203125, 0.0604248046875, 0.071746826171875, 0.08306884765625, 0.094390869140625, 0.105712890625, 0.117034912109375, 0.12835693359375, 0.139678955078125, 0.1510009765625, 0.162322998046875, 0.17364501953125, 0.184967041015625, 0.1962890625, 0.207611083984375, 0.21893310546875, 0.230255126953125, 0.2415771484375, 0.252899169921875, 0.26422119140625, 0.275543212890625, 0.286865234375, 0.298187255859375, 0.30950927734375, 0.320831298828125, 0.3321533203125, 0.343475341796875, 0.35479736328125, 0.366119384765625, 0.37744140625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 7.0, 5.0, 17.0, 10.0, 18.0, 35.0, 43.0, 41.0, 57.0, 97.0, 123.0, 117.0, 112.0, 79.0, 57.0, 51.0, 22.0, 23.0, 15.0, 19.0, 11.0, 8.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8417835235595703e-05, -1.792237162590027e-05, -1.7426908016204834e-05, -1.69314444065094e-05, -1.6435980796813965e-05, -1.594051718711853e-05, -1.5445053577423096e-05, -1.4949589967727661e-05, -1.4454126358032227e-05, -1.3958662748336792e-05, -1.3463199138641357e-05, -1.2967735528945923e-05, -1.2472271919250488e-05, -1.1976808309555054e-05, -1.1481344699859619e-05, -1.0985881090164185e-05, -1.049041748046875e-05, -9.994953870773315e-06, -9.499490261077881e-06, -9.004026651382446e-06, -8.508563041687012e-06, -8.013099431991577e-06, -7.517635822296143e-06, -7.022172212600708e-06, -6.5267086029052734e-06, -6.031244993209839e-06, -5.535781383514404e-06, -5.04031777381897e-06, -4.544854164123535e-06, -4.049390554428101e-06, -3.553926944732666e-06, -3.0584633350372314e-06, -2.562999725341797e-06, -2.0675361156463623e-06, -1.5720725059509277e-06, -1.0766088962554932e-06, -5.811452865600586e-07, -8.568167686462402e-08, 4.0978193283081055e-07, 9.052455425262451e-07, 1.4007091522216797e-06, 1.8961727619171143e-06, 2.391636371612549e-06, 2.8870999813079834e-06, 3.382563591003418e-06, 3.8780272006988525e-06, 4.373490810394287e-06, 4.868954420089722e-06, 5.364418029785156e-06, 5.859881639480591e-06, 6.355345249176025e-06, 6.85080885887146e-06, 7.3462724685668945e-06, 7.841736078262329e-06, 8.337199687957764e-06, 8.832663297653198e-06, 9.328126907348633e-06, 9.823590517044067e-06, 1.0319054126739502e-05, 1.0814517736434937e-05, 1.1309981346130371e-05, 1.1805444955825806e-05, 1.230090856552124e-05, 1.2796372175216675e-05, 1.329183578491211e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 6.0, 5.0, 5.0, 13.0, 11.0, 18.0, 39.0, 39.0, 62.0, 84.0, 129.0, 177.0, 298.0, 446.0, 801.0, 1568.0, 3383.0, 9346.0, 33801.0, 203319.0, 684626.0, 81059.0, 18471.0, 5707.0, 2314.0, 1115.0, 579.0, 393.0, 221.0, 144.0, 120.0, 64.0, 68.0, 41.0, 25.0, 15.0, 12.0, 10.0, 8.0, 0.0, 4.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5597915649414062, -0.5399932861328125, -0.5201950073242188, -0.500396728515625, -0.48059844970703125, -0.4608001708984375, -0.44100189208984375, -0.42120361328125, -0.40140533447265625, -0.3816070556640625, -0.36180877685546875, -0.342010498046875, -0.32221221923828125, -0.3024139404296875, -0.28261566162109375, -0.2628173828125, -0.24301910400390625, -0.2232208251953125, -0.20342254638671875, -0.183624267578125, -0.16382598876953125, -0.1440277099609375, -0.12422943115234375, -0.10443115234375, -0.08463287353515625, -0.0648345947265625, -0.04503631591796875, -0.025238037109375, -0.00543975830078125, 0.0143585205078125, 0.03415679931640625, 0.053955078125, 0.07375335693359375, 0.0935516357421875, 0.11334991455078125, 0.133148193359375, 0.15294647216796875, 0.1727447509765625, 0.19254302978515625, 0.21234130859375, 0.23213958740234375, 0.2519378662109375, 0.27173614501953125, 0.291534423828125, 0.31133270263671875, 0.3311309814453125, 0.35092926025390625, 0.3707275390625, 0.39052581787109375, 0.4103240966796875, 0.43012237548828125, 0.449920654296875, 0.46971893310546875, 0.4895172119140625, 0.5093154907226562, 0.52911376953125, 0.5489120483398438, 0.5687103271484375, 0.5885086059570312, 0.608306884765625, 0.6281051635742188, 0.6479034423828125, 0.6677017211914062, 0.6875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 6.0, 12.0, 15.0, 20.0, 22.0, 43.0, 60.0, 110.0, 134.0, 163.0, 138.0, 96.0, 62.0, 33.0, 28.0, 15.0, 10.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0941162109375, -0.09009170532226562, -0.08606719970703125, -0.08204269409179688, -0.0780181884765625, -0.07399368286132812, -0.06996917724609375, -0.06594467163085938, -0.061920166015625, -0.057895660400390625, -0.05387115478515625, -0.049846649169921875, -0.0458221435546875, -0.041797637939453125, -0.03777313232421875, -0.033748626708984375, -0.02972412109375, -0.025699615478515625, -0.02167510986328125, -0.017650604248046875, -0.0136260986328125, -0.009601593017578125, -0.00557708740234375, -0.001552581787109375, 0.002471923828125, 0.006496429443359375, 0.01052093505859375, 0.014545440673828125, 0.0185699462890625, 0.022594451904296875, 0.02661895751953125, 0.030643463134765625, 0.03466796875, 0.038692474365234375, 0.04271697998046875, 0.046741485595703125, 0.0507659912109375, 0.054790496826171875, 0.05881500244140625, 0.06283950805664062, 0.066864013671875, 0.07088851928710938, 0.07491302490234375, 0.07893753051757812, 0.0829620361328125, 0.08698654174804688, 0.09101104736328125, 0.09503555297851562, 0.09906005859375, 0.10308456420898438, 0.10710906982421875, 0.11113357543945312, 0.1151580810546875, 0.11918258666992188, 0.12320709228515625, 0.12723159790039062, 0.131256103515625, 0.13528060913085938, 0.13930511474609375, 0.14332962036132812, 0.1473541259765625, 0.15137863159179688, 0.15540313720703125, 0.15942764282226562, 0.1634521484375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 12.0, 5.0, 10.0, 17.0, 16.0, 32.0, 34.0, 61.0, 100.0, 110.0, 143.0, 111.0, 95.0, 61.0, 49.0, 39.0, 25.0, 19.0, 13.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4162213802337646, -2.348500967025757, -2.28078031539917, -2.213059902191162, -2.145339250564575, -2.0776188373565674, -2.0098981857299805, -1.9421777725219727, -1.8744572401046753, -1.806736707687378, -1.7390161752700806, -1.6712956428527832, -1.6035752296447754, -1.5358545780181885, -1.4681341648101807, -1.4004136323928833, -1.332693099975586, -1.2649725675582886, -1.1972520351409912, -1.1295315027236938, -1.0618109703063965, -0.9940904974937439, -0.9263700246810913, -0.858649492263794, -0.7909289598464966, -0.7232084274291992, -0.6554878950119019, -0.5877674221992493, -0.5200468897819519, -0.45232635736465454, -0.38460585474967957, -0.3168853521347046, -0.24916470050811768, -0.1814441829919815, -0.11372366547584534, -0.04600314795970917, 0.021717369556427002, 0.08943790197372437, 0.15715840458869934, 0.22487890720367432, 0.2925994396209717, 0.36031997203826904, 0.428040474653244, 0.495760977268219, 0.5634815096855164, 0.6312020421028137, 0.6989225149154663, 0.7666430473327637, 0.834363579750061, 0.9020841121673584, 0.9698046445846558, 1.0375251770019531, 1.105245590209961, 1.1729662418365479, 1.2406866550445557, 1.308407187461853, 1.3761277198791504, 1.4438482522964478, 1.5115687847137451, 1.5792893171310425, 1.6470098495483398, 1.7147302627563477, 1.782450795173645, 1.8501713275909424, 1.9178918600082397]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 11.0, 7.0, 6.0, 9.0, 12.0, 18.0, 16.0, 16.0, 27.0, 32.0, 32.0, 25.0, 36.0, 38.0, 34.0, 28.0, 40.0, 40.0, 43.0, 32.0, 48.0, 44.0, 42.0, 46.0, 48.0, 34.0, 26.0, 28.0, 28.0, 23.0, 25.0, 25.0, 15.0, 10.0, 12.0, 11.0, 7.0, 8.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1591284275054932, -1.121032476425171, -1.0829365253448486, -1.0448405742645264, -1.006744623184204, -0.9686486124992371, -0.93055260181427, -0.8924566507339478, -0.8543606996536255, -0.8162647485733032, -0.778168797492981, -0.7400727868080139, -0.7019768357276917, -0.6638808846473694, -0.6257848739624023, -0.5876889228820801, -0.5495929718017578, -0.5114970207214355, -0.4734010398387909, -0.43530505895614624, -0.397209107875824, -0.3591131567955017, -0.32101717591285706, -0.2829211950302124, -0.24482524394989014, -0.20672927796840668, -0.16863331198692322, -0.13053734600543976, -0.0924413800239563, -0.05434541404247284, -0.01624944806098938, 0.021846532821655273, 0.05994248390197754, 0.098038449883461, 0.13613441586494446, 0.17423038184642792, 0.21232634782791138, 0.25042229890823364, 0.2885182797908783, 0.32661426067352295, 0.3647102117538452, 0.4028061628341675, 0.44090214371681213, 0.4789981245994568, 0.517094075679779, 0.5551900267601013, 0.5932860374450684, 0.6313819885253906, 0.6694779396057129, 0.7075738906860352, 0.7456698417663574, 0.7837658524513245, 0.8218618035316467, 0.859957754611969, 0.898053765296936, 0.9361497163772583, 0.9742456674575806, 1.0123416185379028, 1.050437569618225, 1.0885335206985474, 1.1266295909881592, 1.1647255420684814, 1.2028214931488037, 1.240917444229126, 1.2790133953094482]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 10.0, 9.0, 15.0, 18.0, 36.0, 62.0, 58.0, 111.0, 158.0, 228.0, 345.0, 421.0, 657.0, 967.0, 1480.0, 2324.0, 3495.0, 5317.0, 8358.0, 13567.0, 22208.0, 37573.0, 66518.0, 124107.0, 233914.0, 235643.0, 125636.0, 67299.0, 37870.0, 22287.0, 13502.0, 8553.0, 5281.0, 3532.0, 2309.0, 1468.0, 1025.0, 698.0, 458.0, 329.0, 212.0, 138.0, 108.0, 69.0, 59.0, 40.0, 26.0, 16.0, 9.0, 14.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0], "bins": [-2.064453125, -2.0019073486328125, -1.939361572265625, -1.8768157958984375, -1.81427001953125, -1.7517242431640625, -1.689178466796875, -1.6266326904296875, -1.5640869140625, -1.5015411376953125, -1.438995361328125, -1.3764495849609375, -1.31390380859375, -1.2513580322265625, -1.188812255859375, -1.1262664794921875, -1.063720703125, -1.0011749267578125, -0.938629150390625, -0.8760833740234375, -0.81353759765625, -0.7509918212890625, -0.688446044921875, -0.6259002685546875, -0.5633544921875, -0.5008087158203125, -0.438262939453125, -0.3757171630859375, -0.31317138671875, -0.2506256103515625, -0.188079833984375, -0.1255340576171875, -0.06298828125, -0.0004425048828125, 0.062103271484375, 0.1246490478515625, 0.18719482421875, 0.2497406005859375, 0.312286376953125, 0.3748321533203125, 0.4373779296875, 0.4999237060546875, 0.562469482421875, 0.6250152587890625, 0.68756103515625, 0.7501068115234375, 0.812652587890625, 0.8751983642578125, 0.937744140625, 1.0002899169921875, 1.062835693359375, 1.1253814697265625, 1.18792724609375, 1.2504730224609375, 1.313018798828125, 1.3755645751953125, 1.4381103515625, 1.5006561279296875, 1.563201904296875, 1.6257476806640625, 1.68829345703125, 1.7508392333984375, 1.813385009765625, 1.8759307861328125, 1.9384765625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 10.0, 11.0, 12.0, 7.0, 11.0, 17.0, 23.0, 32.0, 20.0, 33.0, 32.0, 32.0, 37.0, 38.0, 45.0, 35.0, 46.0, 50.0, 51.0, 31.0, 44.0, 49.0, 52.0, 38.0, 38.0, 19.0, 36.0, 27.0, 29.0, 15.0, 13.0, 13.0, 15.0, 10.0, 9.0, 7.0, 7.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0394744873046875, -1.003753662109375, -0.9680328369140625, -0.93231201171875, -0.8965911865234375, -0.860870361328125, -0.8251495361328125, -0.7894287109375, -0.7537078857421875, -0.717987060546875, -0.6822662353515625, -0.64654541015625, -0.6108245849609375, -0.575103759765625, -0.5393829345703125, -0.503662109375, -0.4679412841796875, -0.432220458984375, -0.3964996337890625, -0.36077880859375, -0.3250579833984375, -0.289337158203125, -0.2536163330078125, -0.2178955078125, -0.1821746826171875, -0.146453857421875, -0.1107330322265625, -0.07501220703125, -0.0392913818359375, -0.003570556640625, 0.0321502685546875, 0.06787109375, 0.1035919189453125, 0.139312744140625, 0.1750335693359375, 0.21075439453125, 0.2464752197265625, 0.282196044921875, 0.3179168701171875, 0.3536376953125, 0.3893585205078125, 0.425079345703125, 0.4608001708984375, 0.49652099609375, 0.5322418212890625, 0.567962646484375, 0.6036834716796875, 0.639404296875, 0.6751251220703125, 0.710845947265625, 0.7465667724609375, 0.78228759765625, 0.8180084228515625, 0.853729248046875, 0.8894500732421875, 0.9251708984375, 0.9608917236328125, 0.996612548828125, 1.0323333740234375, 1.06805419921875, 1.1037750244140625, 1.139495849609375, 1.1752166748046875, 1.2109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 9.0, 5.0, 12.0, 28.0, 32.0, 47.0, 70.0, 71.0, 120.0, 182.0, 265.0, 377.0, 581.0, 894.0, 1391.0, 2054.0, 3229.0, 5229.0, 8403.0, 14660.0, 26131.0, 48092.0, 94133.0, 187710.0, 288264.0, 174097.0, 87475.0, 44805.0, 24540.0, 13844.0, 7987.0, 4895.0, 3094.0, 1919.0, 1278.0, 862.0, 582.0, 387.0, 248.0, 186.0, 111.0, 80.0, 62.0, 35.0, 23.0, 27.0, 10.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.13671875, -2.07086181640625, -2.0050048828125, -1.93914794921875, -1.873291015625, -1.80743408203125, -1.7415771484375, -1.67572021484375, -1.60986328125, -1.54400634765625, -1.4781494140625, -1.41229248046875, -1.346435546875, -1.28057861328125, -1.2147216796875, -1.14886474609375, -1.0830078125, -1.01715087890625, -0.9512939453125, -0.88543701171875, -0.819580078125, -0.75372314453125, -0.6878662109375, -0.62200927734375, -0.55615234375, -0.49029541015625, -0.4244384765625, -0.35858154296875, -0.292724609375, -0.22686767578125, -0.1610107421875, -0.09515380859375, -0.029296875, 0.03656005859375, 0.1024169921875, 0.16827392578125, 0.234130859375, 0.29998779296875, 0.3658447265625, 0.43170166015625, 0.49755859375, 0.56341552734375, 0.6292724609375, 0.69512939453125, 0.760986328125, 0.82684326171875, 0.8927001953125, 0.95855712890625, 1.0244140625, 1.09027099609375, 1.1561279296875, 1.22198486328125, 1.287841796875, 1.35369873046875, 1.4195556640625, 1.48541259765625, 1.55126953125, 1.61712646484375, 1.6829833984375, 1.74884033203125, 1.814697265625, 1.88055419921875, 1.9464111328125, 2.01226806640625, 2.078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 8.0, 13.0, 17.0, 16.0, 18.0, 18.0, 17.0, 22.0, 31.0, 37.0, 37.0, 40.0, 32.0, 49.0, 41.0, 45.0, 40.0, 29.0, 43.0, 46.0, 43.0, 28.0, 39.0, 40.0, 39.0, 18.0, 22.0, 10.0, 22.0, 16.0, 17.0, 17.0, 15.0, 6.0, 7.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67333984375, -0.6524810791015625, -0.631622314453125, -0.6107635498046875, -0.58990478515625, -0.5690460205078125, -0.548187255859375, -0.5273284912109375, -0.5064697265625, -0.4856109619140625, -0.464752197265625, -0.4438934326171875, -0.42303466796875, -0.4021759033203125, -0.381317138671875, -0.3604583740234375, -0.339599609375, -0.3187408447265625, -0.297882080078125, -0.2770233154296875, -0.25616455078125, -0.2353057861328125, -0.214447021484375, -0.1935882568359375, -0.1727294921875, -0.1518707275390625, -0.131011962890625, -0.1101531982421875, -0.08929443359375, -0.0684356689453125, -0.047576904296875, -0.0267181396484375, -0.005859375, 0.0149993896484375, 0.035858154296875, 0.0567169189453125, 0.07757568359375, 0.0984344482421875, 0.119293212890625, 0.1401519775390625, 0.1610107421875, 0.1818695068359375, 0.202728271484375, 0.2235870361328125, 0.24444580078125, 0.2653045654296875, 0.286163330078125, 0.3070220947265625, 0.327880859375, 0.3487396240234375, 0.369598388671875, 0.3904571533203125, 0.41131591796875, 0.4321746826171875, 0.453033447265625, 0.4738922119140625, 0.4947509765625, 0.5156097412109375, 0.536468505859375, 0.5573272705078125, 0.57818603515625, 0.5990447998046875, 0.619903564453125, 0.6407623291015625, 0.66162109375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 12.0, 16.0, 16.0, 22.0, 41.0, 40.0, 55.0, 82.0, 120.0, 136.0, 204.0, 314.0, 476.0, 629.0, 931.0, 1464.0, 2310.0, 3865.0, 6961.0, 13487.0, 29605.0, 81226.0, 705160.0, 124056.0, 39279.0, 17107.0, 8492.0, 4572.0, 2723.0, 1669.0, 1066.0, 708.0, 470.0, 351.0, 240.0, 168.0, 151.0, 79.0, 72.0, 48.0, 26.0, 18.0, 31.0, 12.0, 14.0, 7.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.818359375, -1.7626800537109375, -1.707000732421875, -1.6513214111328125, -1.59564208984375, -1.5399627685546875, -1.484283447265625, -1.4286041259765625, -1.3729248046875, -1.3172454833984375, -1.261566162109375, -1.2058868408203125, -1.15020751953125, -1.0945281982421875, -1.038848876953125, -0.9831695556640625, -0.927490234375, -0.8718109130859375, -0.816131591796875, -0.7604522705078125, -0.70477294921875, -0.6490936279296875, -0.593414306640625, -0.5377349853515625, -0.4820556640625, -0.4263763427734375, -0.370697021484375, -0.3150177001953125, -0.25933837890625, -0.2036590576171875, -0.147979736328125, -0.0923004150390625, -0.03662109375, 0.0190582275390625, 0.074737548828125, 0.1304168701171875, 0.18609619140625, 0.2417755126953125, 0.297454833984375, 0.3531341552734375, 0.4088134765625, 0.4644927978515625, 0.520172119140625, 0.5758514404296875, 0.63153076171875, 0.6872100830078125, 0.742889404296875, 0.7985687255859375, 0.854248046875, 0.9099273681640625, 0.965606689453125, 1.0212860107421875, 1.07696533203125, 1.1326446533203125, 1.188323974609375, 1.2440032958984375, 1.2996826171875, 1.3553619384765625, 1.411041259765625, 1.4667205810546875, 1.52239990234375, 1.5780792236328125, 1.633758544921875, 1.6894378662109375, 1.7451171875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 5.0, 1.0, 8.0, 8.0, 9.0, 25.0, 27.0, 34.0, 94.0, 418.0, 164.0, 87.0, 32.0, 27.0, 25.0, 7.0, 5.0, 5.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.015466690063477e-05, -6.754230707883835e-05, -6.492994725704193e-05, -6.231758743524551e-05, -5.97052276134491e-05, -5.709286779165268e-05, -5.448050796985626e-05, -5.1868148148059845e-05, -4.925578832626343e-05, -4.664342850446701e-05, -4.403106868267059e-05, -4.1418708860874176e-05, -3.880634903907776e-05, -3.619398921728134e-05, -3.3581629395484924e-05, -3.096926957368851e-05, -2.835690975189209e-05, -2.5744549930095673e-05, -2.3132190108299255e-05, -2.0519830286502838e-05, -1.790747046470642e-05, -1.5295110642910004e-05, -1.2682750821113586e-05, -1.007039099931717e-05, -7.458031177520752e-06, -4.845671355724335e-06, -2.2333115339279175e-06, 3.7904828786849976e-07, 2.991408109664917e-06, 5.603767931461334e-06, 8.216127753257751e-06, 1.0828487575054169e-05, 1.3440847396850586e-05, 1.6053207218647003e-05, 1.866556704044342e-05, 2.1277926862239838e-05, 2.3890286684036255e-05, 2.6502646505832672e-05, 2.911500632762909e-05, 3.1727366149425507e-05, 3.4339725971221924e-05, 3.695208579301834e-05, 3.956444561481476e-05, 4.2176805436611176e-05, 4.478916525840759e-05, 4.740152508020401e-05, 5.001388490200043e-05, 5.2626244723796844e-05, 5.523860454559326e-05, 5.785096436738968e-05, 6.0463324189186096e-05, 6.307568401098251e-05, 6.568804383277893e-05, 6.830040365457535e-05, 7.091276347637177e-05, 7.352512329816818e-05, 7.61374831199646e-05, 7.874984294176102e-05, 8.136220276355743e-05, 8.397456258535385e-05, 8.658692240715027e-05, 8.919928222894669e-05, 9.18116420507431e-05, 9.442400187253952e-05, 9.703636169433594e-05]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 3.0, 10.0, 11.0, 13.0, 21.0, 19.0, 48.0, 68.0, 79.0, 96.0, 149.0, 244.0, 346.0, 528.0, 796.0, 1308.0, 2200.0, 3684.0, 6339.0, 11874.0, 24350.0, 66587.0, 703817.0, 146837.0, 40365.0, 17009.0, 8910.0, 5062.0, 2947.0, 1788.0, 1052.0, 656.0, 448.0, 282.0, 181.0, 114.0, 93.0, 60.0, 55.0, 34.0, 20.0, 11.0, 17.0, 5.0, 3.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.671875, -1.61376953125, -1.5556640625, -1.49755859375, -1.439453125, -1.38134765625, -1.3232421875, -1.26513671875, -1.20703125, -1.14892578125, -1.0908203125, -1.03271484375, -0.974609375, -0.91650390625, -0.8583984375, -0.80029296875, -0.7421875, -0.68408203125, -0.6259765625, -0.56787109375, -0.509765625, -0.45166015625, -0.3935546875, -0.33544921875, -0.27734375, -0.21923828125, -0.1611328125, -0.10302734375, -0.044921875, 0.01318359375, 0.0712890625, 0.12939453125, 0.1875, 0.24560546875, 0.3037109375, 0.36181640625, 0.419921875, 0.47802734375, 0.5361328125, 0.59423828125, 0.65234375, 0.71044921875, 0.7685546875, 0.82666015625, 0.884765625, 0.94287109375, 1.0009765625, 1.05908203125, 1.1171875, 1.17529296875, 1.2333984375, 1.29150390625, 1.349609375, 1.40771484375, 1.4658203125, 1.52392578125, 1.58203125, 1.64013671875, 1.6982421875, 1.75634765625, 1.814453125, 1.87255859375, 1.9306640625, 1.98876953125, 2.046875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 5.0, 17.0, 17.0, 4.0, 12.0, 13.0, 30.0, 42.0, 36.0, 51.0, 153.0, 323.0, 50.0, 58.0, 40.0, 20.0, 25.0, 17.0, 11.0, 8.0, 8.0, 12.0, 4.0, 7.0, 7.0, 2.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.393798828125, -0.3792381286621094, -0.36467742919921875, -0.3501167297363281, -0.3355560302734375, -0.3209953308105469, -0.30643463134765625, -0.2918739318847656, -0.277313232421875, -0.2627525329589844, -0.24819183349609375, -0.23363113403320312, -0.2190704345703125, -0.20450973510742188, -0.18994903564453125, -0.17538833618164062, -0.16082763671875, -0.14626693725585938, -0.13170623779296875, -0.11714553833007812, -0.1025848388671875, -0.08802413940429688, -0.07346343994140625, -0.058902740478515625, -0.044342041015625, -0.029781341552734375, -0.01522064208984375, -0.000659942626953125, 0.0139007568359375, 0.028461456298828125, 0.04302215576171875, 0.057582855224609375, 0.0721435546875, 0.08670425415039062, 0.10126495361328125, 0.11582565307617188, 0.1303863525390625, 0.14494705200195312, 0.15950775146484375, 0.17406845092773438, 0.188629150390625, 0.20318984985351562, 0.21775054931640625, 0.23231124877929688, 0.2468719482421875, 0.2614326477050781, 0.27599334716796875, 0.2905540466308594, 0.30511474609375, 0.3196754455566406, 0.33423614501953125, 0.3487968444824219, 0.3633575439453125, 0.3779182434082031, 0.39247894287109375, 0.4070396423339844, 0.421600341796875, 0.4361610412597656, 0.45072174072265625, 0.4652824401855469, 0.4798431396484375, 0.4944038391113281, 0.5089645385742188, 0.5235252380371094, 0.5380859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 10.0, 9.0, 10.0, 9.0, 23.0, 31.0, 39.0, 57.0, 79.0, 88.0, 135.0, 99.0, 93.0, 58.0, 51.0, 53.0, 33.0, 21.0, 23.0, 12.0, 11.0, 6.0, 7.0, 4.0, 3.0, 9.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5896393060684204, -1.5361613035202026, -1.4826831817626953, -1.4292051792144775, -1.3757271766662598, -1.3222490549087524, -1.2687710523605347, -1.2152929306030273, -1.1618149280548096, -1.1083369255065918, -1.0548588037490845, -1.0013808012008667, -0.9479027390480042, -0.8944246768951416, -0.8409466743469238, -0.7874686121940613, -0.7339905500411987, -0.6805124878883362, -0.6270344257354736, -0.5735564231872559, -0.5200783610343933, -0.46660029888153076, -0.4131222665309906, -0.35964423418045044, -0.3061661720275879, -0.25268810987472534, -0.19921007752418518, -0.14573203027248383, -0.09225398302078247, -0.03877592086791992, 0.01470211148262024, 0.0681801438331604, 0.1216580867767334, 0.17513613402843475, 0.2286141812801361, 0.28209221363067627, 0.3355702757835388, 0.38904833793640137, 0.44252637028694153, 0.4960044026374817, 0.5494824647903442, 0.6029605269432068, 0.6564385890960693, 0.7099165916442871, 0.7633946537971497, 0.8168727159500122, 0.87035071849823, 0.9238287806510925, 0.9773068428039551, 1.0307848453521729, 1.0842629671096802, 1.137740969657898, 1.1912190914154053, 1.244697093963623, 1.2981750965118408, 1.3516530990600586, 1.405131220817566, 1.4586092233657837, 1.512087345123291, 1.5655653476715088, 1.6190433502197266, 1.6725214719772339, 1.7259994745254517, 1.779477596282959, 1.8329555988311768]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 9.0, 12.0, 11.0, 11.0, 20.0, 28.0, 26.0, 27.0, 20.0, 29.0, 38.0, 30.0, 40.0, 29.0, 51.0, 35.0, 29.0, 48.0, 39.0, 45.0, 40.0, 34.0, 32.0, 39.0, 26.0, 31.0, 22.0, 26.0, 35.0, 23.0, 16.0, 17.0, 17.0, 6.0, 2.0, 11.0, 8.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.099994421005249, -1.0658196210861206, -1.0316448211669922, -0.9974700808525085, -0.9632953405380249, -0.9291205406188965, -0.8949457406997681, -0.8607709407806396, -0.826596200466156, -0.7924214005470276, -0.758246660232544, -0.7240718603134155, -0.6898970603942871, -0.6557223200798035, -0.621547520160675, -0.5873727798461914, -0.553197979927063, -0.5190231800079346, -0.4848484396934509, -0.4506736397743225, -0.4164988696575165, -0.38232409954071045, -0.34814929962158203, -0.313974529504776, -0.27979975938796997, -0.24562498927116394, -0.21145020425319672, -0.1772754192352295, -0.14310064911842346, -0.10892587900161743, -0.07475109398365021, -0.04057630896568298, -0.006401419639587402, 0.027773357927799225, 0.06194813549518585, 0.09612291306257248, 0.1302976906299591, 0.16447246074676514, 0.19864724576473236, 0.23282203078269958, 0.2669968008995056, 0.30117157101631165, 0.3353463411331177, 0.3695211410522461, 0.4036959111690521, 0.43787068128585815, 0.4720454812049866, 0.5062202215194702, 0.5403950214385986, 0.574569821357727, 0.6087445616722107, 0.6429193615913391, 0.6770941019058228, 0.7112689018249512, 0.7454437017440796, 0.779618501663208, 0.8137932419776917, 0.8479680418968201, 0.8821427822113037, 0.9163175821304321, 0.9504923820495605, 0.9846671223640442, 1.0188418626785278, 1.0530166625976562, 1.0871914625167847]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 7.0, 13.0, 24.0, 25.0, 41.0, 72.0, 78.0, 135.0, 203.0, 278.0, 445.0, 583.0, 864.0, 1244.0, 1812.0, 2720.0, 4235.0, 6503.0, 9993.0, 15467.0, 24844.0, 41406.0, 71534.0, 134132.0, 305540.0, 1079556.0, 1560673.0, 514188.0, 191719.0, 94718.0, 51761.0, 30206.0, 18507.0, 11281.0, 7124.0, 4467.0, 2971.0, 1722.0, 1189.0, 718.0, 423.0, 292.0, 202.0, 117.0, 87.0, 49.0, 45.0, 22.0, 16.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4609375, -1.4155731201171875, -1.370208740234375, -1.3248443603515625, -1.27947998046875, -1.2341156005859375, -1.188751220703125, -1.1433868408203125, -1.0980224609375, -1.0526580810546875, -1.007293701171875, -0.9619293212890625, -0.91656494140625, -0.8712005615234375, -0.825836181640625, -0.7804718017578125, -0.735107421875, -0.6897430419921875, -0.644378662109375, -0.5990142822265625, -0.55364990234375, -0.5082855224609375, -0.462921142578125, -0.4175567626953125, -0.3721923828125, -0.3268280029296875, -0.281463623046875, -0.2360992431640625, -0.19073486328125, -0.1453704833984375, -0.100006103515625, -0.0546417236328125, -0.00927734375, 0.0360870361328125, 0.081451416015625, 0.1268157958984375, 0.17218017578125, 0.2175445556640625, 0.262908935546875, 0.3082733154296875, 0.3536376953125, 0.3990020751953125, 0.444366455078125, 0.4897308349609375, 0.53509521484375, 0.5804595947265625, 0.625823974609375, 0.6711883544921875, 0.716552734375, 0.7619171142578125, 0.807281494140625, 0.8526458740234375, 0.89801025390625, 0.9433746337890625, 0.988739013671875, 1.0341033935546875, 1.0794677734375, 1.1248321533203125, 1.170196533203125, 1.2155609130859375, 1.26092529296875, 1.3062896728515625, 1.351654052734375, 1.3970184326171875, 1.4423828125]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 13.0, 9.0, 10.0, 17.0, 13.0, 21.0, 23.0, 23.0, 26.0, 32.0, 30.0, 37.0, 39.0, 45.0, 37.0, 42.0, 44.0, 43.0, 37.0, 42.0, 45.0, 35.0, 36.0, 31.0, 32.0, 31.0, 27.0, 32.0, 18.0, 27.0, 14.0, 19.0, 14.0, 11.0, 4.0, 8.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72021484375, -0.697967529296875, -0.67572021484375, -0.653472900390625, -0.6312255859375, -0.608978271484375, -0.58673095703125, -0.564483642578125, -0.542236328125, -0.519989013671875, -0.49774169921875, -0.475494384765625, -0.4532470703125, -0.430999755859375, -0.40875244140625, -0.386505126953125, -0.3642578125, -0.342010498046875, -0.31976318359375, -0.297515869140625, -0.2752685546875, -0.253021240234375, -0.23077392578125, -0.208526611328125, -0.186279296875, -0.164031982421875, -0.14178466796875, -0.119537353515625, -0.0972900390625, -0.075042724609375, -0.05279541015625, -0.030548095703125, -0.00830078125, 0.013946533203125, 0.03619384765625, 0.058441162109375, 0.0806884765625, 0.102935791015625, 0.12518310546875, 0.147430419921875, 0.169677734375, 0.191925048828125, 0.21417236328125, 0.236419677734375, 0.2586669921875, 0.280914306640625, 0.30316162109375, 0.325408935546875, 0.34765625, 0.369903564453125, 0.39215087890625, 0.414398193359375, 0.4366455078125, 0.458892822265625, 0.48114013671875, 0.503387451171875, 0.525634765625, 0.547882080078125, 0.57012939453125, 0.592376708984375, 0.6146240234375, 0.636871337890625, 0.65911865234375, 0.681365966796875, 0.70361328125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 2.0, 12.0, 21.0, 36.0, 47.0, 64.0, 98.0, 196.0, 276.0, 466.0, 829.0, 1273.0, 2219.0, 3697.0, 6480.0, 11495.0, 21223.0, 39934.0, 81823.0, 179184.0, 454462.0, 1512557.0, 1200104.0, 375146.0, 152547.0, 71062.0, 35686.0, 18790.0, 10407.0, 5893.0, 3320.0, 1945.0, 1200.0, 684.0, 427.0, 239.0, 176.0, 101.0, 55.0, 33.0, 35.0, 19.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.4004364013671875, -1.353607177734375, -1.3067779541015625, -1.25994873046875, -1.2131195068359375, -1.166290283203125, -1.1194610595703125, -1.0726318359375, -1.0258026123046875, -0.978973388671875, -0.9321441650390625, -0.88531494140625, -0.8384857177734375, -0.791656494140625, -0.7448272705078125, -0.697998046875, -0.6511688232421875, -0.604339599609375, -0.5575103759765625, -0.51068115234375, -0.4638519287109375, -0.417022705078125, -0.3701934814453125, -0.3233642578125, -0.2765350341796875, -0.229705810546875, -0.1828765869140625, -0.13604736328125, -0.0892181396484375, -0.042388916015625, 0.0044403076171875, 0.05126953125, 0.0980987548828125, 0.144927978515625, 0.1917572021484375, 0.23858642578125, 0.2854156494140625, 0.332244873046875, 0.3790740966796875, 0.4259033203125, 0.4727325439453125, 0.519561767578125, 0.5663909912109375, 0.61322021484375, 0.6600494384765625, 0.706878662109375, 0.7537078857421875, 0.800537109375, 0.8473663330078125, 0.894195556640625, 0.9410247802734375, 0.98785400390625, 1.0346832275390625, 1.081512451171875, 1.1283416748046875, 1.1751708984375, 1.2220001220703125, 1.268829345703125, 1.3156585693359375, 1.36248779296875, 1.4093170166015625, 1.456146240234375, 1.5029754638671875, 1.5498046875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 10.0, 22.0, 19.0, 25.0, 23.0, 33.0, 41.0, 71.0, 85.0, 92.0, 98.0, 125.0, 153.0, 203.0, 195.0, 231.0, 265.0, 286.0, 281.0, 291.0, 226.0, 231.0, 196.0, 156.0, 128.0, 117.0, 89.0, 60.0, 54.0, 60.0, 41.0, 39.0, 25.0, 13.0, 19.0, 10.0, 13.0, 10.0, 4.0, 10.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0], "bins": [-0.436767578125, -0.4246978759765625, -0.412628173828125, -0.4005584716796875, -0.38848876953125, -0.3764190673828125, -0.364349365234375, -0.3522796630859375, -0.3402099609375, -0.3281402587890625, -0.316070556640625, -0.3040008544921875, -0.29193115234375, -0.2798614501953125, -0.267791748046875, -0.2557220458984375, -0.24365234375, -0.2315826416015625, -0.219512939453125, -0.2074432373046875, -0.19537353515625, -0.1833038330078125, -0.171234130859375, -0.1591644287109375, -0.1470947265625, -0.1350250244140625, -0.122955322265625, -0.1108856201171875, -0.09881591796875, -0.0867462158203125, -0.074676513671875, -0.0626068115234375, -0.050537109375, -0.0384674072265625, -0.026397705078125, -0.0143280029296875, -0.00225830078125, 0.0098114013671875, 0.021881103515625, 0.0339508056640625, 0.0460205078125, 0.0580902099609375, 0.070159912109375, 0.0822296142578125, 0.09429931640625, 0.1063690185546875, 0.118438720703125, 0.1305084228515625, 0.142578125, 0.1546478271484375, 0.166717529296875, 0.1787872314453125, 0.19085693359375, 0.2029266357421875, 0.214996337890625, 0.2270660400390625, 0.2391357421875, 0.2512054443359375, 0.263275146484375, 0.2753448486328125, 0.28741455078125, 0.2994842529296875, 0.311553955078125, 0.3236236572265625, 0.335693359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 1.0, 8.0, 6.0, 8.0, 7.0, 13.0, 26.0, 24.0, 44.0, 45.0, 76.0, 82.0, 117.0, 109.0, 105.0, 75.0, 60.0, 56.0, 34.0, 23.0, 14.0, 18.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6699382066726685, -1.6285617351531982, -1.587185263633728, -1.5458087921142578, -1.5044323205947876, -1.4630558490753174, -1.4216793775558472, -1.380302906036377, -1.3389265537261963, -1.297550082206726, -1.2561736106872559, -1.2147971391677856, -1.1734206676483154, -1.1320441961288452, -1.090667724609375, -1.0492913722991943, -1.0079147815704346, -0.9665383100509644, -0.9251618385314941, -0.8837853670120239, -0.8424088954925537, -0.8010324239730835, -0.7596560120582581, -0.7182795405387878, -0.6769030690193176, -0.6355265974998474, -0.5941501259803772, -0.552773654460907, -0.5113972425460815, -0.47002074122428894, -0.4286442995071411, -0.3872678279876709, -0.3458913564682007, -0.30451488494873047, -0.26313841342926025, -0.22176197171211243, -0.1803855001926422, -0.139009028673172, -0.09763257205486298, -0.056256115436553955, -0.01487964391708374, 0.026496820151805878, 0.0678732842206955, 0.10924974828958511, 0.15062621235847473, 0.19200268387794495, 0.23337914049625397, 0.274755597114563, 0.3161320686340332, 0.3575085401535034, 0.39888501167297363, 0.44026145339012146, 0.4816379249095917, 0.5230144262313843, 0.5643908381462097, 0.6057673096656799, 0.6471437811851501, 0.6885202527046204, 0.7298967242240906, 0.7712731957435608, 0.8126496076583862, 0.8540260791778564, 0.8954025506973267, 0.9367790222167969, 0.9781554937362671]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 7.0, 11.0, 13.0, 14.0, 19.0, 24.0, 26.0, 27.0, 20.0, 30.0, 27.0, 23.0, 31.0, 30.0, 33.0, 28.0, 30.0, 35.0, 27.0, 42.0, 46.0, 37.0, 36.0, 38.0, 45.0, 30.0, 38.0, 28.0, 38.0, 22.0, 19.0, 27.0, 12.0, 11.0, 14.0, 14.0, 13.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7955688834190369, -0.7720916867256165, -0.7486144304275513, -0.7251372337341309, -0.7016600370407104, -0.6781827807426453, -0.6547055840492249, -0.6312283277511597, -0.6077511310577393, -0.5842739343643188, -0.5607966780662537, -0.5373194813728333, -0.5138422250747681, -0.49036502838134766, -0.46688783168792725, -0.44341060519218445, -0.41993337869644165, -0.39645615220069885, -0.37297892570495605, -0.34950172901153564, -0.32602450251579285, -0.30254727602005005, -0.27907007932662964, -0.25559285283088684, -0.23211562633514404, -0.20863839983940125, -0.18516118824481964, -0.16168397665023804, -0.13820675015449524, -0.11472953110933304, -0.09125231206417084, -0.06777510046958923, -0.044297873973846436, -0.020820654928684235, 0.0026565641164779663, 0.026133783161640167, 0.04961100220680237, 0.07308822125196457, 0.09656544029712677, 0.12004265189170837, 0.14351987838745117, 0.16699710488319397, 0.19047431647777557, 0.21395152807235718, 0.23742875456809998, 0.2609059810638428, 0.2843831777572632, 0.307860404253006, 0.3313376307487488, 0.3548148572444916, 0.3782920837402344, 0.4017692804336548, 0.4252465069293976, 0.4487237334251404, 0.4722009301185608, 0.4956781566143036, 0.5191553831100464, 0.5426325798034668, 0.566109836101532, 0.5895870327949524, 0.6130642890930176, 0.636541485786438, 0.6600186824798584, 0.6834958791732788, 0.706973135471344]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 8.0, 21.0, 22.0, 37.0, 51.0, 82.0, 111.0, 193.0, 297.0, 436.0, 604.0, 883.0, 1305.0, 1871.0, 2786.0, 4027.0, 6423.0, 10285.0, 17422.0, 30891.0, 60231.0, 132743.0, 328325.0, 239364.0, 98540.0, 46977.0, 25055.0, 14356.0, 8678.0, 5405.0, 3601.0, 2357.0, 1634.0, 1140.0, 805.0, 525.0, 334.0, 224.0, 175.0, 104.0, 80.0, 44.0, 30.0, 25.0, 14.0, 10.0, 9.0, 7.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.56640625, -0.550140380859375, -0.53387451171875, -0.517608642578125, -0.5013427734375, -0.485076904296875, -0.46881103515625, -0.452545166015625, -0.436279296875, -0.420013427734375, -0.40374755859375, -0.387481689453125, -0.3712158203125, -0.354949951171875, -0.33868408203125, -0.322418212890625, -0.30615234375, -0.289886474609375, -0.27362060546875, -0.257354736328125, -0.2410888671875, -0.224822998046875, -0.20855712890625, -0.192291259765625, -0.176025390625, -0.159759521484375, -0.14349365234375, -0.127227783203125, -0.1109619140625, -0.094696044921875, -0.07843017578125, -0.062164306640625, -0.0458984375, -0.029632568359375, -0.01336669921875, 0.002899169921875, 0.0191650390625, 0.035430908203125, 0.05169677734375, 0.067962646484375, 0.084228515625, 0.100494384765625, 0.11676025390625, 0.133026123046875, 0.1492919921875, 0.165557861328125, 0.18182373046875, 0.198089599609375, 0.21435546875, 0.230621337890625, 0.24688720703125, 0.263153076171875, 0.2794189453125, 0.295684814453125, 0.31195068359375, 0.328216552734375, 0.344482421875, 0.360748291015625, 0.37701416015625, 0.393280029296875, 0.4095458984375, 0.425811767578125, 0.44207763671875, 0.458343505859375, 0.474609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 6.0, 7.0, 5.0, 10.0, 14.0, 16.0, 14.0, 18.0, 26.0, 23.0, 34.0, 27.0, 31.0, 30.0, 29.0, 31.0, 38.0, 32.0, 30.0, 33.0, 53.0, 51.0, 46.0, 33.0, 37.0, 41.0, 37.0, 33.0, 30.0, 36.0, 32.0, 17.0, 18.0, 18.0, 11.0, 10.0, 17.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.84716796875, -0.8222732543945312, -0.7973785400390625, -0.7724838256835938, -0.747589111328125, -0.7226943969726562, -0.6977996826171875, -0.6729049682617188, -0.64801025390625, -0.6231155395507812, -0.5982208251953125, -0.5733261108398438, -0.548431396484375, -0.5235366821289062, -0.4986419677734375, -0.47374725341796875, -0.4488525390625, -0.42395782470703125, -0.3990631103515625, -0.37416839599609375, -0.349273681640625, -0.32437896728515625, -0.2994842529296875, -0.27458953857421875, -0.24969482421875, -0.22480010986328125, -0.1999053955078125, -0.17501068115234375, -0.150115966796875, -0.12522125244140625, -0.1003265380859375, -0.07543182373046875, -0.050537109375, -0.02564239501953125, -0.0007476806640625, 0.02414703369140625, 0.049041748046875, 0.07393646240234375, 0.0988311767578125, 0.12372589111328125, 0.14862060546875, 0.17351531982421875, 0.1984100341796875, 0.22330474853515625, 0.248199462890625, 0.27309417724609375, 0.2979888916015625, 0.32288360595703125, 0.3477783203125, 0.37267303466796875, 0.3975677490234375, 0.42246246337890625, 0.447357177734375, 0.47225189208984375, 0.4971466064453125, 0.5220413208007812, 0.54693603515625, 0.5718307495117188, 0.5967254638671875, 0.6216201782226562, 0.646514892578125, 0.6714096069335938, 0.6963043212890625, 0.7211990356445312, 0.74609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 17.0, 24.0, 31.0, 34.0, 59.0, 77.0, 135.0, 183.0, 249.0, 371.0, 485.0, 679.0, 1001.0, 1381.0, 2069.0, 3005.0, 4738.0, 7672.0, 13929.0, 29860.0, 103050.0, 659932.0, 144352.0, 35592.0, 15638.0, 8510.0, 5020.0, 3255.0, 2117.0, 1498.0, 986.0, 711.0, 503.0, 397.0, 265.0, 210.0, 134.0, 99.0, 74.0, 54.0, 42.0, 32.0, 19.0, 12.0, 13.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.873046875, -0.8470535278320312, -0.8210601806640625, -0.7950668334960938, -0.769073486328125, -0.7430801391601562, -0.7170867919921875, -0.6910934448242188, -0.66510009765625, -0.6391067504882812, -0.6131134033203125, -0.5871200561523438, -0.561126708984375, -0.5351333618164062, -0.5091400146484375, -0.48314666748046875, -0.4571533203125, -0.43115997314453125, -0.4051666259765625, -0.37917327880859375, -0.353179931640625, -0.32718658447265625, -0.3011932373046875, -0.27519989013671875, -0.24920654296875, -0.22321319580078125, -0.1972198486328125, -0.17122650146484375, -0.145233154296875, -0.11923980712890625, -0.0932464599609375, -0.06725311279296875, -0.041259765625, -0.01526641845703125, 0.0107269287109375, 0.03672027587890625, 0.062713623046875, 0.08870697021484375, 0.1147003173828125, 0.14069366455078125, 0.16668701171875, 0.19268035888671875, 0.2186737060546875, 0.24466705322265625, 0.270660400390625, 0.29665374755859375, 0.3226470947265625, 0.34864044189453125, 0.3746337890625, 0.40062713623046875, 0.4266204833984375, 0.45261383056640625, 0.478607177734375, 0.5046005249023438, 0.5305938720703125, 0.5565872192382812, 0.58258056640625, 0.6085739135742188, 0.6345672607421875, 0.6605606079101562, 0.686553955078125, 0.7125473022460938, 0.7385406494140625, 0.7645339965820312, 0.79052734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 4.0, 10.0, 12.0, 14.0, 20.0, 17.0, 18.0, 18.0, 20.0, 24.0, 28.0, 36.0, 32.0, 37.0, 29.0, 44.0, 44.0, 37.0, 51.0, 47.0, 33.0, 33.0, 37.0, 35.0, 41.0, 29.0, 29.0, 19.0, 23.0, 24.0, 28.0, 28.0, 11.0, 20.0, 11.0, 6.0, 7.0, 4.0, 6.0, 0.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.50732421875, -0.49143218994140625, -0.4755401611328125, -0.45964813232421875, -0.443756103515625, -0.42786407470703125, -0.4119720458984375, -0.39608001708984375, -0.38018798828125, -0.36429595947265625, -0.3484039306640625, -0.33251190185546875, -0.316619873046875, -0.30072784423828125, -0.2848358154296875, -0.26894378662109375, -0.2530517578125, -0.23715972900390625, -0.2212677001953125, -0.20537567138671875, -0.189483642578125, -0.17359161376953125, -0.1576995849609375, -0.14180755615234375, -0.12591552734375, -0.11002349853515625, -0.0941314697265625, -0.07823944091796875, -0.062347412109375, -0.04645538330078125, -0.0305633544921875, -0.01467132568359375, 0.001220703125, 0.01711273193359375, 0.0330047607421875, 0.04889678955078125, 0.064788818359375, 0.08068084716796875, 0.0965728759765625, 0.11246490478515625, 0.12835693359375, 0.14424896240234375, 0.1601409912109375, 0.17603302001953125, 0.191925048828125, 0.20781707763671875, 0.2237091064453125, 0.23960113525390625, 0.2554931640625, 0.27138519287109375, 0.2872772216796875, 0.30316925048828125, 0.319061279296875, 0.33495330810546875, 0.3508453369140625, 0.36673736572265625, 0.38262939453125, 0.39852142333984375, 0.4144134521484375, 0.43030548095703125, 0.446197509765625, 0.46208953857421875, 0.4779815673828125, 0.49387359619140625, 0.509765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 6.0, 9.0, 18.0, 30.0, 36.0, 46.0, 44.0, 73.0, 112.0, 129.0, 199.0, 302.0, 408.0, 565.0, 866.0, 1524.0, 2738.0, 5480.0, 12417.0, 37934.0, 249229.0, 647300.0, 57331.0, 16560.0, 6869.0, 3304.0, 1771.0, 1013.0, 669.0, 435.0, 320.0, 217.0, 155.0, 94.0, 80.0, 70.0, 41.0, 37.0, 25.0, 18.0, 14.0, 15.0, 10.0, 5.0, 4.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.244384765625, -0.23701095581054688, -0.22963714599609375, -0.22226333618164062, -0.2148895263671875, -0.20751571655273438, -0.20014190673828125, -0.19276809692382812, -0.185394287109375, -0.17802047729492188, -0.17064666748046875, -0.16327285766601562, -0.1558990478515625, -0.14852523803710938, -0.14115142822265625, -0.13377761840820312, -0.12640380859375, -0.11902999877929688, -0.11165618896484375, -0.10428237915039062, -0.0969085693359375, -0.08953475952148438, -0.08216094970703125, -0.07478713989257812, -0.067413330078125, -0.060039520263671875, -0.05266571044921875, -0.045291900634765625, -0.0379180908203125, -0.030544281005859375, -0.02317047119140625, -0.015796661376953125, -0.0084228515625, -0.001049041748046875, 0.00632476806640625, 0.013698577880859375, 0.0210723876953125, 0.028446197509765625, 0.03582000732421875, 0.043193817138671875, 0.050567626953125, 0.057941436767578125, 0.06531524658203125, 0.07268905639648438, 0.0800628662109375, 0.08743667602539062, 0.09481048583984375, 0.10218429565429688, 0.10955810546875, 0.11693191528320312, 0.12430572509765625, 0.13167953491210938, 0.1390533447265625, 0.14642715454101562, 0.15380096435546875, 0.16117477416992188, 0.168548583984375, 0.17592239379882812, 0.18329620361328125, 0.19067001342773438, 0.1980438232421875, 0.20541763305664062, 0.21279144287109375, 0.22016525268554688, 0.2275390625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 5.0, 4.0, 8.0, 11.0, 14.0, 12.0, 14.0, 24.0, 17.0, 20.0, 37.0, 47.0, 53.0, 90.0, 95.0, 93.0, 85.0, 90.0, 78.0, 44.0, 38.0, 27.0, 26.0, 16.0, 16.0, 10.0, 3.0, 6.0, 4.0, 0.0, 1.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-06, -5.142763257026672e-06, -4.9211084842681885e-06, -4.699453711509705e-06, -4.477798938751221e-06, -4.256144165992737e-06, -4.034489393234253e-06, -3.812834620475769e-06, -3.591179847717285e-06, -3.3695250749588013e-06, -3.1478703022003174e-06, -2.9262155294418335e-06, -2.7045607566833496e-06, -2.4829059839248657e-06, -2.261251211166382e-06, -2.039596438407898e-06, -1.817941665649414e-06, -1.5962868928909302e-06, -1.3746321201324463e-06, -1.1529773473739624e-06, -9.313225746154785e-07, -7.096678018569946e-07, -4.880130290985107e-07, -2.6635825634002686e-07, -4.470348358154297e-08, 1.7695128917694092e-07, 3.986060619354248e-07, 6.202608346939087e-07, 8.419156074523926e-07, 1.0635703802108765e-06, 1.2852251529693604e-06, 1.5068799257278442e-06, 1.7285346984863281e-06, 1.950189471244812e-06, 2.171844244003296e-06, 2.3934990167617798e-06, 2.6151537895202637e-06, 2.8368085622787476e-06, 3.0584633350372314e-06, 3.2801181077957153e-06, 3.5017728805541992e-06, 3.723427653312683e-06, 3.945082426071167e-06, 4.166737198829651e-06, 4.388391971588135e-06, 4.610046744346619e-06, 4.8317015171051025e-06, 5.0533562898635864e-06, 5.27501106262207e-06, 5.496665835380554e-06, 5.718320608139038e-06, 5.939975380897522e-06, 6.161630153656006e-06, 6.38328492641449e-06, 6.604939699172974e-06, 6.8265944719314575e-06, 7.048249244689941e-06, 7.269904017448425e-06, 7.491558790206909e-06, 7.713213562965393e-06, 7.934868335723877e-06, 8.15652310848236e-06, 8.378177881240845e-06, 8.599832653999329e-06, 8.821487426757812e-06]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 17.0, 13.0, 17.0, 29.0, 32.0, 49.0, 61.0, 108.0, 141.0, 184.0, 252.0, 358.0, 517.0, 785.0, 1182.0, 1575.0, 2409.0, 3644.0, 5951.0, 10285.0, 18709.0, 38426.0, 92283.0, 347492.0, 347247.0, 91732.0, 38689.0, 18732.0, 10064.0, 5970.0, 3805.0, 2417.0, 1686.0, 1098.0, 790.0, 511.0, 389.0, 273.0, 193.0, 124.0, 106.0, 64.0, 42.0, 28.0, 23.0, 26.0, 13.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.145751953125, -0.14119720458984375, -0.1366424560546875, -0.13208770751953125, -0.127532958984375, -0.12297821044921875, -0.1184234619140625, -0.11386871337890625, -0.10931396484375, -0.10475921630859375, -0.1002044677734375, -0.09564971923828125, -0.091094970703125, -0.08654022216796875, -0.0819854736328125, -0.07743072509765625, -0.0728759765625, -0.06832122802734375, -0.0637664794921875, -0.05921173095703125, -0.054656982421875, -0.05010223388671875, -0.0455474853515625, -0.04099273681640625, -0.03643798828125, -0.03188323974609375, -0.0273284912109375, -0.02277374267578125, -0.018218994140625, -0.01366424560546875, -0.0091094970703125, -0.00455474853515625, 0.0, 0.00455474853515625, 0.0091094970703125, 0.01366424560546875, 0.018218994140625, 0.02277374267578125, 0.0273284912109375, 0.03188323974609375, 0.03643798828125, 0.04099273681640625, 0.0455474853515625, 0.05010223388671875, 0.054656982421875, 0.05921173095703125, 0.0637664794921875, 0.06832122802734375, 0.0728759765625, 0.07743072509765625, 0.0819854736328125, 0.08654022216796875, 0.091094970703125, 0.09564971923828125, 0.1002044677734375, 0.10475921630859375, 0.10931396484375, 0.11386871337890625, 0.1184234619140625, 0.12297821044921875, 0.127532958984375, 0.13208770751953125, 0.1366424560546875, 0.14119720458984375, 0.145751953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 0.0, 11.0, 2.0, 8.0, 3.0, 5.0, 12.0, 15.0, 15.0, 26.0, 22.0, 35.0, 35.0, 40.0, 61.0, 69.0, 87.0, 77.0, 88.0, 77.0, 56.0, 49.0, 37.0, 28.0, 23.0, 27.0, 21.0, 10.0, 14.0, 9.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.029510498046875, -0.028545856475830078, -0.027581214904785156, -0.026616573333740234, -0.025651931762695312, -0.02468729019165039, -0.02372264862060547, -0.022758007049560547, -0.021793365478515625, -0.020828723907470703, -0.01986408233642578, -0.01889944076538086, -0.017934799194335938, -0.016970157623291016, -0.016005516052246094, -0.015040874481201172, -0.01407623291015625, -0.013111591339111328, -0.012146949768066406, -0.011182308197021484, -0.010217666625976562, -0.00925302505493164, -0.008288383483886719, -0.007323741912841797, -0.006359100341796875, -0.005394458770751953, -0.004429817199707031, -0.0034651756286621094, -0.0025005340576171875, -0.0015358924865722656, -0.0005712509155273438, 0.0003933906555175781, 0.0013580322265625, 0.002322673797607422, 0.0032873153686523438, 0.004251956939697266, 0.0052165985107421875, 0.006181240081787109, 0.007145881652832031, 0.008110523223876953, 0.009075164794921875, 0.010039806365966797, 0.011004447937011719, 0.01196908950805664, 0.012933731079101562, 0.013898372650146484, 0.014863014221191406, 0.015827655792236328, 0.01679229736328125, 0.017756938934326172, 0.018721580505371094, 0.019686222076416016, 0.020650863647460938, 0.02161550521850586, 0.02258014678955078, 0.023544788360595703, 0.024509429931640625, 0.025474071502685547, 0.02643871307373047, 0.02740335464477539, 0.028367996215820312, 0.029332637786865234, 0.030297279357910156, 0.03126192092895508, 0.0322265625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 7.0, 5.0, 1.0, 5.0, 7.0, 5.0, 13.0, 14.0, 14.0, 23.0, 36.0, 49.0, 57.0, 90.0, 89.0, 112.0, 103.0, 91.0, 60.0, 55.0, 55.0, 27.0, 19.0, 14.0, 17.0, 5.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.568750262260437, -1.5293562412261963, -1.4899623394012451, -1.4505683183670044, -1.4111742973327637, -1.3717803955078125, -1.3323863744735718, -1.292992353439331, -1.2535984516143799, -1.2142044305801392, -1.174810528755188, -1.1354165077209473, -1.096022605895996, -1.0566285848617554, -1.0172345638275146, -0.9778406023979187, -0.9384466409683228, -0.8990526795387268, -0.8596587181091309, -0.8202646970748901, -0.7808707356452942, -0.7414767742156982, -0.7020827531814575, -0.6626887917518616, -0.6232948303222656, -0.5839008688926697, -0.5445069074630737, -0.505112886428833, -0.46571892499923706, -0.4263249635696411, -0.3869309723377228, -0.34753698110580444, -0.3081430196762085, -0.26874905824661255, -0.2293550670146942, -0.18996109068393707, -0.15056711435317993, -0.11117313802242279, -0.07177916169166565, -0.032385170459747314, 0.007008790969848633, 0.046402767300605774, 0.08579674363136292, 0.12519071996212006, 0.1645846962928772, 0.20397867262363434, 0.24337264895439148, 0.2827666401863098, 0.32216060161590576, 0.3615545630455017, 0.40094855427742004, 0.4403425455093384, 0.4797365069389343, 0.5191304683685303, 0.558524489402771, 0.5979184508323669, 0.6373124122619629, 0.6767063736915588, 0.7161003351211548, 0.7554943561553955, 0.7948883175849915, 0.8342822790145874, 0.8736763000488281, 0.9130702614784241, 0.95246422290802]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 7.0, 8.0, 9.0, 12.0, 15.0, 16.0, 23.0, 34.0, 23.0, 21.0, 27.0, 29.0, 26.0, 26.0, 29.0, 36.0, 28.0, 29.0, 31.0, 31.0, 43.0, 43.0, 42.0, 37.0, 39.0, 41.0, 29.0, 36.0, 29.0, 38.0, 28.0, 20.0, 23.0, 12.0, 13.0, 13.0, 14.0, 12.0, 8.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7862319946289062, -0.7630535960197449, -0.7398751974105835, -0.7166967988014221, -0.6935184001922607, -0.6703400015830994, -0.647161602973938, -0.6239831447601318, -0.6008048057556152, -0.5776264071464539, -0.5544480085372925, -0.5312696099281311, -0.5080912113189697, -0.48491281270980835, -0.4617343842983246, -0.4385559856891632, -0.41537755727767944, -0.39219915866851807, -0.3690207600593567, -0.3458423614501953, -0.32266396284103394, -0.29948556423187256, -0.2763071358203888, -0.2531287372112274, -0.22995033860206604, -0.20677193999290466, -0.1835935413837433, -0.16041512787342072, -0.13723672926425934, -0.11405833065509796, -0.09087991714477539, -0.06770151853561401, -0.04452311992645264, -0.02134471759200096, 0.0018336847424507141, 0.025012090802192688, 0.048190489411354065, 0.07136888802051544, 0.09454730153083801, 0.11772570013999939, 0.14090409874916077, 0.16408249735832214, 0.18726089596748352, 0.2104393094778061, 0.23361770808696747, 0.25679612159729004, 0.2799745202064514, 0.3031529188156128, 0.32633131742477417, 0.34950971603393555, 0.3726881146430969, 0.3958665132522583, 0.4190449118614197, 0.44222331047058105, 0.4654017388820648, 0.4885801374912262, 0.51175856590271, 0.5349369645118713, 0.5581153631210327, 0.5812937617301941, 0.6044721603393555, 0.6276505589485168, 0.6508289575576782, 0.6740074157714844, 0.697185754776001]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 12.0, 8.0, 9.0, 19.0, 43.0, 53.0, 102.0, 147.0, 210.0, 323.0, 500.0, 761.0, 1186.0, 1987.0, 3005.0, 4805.0, 7594.0, 11969.0, 19644.0, 32658.0, 58061.0, 110111.0, 211809.0, 257041.0, 145588.0, 75432.0, 41340.0, 23886.0, 14730.0, 9435.0, 5875.0, 3720.0, 2367.0, 1524.0, 935.0, 601.0, 379.0, 247.0, 177.0, 107.0, 59.0, 41.0, 30.0, 15.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.373046875, -1.3290557861328125, -1.285064697265625, -1.2410736083984375, -1.19708251953125, -1.1530914306640625, -1.109100341796875, -1.0651092529296875, -1.0211181640625, -0.9771270751953125, -0.933135986328125, -0.8891448974609375, -0.84515380859375, -0.8011627197265625, -0.757171630859375, -0.7131805419921875, -0.669189453125, -0.6251983642578125, -0.581207275390625, -0.5372161865234375, -0.49322509765625, -0.4492340087890625, -0.405242919921875, -0.3612518310546875, -0.3172607421875, -0.2732696533203125, -0.229278564453125, -0.1852874755859375, -0.14129638671875, -0.0973052978515625, -0.053314208984375, -0.0093231201171875, 0.03466796875, 0.0786590576171875, 0.122650146484375, 0.1666412353515625, 0.21063232421875, 0.2546234130859375, 0.298614501953125, 0.3426055908203125, 0.3865966796875, 0.4305877685546875, 0.474578857421875, 0.5185699462890625, 0.56256103515625, 0.6065521240234375, 0.650543212890625, 0.6945343017578125, 0.738525390625, 0.7825164794921875, 0.826507568359375, 0.8704986572265625, 0.91448974609375, 0.9584808349609375, 1.002471923828125, 1.0464630126953125, 1.0904541015625, 1.1344451904296875, 1.178436279296875, 1.2224273681640625, 1.26641845703125, 1.3104095458984375, 1.354400634765625, 1.3983917236328125, 1.4423828125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 5.0, 3.0, 10.0, 20.0, 16.0, 20.0, 28.0, 26.0, 16.0, 26.0, 21.0, 38.0, 27.0, 24.0, 17.0, 38.0, 35.0, 33.0, 31.0, 28.0, 38.0, 44.0, 32.0, 28.0, 31.0, 29.0, 31.0, 34.0, 27.0, 33.0, 29.0, 28.0, 20.0, 26.0, 10.0, 12.0, 18.0, 9.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61279296875, -0.5936203002929688, -0.5744476318359375, -0.5552749633789062, -0.536102294921875, -0.5169296264648438, -0.4977569580078125, -0.47858428955078125, -0.45941162109375, -0.44023895263671875, -0.4210662841796875, -0.40189361572265625, -0.382720947265625, -0.36354827880859375, -0.3443756103515625, -0.32520294189453125, -0.3060302734375, -0.28685760498046875, -0.2676849365234375, -0.24851226806640625, -0.229339599609375, -0.21016693115234375, -0.1909942626953125, -0.17182159423828125, -0.15264892578125, -0.13347625732421875, -0.1143035888671875, -0.09513092041015625, -0.075958251953125, -0.05678558349609375, -0.0376129150390625, -0.01844024658203125, 0.000732421875, 0.01990509033203125, 0.0390777587890625, 0.05825042724609375, 0.077423095703125, 0.09659576416015625, 0.1157684326171875, 0.13494110107421875, 0.15411376953125, 0.17328643798828125, 0.1924591064453125, 0.21163177490234375, 0.230804443359375, 0.24997711181640625, 0.2691497802734375, 0.28832244873046875, 0.3074951171875, 0.32666778564453125, 0.3458404541015625, 0.36501312255859375, 0.384185791015625, 0.40335845947265625, 0.4225311279296875, 0.44170379638671875, 0.46087646484375, 0.48004913330078125, 0.4992218017578125, 0.5183944702148438, 0.537567138671875, 0.5567398071289062, 0.5759124755859375, 0.5950851440429688, 0.6142578125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 13.0, 11.0, 28.0, 42.0, 57.0, 84.0, 137.0, 169.0, 284.0, 367.0, 594.0, 870.0, 1324.0, 2077.0, 3321.0, 5222.0, 8426.0, 13939.0, 23593.0, 41650.0, 77837.0, 153947.0, 286682.0, 202817.0, 99656.0, 52073.0, 29032.0, 17017.0, 10048.0, 6134.0, 3924.0, 2449.0, 1675.0, 1009.0, 661.0, 464.0, 315.0, 180.0, 149.0, 74.0, 58.0, 48.0, 30.0, 22.0, 8.0, 11.0, 7.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.462890625, -1.4181365966796875, -1.373382568359375, -1.3286285400390625, -1.28387451171875, -1.2391204833984375, -1.194366455078125, -1.1496124267578125, -1.1048583984375, -1.0601043701171875, -1.015350341796875, -0.9705963134765625, -0.92584228515625, -0.8810882568359375, -0.836334228515625, -0.7915802001953125, -0.746826171875, -0.7020721435546875, -0.657318115234375, -0.6125640869140625, -0.56781005859375, -0.5230560302734375, -0.478302001953125, -0.4335479736328125, -0.3887939453125, -0.3440399169921875, -0.299285888671875, -0.2545318603515625, -0.20977783203125, -0.1650238037109375, -0.120269775390625, -0.0755157470703125, -0.03076171875, 0.0139923095703125, 0.058746337890625, 0.1035003662109375, 0.14825439453125, 0.1930084228515625, 0.237762451171875, 0.2825164794921875, 0.3272705078125, 0.3720245361328125, 0.416778564453125, 0.4615325927734375, 0.50628662109375, 0.5510406494140625, 0.595794677734375, 0.6405487060546875, 0.685302734375, 0.7300567626953125, 0.774810791015625, 0.8195648193359375, 0.86431884765625, 0.9090728759765625, 0.953826904296875, 0.9985809326171875, 1.0433349609375, 1.0880889892578125, 1.132843017578125, 1.1775970458984375, 1.22235107421875, 1.2671051025390625, 1.311859130859375, 1.3566131591796875, 1.4013671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 5.0, 8.0, 15.0, 10.0, 16.0, 13.0, 20.0, 35.0, 23.0, 26.0, 41.0, 34.0, 39.0, 45.0, 53.0, 45.0, 43.0, 62.0, 47.0, 50.0, 48.0, 38.0, 37.0, 35.0, 39.0, 25.0, 23.0, 25.0, 27.0, 17.0, 17.0, 8.0, 13.0, 8.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4395713806152344, -0.42284393310546875, -0.4061164855957031, -0.3893890380859375, -0.3726615905761719, -0.35593414306640625, -0.3392066955566406, -0.322479248046875, -0.3057518005371094, -0.28902435302734375, -0.2722969055175781, -0.2555694580078125, -0.23884201049804688, -0.22211456298828125, -0.20538711547851562, -0.18865966796875, -0.17193222045898438, -0.15520477294921875, -0.13847732543945312, -0.1217498779296875, -0.10502243041992188, -0.08829498291015625, -0.07156753540039062, -0.054840087890625, -0.038112640380859375, -0.02138519287109375, -0.004657745361328125, 0.0120697021484375, 0.028797149658203125, 0.04552459716796875, 0.062252044677734375, 0.0789794921875, 0.09570693969726562, 0.11243438720703125, 0.12916183471679688, 0.1458892822265625, 0.16261672973632812, 0.17934417724609375, 0.19607162475585938, 0.212799072265625, 0.22952651977539062, 0.24625396728515625, 0.2629814147949219, 0.2797088623046875, 0.2964363098144531, 0.31316375732421875, 0.3298912048339844, 0.34661865234375, 0.3633460998535156, 0.38007354736328125, 0.3968009948730469, 0.4135284423828125, 0.4302558898925781, 0.44698333740234375, 0.4637107849121094, 0.480438232421875, 0.4971656799316406, 0.5138931274414062, 0.5306205749511719, 0.5473480224609375, 0.5640754699707031, 0.5808029174804688, 0.5975303649902344, 0.6142578125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 4.0, 14.0, 28.0, 32.0, 57.0, 76.0, 89.0, 137.0, 213.0, 225.0, 356.0, 531.0, 794.0, 1053.0, 1535.0, 2259.0, 3379.0, 5353.0, 8628.0, 15140.0, 29752.0, 76101.0, 625150.0, 175249.0, 48447.0, 21576.0, 11829.0, 6843.0, 4356.0, 2948.0, 1918.0, 1323.0, 901.0, 662.0, 468.0, 341.0, 216.0, 151.0, 127.0, 98.0, 54.0, 48.0, 30.0, 23.0, 13.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.794921875, -0.7706756591796875, -0.746429443359375, -0.7221832275390625, -0.69793701171875, -0.6736907958984375, -0.649444580078125, -0.6251983642578125, -0.6009521484375, -0.5767059326171875, -0.552459716796875, -0.5282135009765625, -0.50396728515625, -0.4797210693359375, -0.455474853515625, -0.4312286376953125, -0.406982421875, -0.3827362060546875, -0.358489990234375, -0.3342437744140625, -0.30999755859375, -0.2857513427734375, -0.261505126953125, -0.2372589111328125, -0.2130126953125, -0.1887664794921875, -0.164520263671875, -0.1402740478515625, -0.11602783203125, -0.0917816162109375, -0.067535400390625, -0.0432891845703125, -0.01904296875, 0.0052032470703125, 0.029449462890625, 0.0536956787109375, 0.07794189453125, 0.1021881103515625, 0.126434326171875, 0.1506805419921875, 0.1749267578125, 0.1991729736328125, 0.223419189453125, 0.2476654052734375, 0.27191162109375, 0.2961578369140625, 0.320404052734375, 0.3446502685546875, 0.368896484375, 0.3931427001953125, 0.417388916015625, 0.4416351318359375, 0.46588134765625, 0.4901275634765625, 0.514373779296875, 0.5386199951171875, 0.5628662109375, 0.5871124267578125, 0.611358642578125, 0.6356048583984375, 0.65985107421875, 0.6840972900390625, 0.708343505859375, 0.7325897216796875, 0.7568359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 15.0, 17.0, 17.0, 32.0, 37.0, 48.0, 69.0, 152.0, 231.0, 78.0, 60.0, 43.0, 36.0, 30.0, 14.0, 16.0, 13.0, 12.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9073486328125e-05, -1.8417835235595703e-05, -1.7762184143066406e-05, -1.710653305053711e-05, -1.6450881958007812e-05, -1.5795230865478516e-05, -1.5139579772949219e-05, -1.4483928680419922e-05, -1.3828277587890625e-05, -1.3172626495361328e-05, -1.2516975402832031e-05, -1.1861324310302734e-05, -1.1205673217773438e-05, -1.055002212524414e-05, -9.894371032714844e-06, -9.238719940185547e-06, -8.58306884765625e-06, -7.927417755126953e-06, -7.271766662597656e-06, -6.616115570068359e-06, -5.9604644775390625e-06, -5.304813385009766e-06, -4.649162292480469e-06, -3.993511199951172e-06, -3.337860107421875e-06, -2.682209014892578e-06, -2.0265579223632812e-06, -1.3709068298339844e-06, -7.152557373046875e-07, -5.960464477539063e-08, 5.960464477539062e-07, 1.2516975402832031e-06, 1.9073486328125e-06, 2.562999725341797e-06, 3.2186508178710938e-06, 3.874301910400391e-06, 4.5299530029296875e-06, 5.185604095458984e-06, 5.841255187988281e-06, 6.496906280517578e-06, 7.152557373046875e-06, 7.808208465576172e-06, 8.463859558105469e-06, 9.119510650634766e-06, 9.775161743164062e-06, 1.043081283569336e-05, 1.1086463928222656e-05, 1.1742115020751953e-05, 1.239776611328125e-05, 1.3053417205810547e-05, 1.3709068298339844e-05, 1.436471939086914e-05, 1.5020370483398438e-05, 1.5676021575927734e-05, 1.633167266845703e-05, 1.6987323760986328e-05, 1.7642974853515625e-05, 1.8298625946044922e-05, 1.895427703857422e-05, 1.9609928131103516e-05, 2.0265579223632812e-05, 2.092123031616211e-05, 2.1576881408691406e-05, 2.2232532501220703e-05, 2.288818359375e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 7.0, 21.0, 27.0, 35.0, 57.0, 66.0, 92.0, 188.0, 185.0, 338.0, 536.0, 916.0, 1250.0, 2090.0, 3406.0, 5448.0, 9118.0, 16304.0, 33389.0, 97461.0, 678363.0, 118274.0, 37548.0, 18050.0, 9961.0, 5778.0, 3511.0, 2198.0, 1333.0, 866.0, 603.0, 414.0, 197.0, 148.0, 120.0, 94.0, 55.0, 25.0, 23.0, 16.0, 13.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8585433959960938, -0.8313446044921875, -0.8041458129882812, -0.776947021484375, -0.7497482299804688, -0.7225494384765625, -0.6953506469726562, -0.66815185546875, -0.6409530639648438, -0.6137542724609375, -0.5865554809570312, -0.559356689453125, -0.5321578979492188, -0.5049591064453125, -0.47776031494140625, -0.4505615234375, -0.42336273193359375, -0.3961639404296875, -0.36896514892578125, -0.341766357421875, -0.31456756591796875, -0.2873687744140625, -0.26016998291015625, -0.23297119140625, -0.20577239990234375, -0.1785736083984375, -0.15137481689453125, -0.124176025390625, -0.09697723388671875, -0.0697784423828125, -0.04257965087890625, -0.015380859375, 0.01181793212890625, 0.0390167236328125, 0.06621551513671875, 0.093414306640625, 0.12061309814453125, 0.1478118896484375, 0.17501068115234375, 0.20220947265625, 0.22940826416015625, 0.2566070556640625, 0.28380584716796875, 0.311004638671875, 0.33820343017578125, 0.3654022216796875, 0.39260101318359375, 0.4197998046875, 0.44699859619140625, 0.4741973876953125, 0.5013961791992188, 0.528594970703125, 0.5557937622070312, 0.5829925537109375, 0.6101913452148438, 0.63739013671875, 0.6645889282226562, 0.6917877197265625, 0.7189865112304688, 0.746185302734375, 0.7733840942382812, 0.8005828857421875, 0.8277816772460938, 0.85498046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 6.0, 7.0, 6.0, 9.0, 6.0, 17.0, 21.0, 20.0, 23.0, 53.0, 70.0, 75.0, 298.0, 86.0, 56.0, 48.0, 29.0, 18.0, 17.0, 17.0, 14.0, 12.0, 7.0, 15.0, 7.0, 11.0, 6.0, 1.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1964111328125, -0.1897144317626953, -0.18301773071289062, -0.17632102966308594, -0.16962432861328125, -0.16292762756347656, -0.15623092651367188, -0.1495342254638672, -0.1428375244140625, -0.1361408233642578, -0.12944412231445312, -0.12274742126464844, -0.11605072021484375, -0.10935401916503906, -0.10265731811523438, -0.09596061706542969, -0.089263916015625, -0.08256721496582031, -0.07587051391601562, -0.06917381286621094, -0.06247711181640625, -0.05578041076660156, -0.049083709716796875, -0.04238700866699219, -0.0356903076171875, -0.028993606567382812, -0.022296905517578125, -0.015600204467773438, -0.00890350341796875, -0.0022068023681640625, 0.004489898681640625, 0.011186599731445312, 0.01788330078125, 0.024580001831054688, 0.031276702880859375, 0.03797340393066406, 0.04467010498046875, 0.05136680603027344, 0.058063507080078125, 0.06476020812988281, 0.0714569091796875, 0.07815361022949219, 0.08485031127929688, 0.09154701232910156, 0.09824371337890625, 0.10494041442871094, 0.11163711547851562, 0.11833381652832031, 0.125030517578125, 0.1317272186279297, 0.13842391967773438, 0.14512062072753906, 0.15181732177734375, 0.15851402282714844, 0.16521072387695312, 0.1719074249267578, 0.1786041259765625, 0.1853008270263672, 0.19199752807617188, 0.19869422912597656, 0.20539093017578125, 0.21208763122558594, 0.21878433227539062, 0.2254810333251953, 0.232177734375]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 11.0, 11.0, 13.0, 21.0, 26.0, 44.0, 63.0, 94.0, 121.0, 141.0, 110.0, 91.0, 56.0, 40.0, 32.0, 28.0, 22.0, 14.0, 16.0, 12.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.494354248046875, -1.4522393941879272, -1.4101245403289795, -1.3680098056793213, -1.3258949518203735, -1.2837800979614258, -1.241665244102478, -1.1995503902435303, -1.157435655593872, -1.1153208017349243, -1.0732059478759766, -1.0310912132263184, -0.9889763593673706, -0.9468615055084229, -0.9047466516494751, -0.8626317977905273, -0.8205169439315796, -0.7784020900726318, -0.7362872958183289, -0.6941724419593811, -0.6520576477050781, -0.6099427938461304, -0.5678279399871826, -0.5257130861282349, -0.4835982918739319, -0.4414834678173065, -0.39936864376068115, -0.3572537899017334, -0.31513896584510803, -0.27302414178848267, -0.2309092879295349, -0.18879446387290955, -0.14667952060699463, -0.10456468909978867, -0.0624498575925827, -0.020335018634796143, 0.021779805421829224, 0.06389462947845459, 0.10600948333740234, 0.1481243073940277, 0.19023913145065308, 0.23235395550727844, 0.2744687795639038, 0.31658363342285156, 0.35869845747947693, 0.4008132815361023, 0.44292813539505005, 0.4850429594516754, 0.5271577835083008, 0.5692726373672485, 0.6113874316215515, 0.6535022854804993, 0.6956170797348022, 0.73773193359375, 0.7798467874526978, 0.8219616413116455, 0.8640764355659485, 0.9061912894248962, 0.9483060836791992, 0.990420937538147, 1.0325357913970947, 1.074650526046753, 1.1167654991149902, 1.1588802337646484, 1.2009950876235962]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 9.0, 14.0, 9.0, 17.0, 18.0, 10.0, 30.0, 23.0, 19.0, 27.0, 23.0, 31.0, 29.0, 29.0, 25.0, 20.0, 36.0, 44.0, 37.0, 41.0, 43.0, 38.0, 38.0, 28.0, 38.0, 21.0, 32.0, 26.0, 27.0, 28.0, 17.0, 23.0, 18.0, 22.0, 8.0, 10.0, 9.0, 9.0, 10.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.6485298275947571, -0.6287035942077637, -0.6088773608207703, -0.5890511274337769, -0.5692248940467834, -0.54939866065979, -0.5295724272727966, -0.5097461938858032, -0.4899199903011322, -0.4700937569141388, -0.4502675235271454, -0.430441290140152, -0.41061508655548096, -0.39078885316848755, -0.37096261978149414, -0.35113638639450073, -0.3313101530075073, -0.3114839196205139, -0.2916576862335205, -0.2718314528465271, -0.2520052194595337, -0.23217900097370148, -0.21235278248786926, -0.19252654910087585, -0.17270031571388245, -0.15287408232688904, -0.13304784893989563, -0.11322163045406342, -0.09339539706707001, -0.0735691636800766, -0.05374293774366379, -0.03391671180725098, -0.014090538024902344, 0.005735691636800766, 0.025561921298503876, 0.045388150960206985, 0.0652143806219101, 0.0850406140089035, 0.10486683994531631, 0.12469306588172913, 0.14451929926872253, 0.16434553265571594, 0.18417176604270935, 0.20399798452854156, 0.22382421791553497, 0.24365045130252838, 0.2634766697883606, 0.283302903175354, 0.3031291365623474, 0.3229553699493408, 0.34278160333633423, 0.36260783672332764, 0.38243407011032104, 0.40226030349731445, 0.4220865070819855, 0.4419127404689789, 0.4617389738559723, 0.4815652072429657, 0.5013914108276367, 0.5212176442146301, 0.5410438776016235, 0.5608701109886169, 0.5806963443756104, 0.6005225777626038, 0.6203488111495972]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 22.0, 32.0, 47.0, 56.0, 99.0, 151.0, 190.0, 254.0, 360.0, 518.0, 687.0, 1036.0, 1398.0, 2081.0, 2906.0, 4400.0, 6342.0, 9829.0, 15349.0, 24160.0, 40745.0, 70161.0, 128735.0, 265407.0, 798388.0, 1628113.0, 663968.0, 248076.0, 118941.0, 64203.0, 36573.0, 22088.0, 13625.0, 8637.0, 5594.0, 3635.0, 2485.0, 1713.0, 1101.0, 744.0, 519.0, 347.0, 182.0, 134.0, 90.0, 50.0, 33.0, 17.0, 15.0, 8.0, 10.0, 13.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.90185546875, -0.8731536865234375, -0.844451904296875, -0.8157501220703125, -0.78704833984375, -0.7583465576171875, -0.729644775390625, -0.7009429931640625, -0.6722412109375, -0.6435394287109375, -0.614837646484375, -0.5861358642578125, -0.55743408203125, -0.5287322998046875, -0.500030517578125, -0.4713287353515625, -0.442626953125, -0.4139251708984375, -0.385223388671875, -0.3565216064453125, -0.32781982421875, -0.2991180419921875, -0.270416259765625, -0.2417144775390625, -0.2130126953125, -0.1843109130859375, -0.155609130859375, -0.1269073486328125, -0.09820556640625, -0.0695037841796875, -0.040802001953125, -0.0121002197265625, 0.0166015625, 0.0453033447265625, 0.074005126953125, 0.1027069091796875, 0.13140869140625, 0.1601104736328125, 0.188812255859375, 0.2175140380859375, 0.2462158203125, 0.2749176025390625, 0.303619384765625, 0.3323211669921875, 0.36102294921875, 0.3897247314453125, 0.418426513671875, 0.4471282958984375, 0.475830078125, 0.5045318603515625, 0.533233642578125, 0.5619354248046875, 0.59063720703125, 0.6193389892578125, 0.648040771484375, 0.6767425537109375, 0.7054443359375, 0.7341461181640625, 0.762847900390625, 0.7915496826171875, 0.82025146484375, 0.8489532470703125, 0.877655029296875, 0.9063568115234375, 0.93505859375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 5.0, 13.0, 8.0, 7.0, 6.0, 11.0, 8.0, 15.0, 20.0, 21.0, 24.0, 19.0, 19.0, 26.0, 33.0, 30.0, 27.0, 29.0, 32.0, 33.0, 35.0, 38.0, 39.0, 38.0, 39.0, 35.0, 30.0, 27.0, 34.0, 28.0, 34.0, 20.0, 31.0, 21.0, 19.0, 22.0, 20.0, 16.0, 10.0, 14.0, 6.0, 10.0, 7.0, 7.0, 8.0, 4.0, 1.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.41650390625, -0.40410614013671875, -0.3917083740234375, -0.37931060791015625, -0.366912841796875, -0.35451507568359375, -0.3421173095703125, -0.32971954345703125, -0.31732177734375, -0.30492401123046875, -0.2925262451171875, -0.28012847900390625, -0.267730712890625, -0.25533294677734375, -0.2429351806640625, -0.23053741455078125, -0.2181396484375, -0.20574188232421875, -0.1933441162109375, -0.18094635009765625, -0.168548583984375, -0.15615081787109375, -0.1437530517578125, -0.13135528564453125, -0.11895751953125, -0.10655975341796875, -0.0941619873046875, -0.08176422119140625, -0.069366455078125, -0.05696868896484375, -0.0445709228515625, -0.03217315673828125, -0.019775390625, -0.00737762451171875, 0.0050201416015625, 0.01741790771484375, 0.029815673828125, 0.04221343994140625, 0.0546112060546875, 0.06700897216796875, 0.07940673828125, 0.09180450439453125, 0.1042022705078125, 0.11660003662109375, 0.128997802734375, 0.14139556884765625, 0.1537933349609375, 0.16619110107421875, 0.1785888671875, 0.19098663330078125, 0.2033843994140625, 0.21578216552734375, 0.228179931640625, 0.24057769775390625, 0.2529754638671875, 0.26537322998046875, 0.27777099609375, 0.29016876220703125, 0.3025665283203125, 0.31496429443359375, 0.327362060546875, 0.33975982666015625, 0.3521575927734375, 0.36455535888671875, 0.376953125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 13.0, 18.0, 25.0, 46.0, 60.0, 97.0, 137.0, 193.0, 304.0, 438.0, 683.0, 1071.0, 1493.0, 2395.0, 3457.0, 5415.0, 8223.0, 12932.0, 20387.0, 33247.0, 54705.0, 94647.0, 173684.0, 351813.0, 827249.0, 1363628.0, 615552.0, 276198.0, 141800.0, 79676.0, 46643.0, 28201.0, 17712.0, 11090.0, 7097.0, 4769.0, 3104.0, 2023.0, 1329.0, 899.0, 620.0, 395.0, 274.0, 151.0, 125.0, 87.0, 57.0, 45.0, 24.0, 19.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.74365234375, -0.7206573486328125, -0.697662353515625, -0.6746673583984375, -0.65167236328125, -0.6286773681640625, -0.605682373046875, -0.5826873779296875, -0.5596923828125, -0.5366973876953125, -0.513702392578125, -0.4907073974609375, -0.46771240234375, -0.4447174072265625, -0.421722412109375, -0.3987274169921875, -0.375732421875, -0.3527374267578125, -0.329742431640625, -0.3067474365234375, -0.28375244140625, -0.2607574462890625, -0.237762451171875, -0.2147674560546875, -0.1917724609375, -0.1687774658203125, -0.145782470703125, -0.1227874755859375, -0.09979248046875, -0.0767974853515625, -0.053802490234375, -0.0308074951171875, -0.0078125, 0.0151824951171875, 0.038177490234375, 0.0611724853515625, 0.08416748046875, 0.1071624755859375, 0.130157470703125, 0.1531524658203125, 0.1761474609375, 0.1991424560546875, 0.222137451171875, 0.2451324462890625, 0.26812744140625, 0.2911224365234375, 0.314117431640625, 0.3371124267578125, 0.360107421875, 0.3831024169921875, 0.406097412109375, 0.4290924072265625, 0.45208740234375, 0.4750823974609375, 0.498077392578125, 0.5210723876953125, 0.5440673828125, 0.5670623779296875, 0.590057373046875, 0.6130523681640625, 0.63604736328125, 0.6590423583984375, 0.682037353515625, 0.7050323486328125, 0.72802734375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 16.0, 22.0, 18.0, 26.0, 30.0, 40.0, 53.0, 76.0, 62.0, 102.0, 106.0, 106.0, 145.0, 181.0, 201.0, 217.0, 238.0, 271.0, 252.0, 259.0, 220.0, 219.0, 206.0, 182.0, 149.0, 134.0, 107.0, 89.0, 67.0, 46.0, 55.0, 33.0, 41.0, 18.0, 18.0, 16.0, 10.0, 2.0, 11.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.249481201171875, -0.24188232421875, -0.234283447265625, -0.2266845703125, -0.219085693359375, -0.21148681640625, -0.203887939453125, -0.1962890625, -0.188690185546875, -0.18109130859375, -0.173492431640625, -0.1658935546875, -0.158294677734375, -0.15069580078125, -0.143096923828125, -0.135498046875, -0.127899169921875, -0.12030029296875, -0.112701416015625, -0.1051025390625, -0.097503662109375, -0.08990478515625, -0.082305908203125, -0.07470703125, -0.067108154296875, -0.05950927734375, -0.051910400390625, -0.0443115234375, -0.036712646484375, -0.02911376953125, -0.021514892578125, -0.013916015625, -0.006317138671875, 0.00128173828125, 0.008880615234375, 0.0164794921875, 0.024078369140625, 0.03167724609375, 0.039276123046875, 0.046875, 0.054473876953125, 0.06207275390625, 0.069671630859375, 0.0772705078125, 0.084869384765625, 0.09246826171875, 0.100067138671875, 0.107666015625, 0.115264892578125, 0.12286376953125, 0.130462646484375, 0.1380615234375, 0.145660400390625, 0.15325927734375, 0.160858154296875, 0.16845703125, 0.176055908203125, 0.18365478515625, 0.191253662109375, 0.1988525390625, 0.206451416015625, 0.21405029296875, 0.221649169921875, 0.229248046875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 8.0, 15.0, 17.0, 17.0, 15.0, 35.0, 53.0, 52.0, 94.0, 114.0, 126.0, 116.0, 88.0, 49.0, 52.0, 32.0, 21.0, 16.0, 24.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9037691950798035, -0.8759884238243103, -0.8482075929641724, -0.8204268217086792, -0.792646050453186, -0.7648652791976929, -0.7370844483375549, -0.7093036770820618, -0.6815229058265686, -0.6537421345710754, -0.6259613037109375, -0.5981805324554443, -0.5703997611999512, -0.542618989944458, -0.5148381590843201, -0.4870573878288269, -0.45927658677101135, -0.4314957857131958, -0.40371501445770264, -0.3759342133998871, -0.3481534421443939, -0.32037264108657837, -0.2925918698310852, -0.26481106877326965, -0.2370302826166153, -0.20924949645996094, -0.18146871030330658, -0.15368792414665222, -0.12590712308883667, -0.09812633693218231, -0.07034555077552795, -0.042564764618873596, -0.014783978462219238, 0.012996809557080269, 0.040777597576379776, 0.06855838745832443, 0.09633917361497879, 0.12411996722221375, 0.1519007533788681, 0.17968153953552246, 0.20746232569217682, 0.23524311184883118, 0.26302391290664673, 0.2908046841621399, 0.31858548521995544, 0.346366286277771, 0.37414705753326416, 0.4019278287887573, 0.4297086298465729, 0.4574894309043884, 0.4852702021598816, 0.5130509734153748, 0.5408318042755127, 0.5686125755310059, 0.596393346786499, 0.6241741180419922, 0.6519549489021301, 0.6797357201576233, 0.7075165510177612, 0.7352973222732544, 0.7630780935287476, 0.7908588647842407, 0.8186396956443787, 0.8464204668998718, 0.874201238155365]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 9.0, 7.0, 11.0, 10.0, 7.0, 9.0, 16.0, 14.0, 18.0, 17.0, 17.0, 23.0, 24.0, 32.0, 21.0, 28.0, 43.0, 33.0, 35.0, 40.0, 45.0, 49.0, 43.0, 29.0, 32.0, 37.0, 31.0, 27.0, 26.0, 38.0, 28.0, 14.0, 26.0, 29.0, 23.0, 18.0, 19.0, 12.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5099623799324036, -0.49492689967155457, -0.4798913896083832, -0.4648559093475342, -0.4498203992843628, -0.4347849190235138, -0.4197494387626648, -0.4047139286994934, -0.389678418636322, -0.374642938375473, -0.35960742831230164, -0.34457194805145264, -0.32953643798828125, -0.31450095772743225, -0.29946547746658325, -0.28442996740341187, -0.26939448714256287, -0.25435900688171387, -0.23932349681854248, -0.22428801655769348, -0.2092525064945221, -0.1942170262336731, -0.1791815310716629, -0.1641460359096527, -0.14911054074764252, -0.13407504558563232, -0.11903955042362213, -0.10400406271219254, -0.08896856755018234, -0.07393307238817215, -0.058897584676742554, -0.04386208951473236, -0.028826594352722168, -0.013791101053357124, 0.0012443922460079193, 0.016279883682727814, 0.03131537884473801, 0.0463508740067482, 0.061386361718177795, 0.07642185688018799, 0.09145735204219818, 0.10649284720420837, 0.12152834236621857, 0.13656383752822876, 0.15159931778907776, 0.16663482785224915, 0.18167030811309814, 0.19670580327510834, 0.21174129843711853, 0.22677679359912872, 0.24181228876113892, 0.2568477690219879, 0.2718832790851593, 0.2869187593460083, 0.3019542694091797, 0.3169897496700287, 0.3320252299308777, 0.3470607101917267, 0.36209622025489807, 0.37713170051574707, 0.39216721057891846, 0.40720269083976746, 0.42223817110061646, 0.43727368116378784, 0.45230919122695923]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 16.0, 13.0, 27.0, 31.0, 45.0, 80.0, 117.0, 147.0, 220.0, 303.0, 496.0, 813.0, 1238.0, 1976.0, 3070.0, 4990.0, 8050.0, 13453.0, 23030.0, 42114.0, 83780.0, 200446.0, 362019.0, 149823.0, 67425.0, 35020.0, 19610.0, 11529.0, 6769.0, 4386.0, 2655.0, 1668.0, 1099.0, 685.0, 491.0, 299.0, 204.0, 126.0, 73.0, 56.0, 48.0, 33.0, 21.0, 16.0, 9.0, 10.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4130859375, -0.39947509765625, -0.3858642578125, -0.37225341796875, -0.358642578125, -0.34503173828125, -0.3314208984375, -0.31781005859375, -0.30419921875, -0.29058837890625, -0.2769775390625, -0.26336669921875, -0.249755859375, -0.23614501953125, -0.2225341796875, -0.20892333984375, -0.1953125, -0.18170166015625, -0.1680908203125, -0.15447998046875, -0.140869140625, -0.12725830078125, -0.1136474609375, -0.10003662109375, -0.08642578125, -0.07281494140625, -0.0592041015625, -0.04559326171875, -0.031982421875, -0.01837158203125, -0.0047607421875, 0.00885009765625, 0.0224609375, 0.03607177734375, 0.0496826171875, 0.06329345703125, 0.076904296875, 0.09051513671875, 0.1041259765625, 0.11773681640625, 0.13134765625, 0.14495849609375, 0.1585693359375, 0.17218017578125, 0.185791015625, 0.19940185546875, 0.2130126953125, 0.22662353515625, 0.240234375, 0.25384521484375, 0.2674560546875, 0.28106689453125, 0.294677734375, 0.30828857421875, 0.3218994140625, 0.33551025390625, 0.34912109375, 0.36273193359375, 0.3763427734375, 0.38995361328125, 0.403564453125, 0.41717529296875, 0.4307861328125, 0.44439697265625, 0.4580078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 5.0, 9.0, 12.0, 6.0, 6.0, 8.0, 13.0, 18.0, 15.0, 20.0, 21.0, 28.0, 29.0, 40.0, 25.0, 31.0, 36.0, 35.0, 48.0, 46.0, 48.0, 39.0, 36.0, 35.0, 38.0, 28.0, 34.0, 38.0, 27.0, 29.0, 19.0, 24.0, 25.0, 23.0, 20.0, 14.0, 14.0, 8.0, 13.0, 9.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.56591796875, -0.5498428344726562, -0.5337677001953125, -0.5176925659179688, -0.501617431640625, -0.48554229736328125, -0.4694671630859375, -0.45339202880859375, -0.43731689453125, -0.42124176025390625, -0.4051666259765625, -0.38909149169921875, -0.373016357421875, -0.35694122314453125, -0.3408660888671875, -0.32479095458984375, -0.3087158203125, -0.29264068603515625, -0.2765655517578125, -0.26049041748046875, -0.244415283203125, -0.22834014892578125, -0.2122650146484375, -0.19618988037109375, -0.18011474609375, -0.16403961181640625, -0.1479644775390625, -0.13188934326171875, -0.115814208984375, -0.09973907470703125, -0.0836639404296875, -0.06758880615234375, -0.051513671875, -0.03543853759765625, -0.0193634033203125, -0.00328826904296875, 0.012786865234375, 0.02886199951171875, 0.0449371337890625, 0.06101226806640625, 0.07708740234375, 0.09316253662109375, 0.1092376708984375, 0.12531280517578125, 0.141387939453125, 0.15746307373046875, 0.1735382080078125, 0.18961334228515625, 0.2056884765625, 0.22176361083984375, 0.2378387451171875, 0.25391387939453125, 0.269989013671875, 0.28606414794921875, 0.3021392822265625, 0.31821441650390625, 0.33428955078125, 0.35036468505859375, 0.3664398193359375, 0.38251495361328125, 0.398590087890625, 0.41466522216796875, 0.4307403564453125, 0.44681549072265625, 0.462890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 8.0, 9.0, 20.0, 25.0, 39.0, 58.0, 67.0, 104.0, 141.0, 187.0, 293.0, 398.0, 579.0, 876.0, 1195.0, 1774.0, 2697.0, 4315.0, 7242.0, 13099.0, 28314.0, 93432.0, 673731.0, 146395.0, 35380.0, 15710.0, 8262.0, 4924.0, 3043.0, 1875.0, 1304.0, 914.0, 602.0, 457.0, 331.0, 200.0, 151.0, 122.0, 87.0, 51.0, 35.0, 33.0, 20.0, 19.0, 10.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.71533203125, -0.6940536499023438, -0.6727752685546875, -0.6514968872070312, -0.630218505859375, -0.6089401245117188, -0.5876617431640625, -0.5663833618164062, -0.54510498046875, -0.5238265991210938, -0.5025482177734375, -0.48126983642578125, -0.459991455078125, -0.43871307373046875, -0.4174346923828125, -0.39615631103515625, -0.3748779296875, -0.35359954833984375, -0.3323211669921875, -0.31104278564453125, -0.289764404296875, -0.26848602294921875, -0.2472076416015625, -0.22592926025390625, -0.20465087890625, -0.18337249755859375, -0.1620941162109375, -0.14081573486328125, -0.119537353515625, -0.09825897216796875, -0.0769805908203125, -0.05570220947265625, -0.034423828125, -0.01314544677734375, 0.0081329345703125, 0.02941131591796875, 0.050689697265625, 0.07196807861328125, 0.0932464599609375, 0.11452484130859375, 0.13580322265625, 0.15708160400390625, 0.1783599853515625, 0.19963836669921875, 0.220916748046875, 0.24219512939453125, 0.2634735107421875, 0.28475189208984375, 0.3060302734375, 0.32730865478515625, 0.3485870361328125, 0.36986541748046875, 0.391143798828125, 0.41242218017578125, 0.4337005615234375, 0.45497894287109375, 0.47625732421875, 0.49753570556640625, 0.5188140869140625, 0.5400924682617188, 0.561370849609375, 0.5826492309570312, 0.6039276123046875, 0.6252059936523438, 0.646484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 8.0, 4.0, 7.0, 16.0, 18.0, 11.0, 15.0, 21.0, 22.0, 33.0, 24.0, 15.0, 30.0, 38.0, 40.0, 42.0, 34.0, 40.0, 26.0, 43.0, 31.0, 44.0, 53.0, 40.0, 40.0, 35.0, 34.0, 33.0, 27.0, 19.0, 20.0, 16.0, 23.0, 9.0, 18.0, 14.0, 11.0, 7.0, 7.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.34375, -0.3334503173828125, -0.323150634765625, -0.3128509521484375, -0.30255126953125, -0.2922515869140625, -0.281951904296875, -0.2716522216796875, -0.2613525390625, -0.2510528564453125, -0.240753173828125, -0.2304534912109375, -0.22015380859375, -0.2098541259765625, -0.199554443359375, -0.1892547607421875, -0.178955078125, -0.1686553955078125, -0.158355712890625, -0.1480560302734375, -0.13775634765625, -0.1274566650390625, -0.117156982421875, -0.1068572998046875, -0.0965576171875, -0.0862579345703125, -0.075958251953125, -0.0656585693359375, -0.05535888671875, -0.0450592041015625, -0.034759521484375, -0.0244598388671875, -0.01416015625, -0.0038604736328125, 0.006439208984375, 0.0167388916015625, 0.02703857421875, 0.0373382568359375, 0.047637939453125, 0.0579376220703125, 0.0682373046875, 0.0785369873046875, 0.088836669921875, 0.0991363525390625, 0.10943603515625, 0.1197357177734375, 0.130035400390625, 0.1403350830078125, 0.150634765625, 0.1609344482421875, 0.171234130859375, 0.1815338134765625, 0.19183349609375, 0.2021331787109375, 0.212432861328125, 0.2227325439453125, 0.2330322265625, 0.2433319091796875, 0.253631591796875, 0.2639312744140625, 0.27423095703125, 0.2845306396484375, 0.294830322265625, 0.3051300048828125, 0.3154296875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 14.0, 25.0, 28.0, 38.0, 53.0, 74.0, 119.0, 132.0, 172.0, 256.0, 367.0, 486.0, 691.0, 917.0, 1302.0, 2010.0, 3162.0, 5065.0, 9110.0, 17871.0, 40556.0, 126376.0, 635452.0, 123087.0, 39370.0, 17708.0, 9089.0, 5217.0, 3189.0, 2072.0, 1297.0, 908.0, 607.0, 470.0, 354.0, 233.0, 193.0, 125.0, 89.0, 77.0, 54.0, 35.0, 22.0, 20.0, 13.0, 7.0, 9.0, 3.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.08941650390625, -0.08648395538330078, -0.08355140686035156, -0.08061885833740234, -0.07768630981445312, -0.0747537612915039, -0.07182121276855469, -0.06888866424560547, -0.06595611572265625, -0.06302356719970703, -0.06009101867675781, -0.057158470153808594, -0.054225921630859375, -0.051293373107910156, -0.04836082458496094, -0.04542827606201172, -0.0424957275390625, -0.03956317901611328, -0.03663063049316406, -0.033698081970214844, -0.030765533447265625, -0.027832984924316406, -0.024900436401367188, -0.02196788787841797, -0.01903533935546875, -0.01610279083251953, -0.013170242309570312, -0.010237693786621094, -0.007305145263671875, -0.004372596740722656, -0.0014400482177734375, 0.0014925003051757812, 0.004425048828125, 0.007357597351074219, 0.010290145874023438, 0.013222694396972656, 0.016155242919921875, 0.019087791442871094, 0.022020339965820312, 0.02495288848876953, 0.02788543701171875, 0.03081798553466797, 0.03375053405761719, 0.036683082580566406, 0.039615631103515625, 0.042548179626464844, 0.04548072814941406, 0.04841327667236328, 0.0513458251953125, 0.05427837371826172, 0.05721092224121094, 0.060143470764160156, 0.06307601928710938, 0.0660085678100586, 0.06894111633300781, 0.07187366485595703, 0.07480621337890625, 0.07773876190185547, 0.08067131042480469, 0.0836038589477539, 0.08653640747070312, 0.08946895599365234, 0.09240150451660156, 0.09533405303955078, 0.0982666015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 2.0, 9.0, 8.0, 17.0, 6.0, 16.0, 20.0, 22.0, 27.0, 22.0, 37.0, 83.0, 64.0, 68.0, 66.0, 141.0, 83.0, 51.0, 54.0, 36.0, 42.0, 19.0, 18.0, 18.0, 14.0, 11.0, 7.0, 6.0, 4.0, 6.0, 0.0, 0.0, 0.0, 7.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.76837158203125e-06, -4.636123776435852e-06, -4.503875970840454e-06, -4.371628165245056e-06, -4.239380359649658e-06, -4.10713255405426e-06, -3.974884748458862e-06, -3.842636942863464e-06, -3.7103891372680664e-06, -3.5781413316726685e-06, -3.4458935260772705e-06, -3.3136457204818726e-06, -3.1813979148864746e-06, -3.0491501092910767e-06, -2.9169023036956787e-06, -2.7846544981002808e-06, -2.652406692504883e-06, -2.520158886909485e-06, -2.387911081314087e-06, -2.255663275718689e-06, -2.123415470123291e-06, -1.991167664527893e-06, -1.8589198589324951e-06, -1.7266720533370972e-06, -1.5944242477416992e-06, -1.4621764421463013e-06, -1.3299286365509033e-06, -1.1976808309555054e-06, -1.0654330253601074e-06, -9.331852197647095e-07, -8.009374141693115e-07, -6.686896085739136e-07, -5.364418029785156e-07, -4.041939973831177e-07, -2.7194619178771973e-07, -1.3969838619232178e-07, -7.450580596923828e-09, 1.2479722499847412e-07, 2.5704503059387207e-07, 3.8929283618927e-07, 5.21540641784668e-07, 6.537884473800659e-07, 7.860362529754639e-07, 9.182840585708618e-07, 1.0505318641662598e-06, 1.1827796697616577e-06, 1.3150274753570557e-06, 1.4472752809524536e-06, 1.5795230865478516e-06, 1.7117708921432495e-06, 1.8440186977386475e-06, 1.9762665033340454e-06, 2.1085143089294434e-06, 2.2407621145248413e-06, 2.3730099201202393e-06, 2.505257725715637e-06, 2.637505531311035e-06, 2.769753336906433e-06, 2.902001142501831e-06, 3.034248948097229e-06, 3.166496753692627e-06, 3.298744559288025e-06, 3.430992364883423e-06, 3.563240170478821e-06, 3.6954879760742188e-06]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 11.0, 10.0, 22.0, 43.0, 43.0, 57.0, 86.0, 143.0, 216.0, 388.0, 597.0, 885.0, 1475.0, 2472.0, 4073.0, 7176.0, 12653.0, 23852.0, 49382.0, 119409.0, 435768.0, 233603.0, 78666.0, 35698.0, 17996.0, 9776.0, 5616.0, 3267.0, 1892.0, 1201.0, 773.0, 459.0, 303.0, 188.0, 116.0, 76.0, 37.0, 44.0, 42.0, 20.0, 9.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08151912689208984, -0.07887077331542969, -0.07622241973876953, -0.07357406616210938, -0.07092571258544922, -0.06827735900878906, -0.0656290054321289, -0.06298065185546875, -0.060332298278808594, -0.05768394470214844, -0.05503559112548828, -0.052387237548828125, -0.04973888397216797, -0.04709053039550781, -0.044442176818847656, -0.0417938232421875, -0.039145469665527344, -0.03649711608886719, -0.03384876251220703, -0.031200408935546875, -0.02855205535888672, -0.025903701782226562, -0.023255348205566406, -0.02060699462890625, -0.017958641052246094, -0.015310287475585938, -0.012661933898925781, -0.010013580322265625, -0.007365226745605469, -0.0047168731689453125, -0.0020685195922851562, 0.000579833984375, 0.0032281875610351562, 0.0058765411376953125, 0.008524894714355469, 0.011173248291015625, 0.013821601867675781, 0.016469955444335938, 0.019118309020996094, 0.02176666259765625, 0.024415016174316406, 0.027063369750976562, 0.02971172332763672, 0.032360076904296875, 0.03500843048095703, 0.03765678405761719, 0.040305137634277344, 0.0429534912109375, 0.045601844787597656, 0.04825019836425781, 0.05089855194091797, 0.053546905517578125, 0.05619525909423828, 0.05884361267089844, 0.061491966247558594, 0.06414031982421875, 0.0667886734008789, 0.06943702697753906, 0.07208538055419922, 0.07473373413085938, 0.07738208770751953, 0.08003044128417969, 0.08267879486083984, 0.0853271484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 6.0, 2.0, 12.0, 6.0, 19.0, 17.0, 26.0, 27.0, 30.0, 50.0, 64.0, 107.0, 168.0, 146.0, 82.0, 61.0, 34.0, 30.0, 20.0, 10.0, 15.0, 11.0, 17.0, 4.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0394287109375, -0.038153648376464844, -0.03687858581542969, -0.03560352325439453, -0.034328460693359375, -0.03305339813232422, -0.03177833557128906, -0.030503273010253906, -0.02922821044921875, -0.027953147888183594, -0.026678085327148438, -0.02540302276611328, -0.024127960205078125, -0.02285289764404297, -0.021577835083007812, -0.020302772521972656, -0.0190277099609375, -0.017752647399902344, -0.016477584838867188, -0.015202522277832031, -0.013927459716796875, -0.012652397155761719, -0.011377334594726562, -0.010102272033691406, -0.00882720947265625, -0.007552146911621094, -0.0062770843505859375, -0.005002021789550781, -0.003726959228515625, -0.0024518966674804688, -0.0011768341064453125, 9.822845458984375e-05, 0.001373291015625, 0.0026483535766601562, 0.0039234161376953125, 0.005198478698730469, 0.006473541259765625, 0.007748603820800781, 0.009023666381835938, 0.010298728942871094, 0.01157379150390625, 0.012848854064941406, 0.014123916625976562, 0.015398979187011719, 0.016674041748046875, 0.01794910430908203, 0.019224166870117188, 0.020499229431152344, 0.0217742919921875, 0.023049354553222656, 0.024324417114257812, 0.02559947967529297, 0.026874542236328125, 0.02814960479736328, 0.029424667358398438, 0.030699729919433594, 0.03197479248046875, 0.033249855041503906, 0.03452491760253906, 0.03579998016357422, 0.037075042724609375, 0.03835010528564453, 0.03962516784667969, 0.040900230407714844, 0.04217529296875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 6.0, 11.0, 12.0, 17.0, 16.0, 12.0, 30.0, 33.0, 50.0, 47.0, 101.0, 124.0, 113.0, 125.0, 77.0, 52.0, 39.0, 34.0, 18.0, 26.0, 15.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8401376008987427, -0.813301146030426, -0.7864646911621094, -0.759628176689148, -0.7327917218208313, -0.7059552669525146, -0.6791187524795532, -0.6522822976112366, -0.6254458427429199, -0.5986093878746033, -0.5717729330062866, -0.5449364185333252, -0.5180999636650085, -0.4912635087966919, -0.46442702412605286, -0.4375905394554138, -0.41075408458709717, -0.3839176297187805, -0.3570811450481415, -0.33024466037750244, -0.3034082055091858, -0.27657175064086914, -0.2497352659702301, -0.22289879620075226, -0.19606232643127441, -0.16922585666179657, -0.14238938689231873, -0.11555291712284088, -0.08871644735336304, -0.06187997758388519, -0.03504350781440735, -0.008207038044929504, 0.018629491329193115, 0.04546596109867096, 0.0723024308681488, 0.09913890063762665, 0.1259753704071045, 0.15281184017658234, 0.17964830994606018, 0.20648477971553802, 0.23332124948501587, 0.2601577043533325, 0.28699418902397156, 0.3138306736946106, 0.34066712856292725, 0.3675035834312439, 0.39434006810188293, 0.421176552772522, 0.4480130076408386, 0.4748494625091553, 0.5016859769821167, 0.5285224318504333, 0.55535888671875, 0.5821953415870667, 0.6090317964553833, 0.6358683109283447, 0.6627047657966614, 0.689541220664978, 0.7163777351379395, 0.7432141900062561, 0.7700506448745728, 0.7968870997428894, 0.823723554611206, 0.8505600690841675, 0.8773965239524841]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 3.0, 9.0, 9.0, 12.0, 8.0, 6.0, 16.0, 16.0, 17.0, 9.0, 18.0, 25.0, 25.0, 22.0, 29.0, 26.0, 34.0, 38.0, 36.0, 39.0, 41.0, 49.0, 44.0, 35.0, 34.0, 30.0, 35.0, 28.0, 28.0, 36.0, 26.0, 27.0, 19.0, 29.0, 28.0, 21.0, 16.0, 13.0, 13.0, 10.0, 13.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5082613229751587, -0.4933927655220032, -0.47852417826652527, -0.46365562081336975, -0.44878706336021423, -0.43391847610473633, -0.4190499186515808, -0.4041813611984253, -0.3893127739429474, -0.37444421648979187, -0.35957562923431396, -0.34470707178115845, -0.32983851432800293, -0.314969927072525, -0.3001013696193695, -0.2852327823638916, -0.2703642249107361, -0.25549566745758057, -0.24062709510326385, -0.22575852274894714, -0.21088995039463043, -0.19602137804031372, -0.1811528205871582, -0.1662842482328415, -0.15141570568084717, -0.13654713332653046, -0.12167856842279434, -0.10681000351905823, -0.09194143116474152, -0.0770728662610054, -0.06220430135726929, -0.047335729002952576, -0.032467156648635864, -0.01759858801960945, -0.0027300212532281876, 0.012138545513153076, 0.02700711414217949, 0.0418756827712059, 0.05674424767494202, 0.07161282002925873, 0.08648138493299484, 0.10134994983673096, 0.11621852219104767, 0.13108709454536438, 0.1459556519985199, 0.1608242243528366, 0.17569279670715332, 0.19056135416030884, 0.20542992651462555, 0.22029849886894226, 0.23516705632209778, 0.2500356435775757, 0.2649042010307312, 0.2797727584838867, 0.29464131593704224, 0.30950990319252014, 0.32437846064567566, 0.3392470180988312, 0.3541156053543091, 0.3689841628074646, 0.3838527202606201, 0.398721307516098, 0.41358986496925354, 0.42845845222473145, 0.44332700967788696]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 8.0, 11.0, 9.0, 28.0, 43.0, 74.0, 77.0, 126.0, 192.0, 279.0, 396.0, 538.0, 814.0, 1222.0, 1755.0, 2700.0, 4101.0, 6248.0, 9708.0, 15649.0, 25860.0, 42874.0, 73726.0, 132146.0, 236596.0, 211744.0, 115428.0, 65353.0, 38337.0, 22877.0, 14037.0, 8887.0, 5596.0, 3633.0, 2417.0, 1542.0, 1065.0, 789.0, 505.0, 331.0, 250.0, 188.0, 114.0, 92.0, 65.0, 36.0, 30.0, 13.0, 12.0, 12.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.82666015625, -0.799896240234375, -0.77313232421875, -0.746368408203125, -0.7196044921875, -0.692840576171875, -0.66607666015625, -0.639312744140625, -0.612548828125, -0.585784912109375, -0.55902099609375, -0.532257080078125, -0.5054931640625, -0.478729248046875, -0.45196533203125, -0.425201416015625, -0.3984375, -0.371673583984375, -0.34490966796875, -0.318145751953125, -0.2913818359375, -0.264617919921875, -0.23785400390625, -0.211090087890625, -0.184326171875, -0.157562255859375, -0.13079833984375, -0.104034423828125, -0.0772705078125, -0.050506591796875, -0.02374267578125, 0.003021240234375, 0.02978515625, 0.056549072265625, 0.08331298828125, 0.110076904296875, 0.1368408203125, 0.163604736328125, 0.19036865234375, 0.217132568359375, 0.243896484375, 0.270660400390625, 0.29742431640625, 0.324188232421875, 0.3509521484375, 0.377716064453125, 0.40447998046875, 0.431243896484375, 0.4580078125, 0.484771728515625, 0.51153564453125, 0.538299560546875, 0.5650634765625, 0.591827392578125, 0.61859130859375, 0.645355224609375, 0.672119140625, 0.698883056640625, 0.72564697265625, 0.752410888671875, 0.7791748046875, 0.805938720703125, 0.83270263671875, 0.859466552734375, 0.88623046875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 10.0, 5.0, 6.0, 4.0, 5.0, 7.0, 8.0, 11.0, 10.0, 13.0, 23.0, 18.0, 29.0, 16.0, 30.0, 30.0, 17.0, 26.0, 46.0, 39.0, 31.0, 34.0, 40.0, 42.0, 34.0, 36.0, 32.0, 39.0, 35.0, 34.0, 30.0, 28.0, 27.0, 20.0, 26.0, 21.0, 29.0, 21.0, 9.0, 13.0, 14.0, 13.0, 9.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.46435546875, -0.45098114013671875, -0.4376068115234375, -0.42423248291015625, -0.410858154296875, -0.39748382568359375, -0.3841094970703125, -0.37073516845703125, -0.35736083984375, -0.34398651123046875, -0.3306121826171875, -0.31723785400390625, -0.303863525390625, -0.29048919677734375, -0.2771148681640625, -0.26374053955078125, -0.2503662109375, -0.23699188232421875, -0.2236175537109375, -0.21024322509765625, -0.196868896484375, -0.18349456787109375, -0.1701202392578125, -0.15674591064453125, -0.14337158203125, -0.12999725341796875, -0.1166229248046875, -0.10324859619140625, -0.089874267578125, -0.07649993896484375, -0.0631256103515625, -0.04975128173828125, -0.036376953125, -0.02300262451171875, -0.0096282958984375, 0.00374603271484375, 0.017120361328125, 0.03049468994140625, 0.0438690185546875, 0.05724334716796875, 0.07061767578125, 0.08399200439453125, 0.0973663330078125, 0.11074066162109375, 0.124114990234375, 0.13748931884765625, 0.1508636474609375, 0.16423797607421875, 0.1776123046875, 0.19098663330078125, 0.2043609619140625, 0.21773529052734375, 0.231109619140625, 0.24448394775390625, 0.2578582763671875, 0.27123260498046875, 0.28460693359375, 0.29798126220703125, 0.3113555908203125, 0.32472991943359375, 0.338104248046875, 0.35147857666015625, 0.3648529052734375, 0.37822723388671875, 0.3916015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 10.0, 13.0, 25.0, 33.0, 45.0, 78.0, 86.0, 108.0, 197.0, 283.0, 412.0, 617.0, 913.0, 1380.0, 2164.0, 3230.0, 5181.0, 8467.0, 13840.0, 23543.0, 41154.0, 74667.0, 145128.0, 279377.0, 210091.0, 103737.0, 55347.0, 30890.0, 18119.0, 10894.0, 6611.0, 4145.0, 2619.0, 1744.0, 1090.0, 716.0, 490.0, 338.0, 250.0, 165.0, 111.0, 85.0, 43.0, 34.0, 31.0, 20.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8564682006835938, -0.8276824951171875, -0.7988967895507812, -0.770111083984375, -0.7413253784179688, -0.7125396728515625, -0.6837539672851562, -0.65496826171875, -0.6261825561523438, -0.5973968505859375, -0.5686111450195312, -0.539825439453125, -0.5110397338867188, -0.4822540283203125, -0.45346832275390625, -0.4246826171875, -0.39589691162109375, -0.3671112060546875, -0.33832550048828125, -0.309539794921875, -0.28075408935546875, -0.2519683837890625, -0.22318267822265625, -0.19439697265625, -0.16561126708984375, -0.1368255615234375, -0.10803985595703125, -0.079254150390625, -0.05046844482421875, -0.0216827392578125, 0.00710296630859375, 0.035888671875, 0.06467437744140625, 0.0934600830078125, 0.12224578857421875, 0.151031494140625, 0.17981719970703125, 0.2086029052734375, 0.23738861083984375, 0.26617431640625, 0.29496002197265625, 0.3237457275390625, 0.35253143310546875, 0.381317138671875, 0.41010284423828125, 0.4388885498046875, 0.46767425537109375, 0.4964599609375, 0.5252456665039062, 0.5540313720703125, 0.5828170776367188, 0.611602783203125, 0.6403884887695312, 0.6691741943359375, 0.6979598999023438, 0.72674560546875, 0.7555313110351562, 0.7843170166015625, 0.8131027221679688, 0.841888427734375, 0.8706741333007812, 0.8994598388671875, 0.9282455444335938, 0.95703125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 3.0, 10.0, 12.0, 13.0, 15.0, 13.0, 12.0, 16.0, 20.0, 23.0, 25.0, 39.0, 31.0, 30.0, 34.0, 55.0, 42.0, 40.0, 42.0, 42.0, 37.0, 48.0, 39.0, 42.0, 42.0, 33.0, 37.0, 26.0, 21.0, 20.0, 23.0, 15.0, 14.0, 11.0, 10.0, 8.0, 13.0, 13.0, 7.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.335205078125, -0.3254280090332031, -0.31565093994140625, -0.3058738708496094, -0.2960968017578125, -0.2863197326660156, -0.27654266357421875, -0.2667655944824219, -0.256988525390625, -0.24721145629882812, -0.23743438720703125, -0.22765731811523438, -0.2178802490234375, -0.20810317993164062, -0.19832611083984375, -0.18854904174804688, -0.17877197265625, -0.16899490356445312, -0.15921783447265625, -0.14944076538085938, -0.1396636962890625, -0.12988662719726562, -0.12010955810546875, -0.11033248901367188, -0.100555419921875, -0.09077835083007812, -0.08100128173828125, -0.07122421264648438, -0.0614471435546875, -0.051670074462890625, -0.04189300537109375, -0.032115936279296875, -0.0223388671875, -0.012561798095703125, -0.00278472900390625, 0.006992340087890625, 0.0167694091796875, 0.026546478271484375, 0.03632354736328125, 0.046100616455078125, 0.055877685546875, 0.06565475463867188, 0.07543182373046875, 0.08520889282226562, 0.0949859619140625, 0.10476303100585938, 0.11454010009765625, 0.12431716918945312, 0.13409423828125, 0.14387130737304688, 0.15364837646484375, 0.16342544555664062, 0.1732025146484375, 0.18297958374023438, 0.19275665283203125, 0.20253372192382812, 0.212310791015625, 0.22208786010742188, 0.23186492919921875, 0.24164199829101562, 0.2514190673828125, 0.2611961364746094, 0.27097320556640625, 0.2807502746582031, 0.29052734375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 9.0, 15.0, 14.0, 32.0, 34.0, 57.0, 66.0, 95.0, 142.0, 221.0, 353.0, 504.0, 801.0, 1229.0, 2055.0, 3133.0, 4967.0, 8653.0, 14732.0, 28311.0, 64162.0, 605827.0, 203233.0, 52440.0, 24312.0, 13076.0, 7552.0, 4581.0, 2816.0, 1831.0, 1062.0, 735.0, 491.0, 313.0, 218.0, 116.0, 95.0, 68.0, 52.0, 25.0, 31.0, 23.0, 16.0, 10.0, 11.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.5947265625, -0.5766448974609375, -0.558563232421875, -0.5404815673828125, -0.52239990234375, -0.5043182373046875, -0.486236572265625, -0.4681549072265625, -0.4500732421875, -0.4319915771484375, -0.413909912109375, -0.3958282470703125, -0.37774658203125, -0.3596649169921875, -0.341583251953125, -0.3235015869140625, -0.305419921875, -0.2873382568359375, -0.269256591796875, -0.2511749267578125, -0.23309326171875, -0.2150115966796875, -0.196929931640625, -0.1788482666015625, -0.1607666015625, -0.1426849365234375, -0.124603271484375, -0.1065216064453125, -0.08843994140625, -0.0703582763671875, -0.052276611328125, -0.0341949462890625, -0.01611328125, 0.0019683837890625, 0.020050048828125, 0.0381317138671875, 0.05621337890625, 0.0742950439453125, 0.092376708984375, 0.1104583740234375, 0.1285400390625, 0.1466217041015625, 0.164703369140625, 0.1827850341796875, 0.20086669921875, 0.2189483642578125, 0.237030029296875, 0.2551116943359375, 0.273193359375, 0.2912750244140625, 0.309356689453125, 0.3274383544921875, 0.34552001953125, 0.3636016845703125, 0.381683349609375, 0.3997650146484375, 0.4178466796875, 0.4359283447265625, 0.454010009765625, 0.4720916748046875, 0.49017333984375, 0.5082550048828125, 0.526336669921875, 0.5444183349609375, 0.5625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 8.0, 11.0, 7.0, 11.0, 18.0, 18.0, 36.0, 46.0, 77.0, 165.0, 279.0, 109.0, 62.0, 34.0, 18.0, 18.0, 17.0, 12.0, 8.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.996755599975586e-05, -1.9385479390621185e-05, -1.880340278148651e-05, -1.8221326172351837e-05, -1.7639249563217163e-05, -1.705717295408249e-05, -1.6475096344947815e-05, -1.589301973581314e-05, -1.5310943126678467e-05, -1.4728866517543793e-05, -1.4146789908409119e-05, -1.3564713299274445e-05, -1.298263669013977e-05, -1.2400560081005096e-05, -1.1818483471870422e-05, -1.1236406862735748e-05, -1.0654330253601074e-05, -1.00722536444664e-05, -9.490177035331726e-06, -8.908100426197052e-06, -8.326023817062378e-06, -7.743947207927704e-06, -7.16187059879303e-06, -6.579793989658356e-06, -5.997717380523682e-06, -5.4156407713890076e-06, -4.8335641622543335e-06, -4.2514875531196594e-06, -3.6694109439849854e-06, -3.0873343348503113e-06, -2.505257725715637e-06, -1.923181116580963e-06, -1.341104507446289e-06, -7.59027898311615e-07, -1.7695128917694092e-07, 4.0512531995773315e-07, 9.872019290924072e-07, 1.5692785382270813e-06, 2.1513551473617554e-06, 2.7334317564964294e-06, 3.3155083656311035e-06, 3.897584974765778e-06, 4.479661583900452e-06, 5.061738193035126e-06, 5.6438148021698e-06, 6.225891411304474e-06, 6.807968020439148e-06, 7.390044629573822e-06, 7.972121238708496e-06, 8.55419784784317e-06, 9.136274456977844e-06, 9.718351066112518e-06, 1.0300427675247192e-05, 1.0882504284381866e-05, 1.146458089351654e-05, 1.2046657502651215e-05, 1.2628734111785889e-05, 1.3210810720920563e-05, 1.3792887330055237e-05, 1.4374963939189911e-05, 1.4957040548324585e-05, 1.553911715745926e-05, 1.6121193766593933e-05, 1.6703270375728607e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 9.0, 14.0, 16.0, 28.0, 30.0, 49.0, 98.0, 104.0, 198.0, 253.0, 427.0, 618.0, 942.0, 1454.0, 2197.0, 3476.0, 5825.0, 10047.0, 20742.0, 49331.0, 255262.0, 592530.0, 55121.0, 22294.0, 11020.0, 6044.0, 3609.0, 2362.0, 1515.0, 1007.0, 665.0, 419.0, 292.0, 186.0, 128.0, 66.0, 64.0, 33.0, 30.0, 13.0, 11.0, 11.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.78173828125, -0.758087158203125, -0.73443603515625, -0.710784912109375, -0.6871337890625, -0.663482666015625, -0.63983154296875, -0.616180419921875, -0.592529296875, -0.568878173828125, -0.54522705078125, -0.521575927734375, -0.4979248046875, -0.474273681640625, -0.45062255859375, -0.426971435546875, -0.4033203125, -0.379669189453125, -0.35601806640625, -0.332366943359375, -0.3087158203125, -0.285064697265625, -0.26141357421875, -0.237762451171875, -0.214111328125, -0.190460205078125, -0.16680908203125, -0.143157958984375, -0.1195068359375, -0.095855712890625, -0.07220458984375, -0.048553466796875, -0.02490234375, -0.001251220703125, 0.02239990234375, 0.046051025390625, 0.0697021484375, 0.093353271484375, 0.11700439453125, 0.140655517578125, 0.164306640625, 0.187957763671875, 0.21160888671875, 0.235260009765625, 0.2589111328125, 0.282562255859375, 0.30621337890625, 0.329864501953125, 0.353515625, 0.377166748046875, 0.40081787109375, 0.424468994140625, 0.4481201171875, 0.471771240234375, 0.49542236328125, 0.519073486328125, 0.542724609375, 0.566375732421875, 0.59002685546875, 0.613677978515625, 0.6373291015625, 0.660980224609375, 0.68463134765625, 0.708282470703125, 0.73193359375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 3.0, 10.0, 8.0, 7.0, 15.0, 19.0, 26.0, 25.0, 42.0, 44.0, 85.0, 366.0, 93.0, 41.0, 43.0, 31.0, 28.0, 10.0, 23.0, 13.0, 7.0, 9.0, 7.0, 3.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22577667236328125, -0.2196197509765625, -0.21346282958984375, -0.207305908203125, -0.20114898681640625, -0.1949920654296875, -0.18883514404296875, -0.18267822265625, -0.17652130126953125, -0.1703643798828125, -0.16420745849609375, -0.158050537109375, -0.15189361572265625, -0.1457366943359375, -0.13957977294921875, -0.1334228515625, -0.12726593017578125, -0.1211090087890625, -0.11495208740234375, -0.108795166015625, -0.10263824462890625, -0.0964813232421875, -0.09032440185546875, -0.08416748046875, -0.07801055908203125, -0.0718536376953125, -0.06569671630859375, -0.059539794921875, -0.05338287353515625, -0.0472259521484375, -0.04106903076171875, -0.034912109375, -0.02875518798828125, -0.0225982666015625, -0.01644134521484375, -0.010284423828125, -0.00412750244140625, 0.0020294189453125, 0.00818634033203125, 0.01434326171875, 0.02050018310546875, 0.0266571044921875, 0.03281402587890625, 0.038970947265625, 0.04512786865234375, 0.0512847900390625, 0.05744171142578125, 0.0635986328125, 0.06975555419921875, 0.0759124755859375, 0.08206939697265625, 0.088226318359375, 0.09438323974609375, 0.1005401611328125, 0.10669708251953125, 0.11285400390625, 0.11901092529296875, 0.1251678466796875, 0.13132476806640625, 0.137481689453125, 0.14363861083984375, 0.1497955322265625, 0.15595245361328125, 0.162109375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 7.0, 6.0, 8.0, 14.0, 9.0, 25.0, 24.0, 36.0, 39.0, 55.0, 62.0, 103.0, 95.0, 101.0, 74.0, 67.0, 51.0, 42.0, 34.0, 25.0, 22.0, 18.0, 20.0, 6.0, 6.0, 4.0, 10.0, 4.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6671497821807861, -0.6462233662605286, -0.625296950340271, -0.6043705344200134, -0.5834441184997559, -0.5625177621841431, -0.5415913462638855, -0.5206649303436279, -0.49973851442337036, -0.4788120985031128, -0.4578856825828552, -0.43695929646492004, -0.4160328805446625, -0.3951064646244049, -0.3741800785064697, -0.35325366258621216, -0.3323272466659546, -0.311400830745697, -0.29047441482543945, -0.2695480287075043, -0.2486216127872467, -0.22769519686698914, -0.20676879584789276, -0.1858423948287964, -0.16491597890853882, -0.14398956298828125, -0.12306316196918488, -0.1021367534995079, -0.08121034502983093, -0.06028393656015396, -0.03935752809047699, -0.018431127071380615, 0.002495288848876953, 0.023421697318553925, 0.044348105788230896, 0.06527451425790787, 0.08620092272758484, 0.10712733119726181, 0.12805373966693878, 0.14898014068603516, 0.16990655660629272, 0.1908329725265503, 0.21175937354564667, 0.23268577456474304, 0.2536121904850006, 0.2745386064052582, 0.29546499252319336, 0.3163914084434509, 0.3373178243637085, 0.35824424028396606, 0.37917065620422363, 0.4000970423221588, 0.4210234582424164, 0.44194987416267395, 0.46287626028060913, 0.4838026762008667, 0.5047290921211243, 0.5256555080413818, 0.5465819239616394, 0.567508339881897, 0.5884346961975098, 0.6093611121177673, 0.6302875280380249, 0.6512139439582825, 0.67214035987854]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 11.0, 6.0, 8.0, 5.0, 7.0, 12.0, 8.0, 12.0, 10.0, 13.0, 8.0, 21.0, 29.0, 26.0, 24.0, 28.0, 32.0, 35.0, 34.0, 22.0, 28.0, 36.0, 27.0, 31.0, 40.0, 32.0, 38.0, 45.0, 20.0, 35.0, 31.0, 24.0, 34.0, 30.0, 27.0, 28.0, 22.0, 30.0, 22.0, 9.0, 6.0, 7.0, 8.0, 3.0, 6.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.4383643865585327, -0.42473548650741577, -0.41110658645629883, -0.3974776864051819, -0.38384878635406494, -0.370219886302948, -0.35659098625183105, -0.3429620862007141, -0.32933318614959717, -0.3157042860984802, -0.3020753860473633, -0.28844648599624634, -0.2748175859451294, -0.26118868589401245, -0.2475597858428955, -0.23393088579177856, -0.22030198574066162, -0.20667308568954468, -0.19304418563842773, -0.1794152855873108, -0.16578638553619385, -0.1521574854850769, -0.13852858543395996, -0.12489968538284302, -0.11127078533172607, -0.09764188528060913, -0.08401298522949219, -0.07038408517837524, -0.0567551851272583, -0.04312628507614136, -0.029497385025024414, -0.01586848497390747, -0.0022395551204681396, 0.011389344930648804, 0.025018244981765747, 0.03864714503288269, 0.052276045083999634, 0.06590494513511658, 0.07953384518623352, 0.09316274523735046, 0.10679164528846741, 0.12042054533958435, 0.1340494453907013, 0.14767834544181824, 0.16130724549293518, 0.17493614554405212, 0.18856504559516907, 0.202193945646286, 0.21582284569740295, 0.2294517457485199, 0.24308064579963684, 0.2567095458507538, 0.2703384459018707, 0.28396734595298767, 0.2975962460041046, 0.31122514605522156, 0.3248540461063385, 0.33848294615745544, 0.3521118462085724, 0.36574074625968933, 0.3793696463108063, 0.3929985463619232, 0.40662744641304016, 0.4202563464641571, 0.43388524651527405]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 11.0, 18.0, 29.0, 29.0, 48.0, 73.0, 96.0, 131.0, 146.0, 250.0, 389.0, 536.0, 780.0, 1201.0, 1678.0, 2488.0, 3722.0, 5888.0, 9101.0, 14550.0, 24008.0, 40630.0, 72011.0, 135255.0, 294106.0, 909029.0, 1647415.0, 569537.0, 210251.0, 104799.0, 57923.0, 33013.0, 20225.0, 12103.0, 7871.0, 4938.0, 3313.0, 2122.0, 1453.0, 1031.0, 624.0, 471.0, 314.0, 228.0, 135.0, 97.0, 67.0, 55.0, 28.0, 22.0, 13.0, 12.0, 9.0, 4.0, 3.0, 2.0], "bins": [-0.67822265625, -0.6584625244140625, -0.638702392578125, -0.6189422607421875, -0.59918212890625, -0.5794219970703125, -0.559661865234375, -0.5399017333984375, -0.5201416015625, -0.5003814697265625, -0.480621337890625, -0.4608612060546875, -0.44110107421875, -0.4213409423828125, -0.401580810546875, -0.3818206787109375, -0.362060546875, -0.3423004150390625, -0.322540283203125, -0.3027801513671875, -0.28302001953125, -0.2632598876953125, -0.243499755859375, -0.2237396240234375, -0.2039794921875, -0.1842193603515625, -0.164459228515625, -0.1446990966796875, -0.12493896484375, -0.1051788330078125, -0.085418701171875, -0.0656585693359375, -0.0458984375, -0.0261383056640625, -0.006378173828125, 0.0133819580078125, 0.03314208984375, 0.0529022216796875, 0.072662353515625, 0.0924224853515625, 0.1121826171875, 0.1319427490234375, 0.151702880859375, 0.1714630126953125, 0.19122314453125, 0.2109832763671875, 0.230743408203125, 0.2505035400390625, 0.270263671875, 0.2900238037109375, 0.309783935546875, 0.3295440673828125, 0.34930419921875, 0.3690643310546875, 0.388824462890625, 0.4085845947265625, 0.4283447265625, 0.4481048583984375, 0.467864990234375, 0.4876251220703125, 0.50738525390625, 0.5271453857421875, 0.546905517578125, 0.5666656494140625, 0.58642578125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 8.0, 3.0, 3.0, 6.0, 5.0, 10.0, 8.0, 7.0, 13.0, 13.0, 10.0, 12.0, 13.0, 9.0, 18.0, 22.0, 27.0, 30.0, 20.0, 25.0, 38.0, 23.0, 33.0, 32.0, 21.0, 34.0, 47.0, 41.0, 36.0, 39.0, 35.0, 31.0, 24.0, 35.0, 25.0, 24.0, 27.0, 27.0, 27.0, 22.0, 23.0, 17.0, 14.0, 10.0, 9.0, 11.0, 8.0, 5.0, 6.0, 2.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.255859375, -0.24770736694335938, -0.23955535888671875, -0.23140335083007812, -0.2232513427734375, -0.21509933471679688, -0.20694732666015625, -0.19879531860351562, -0.190643310546875, -0.18249130249023438, -0.17433929443359375, -0.16618728637695312, -0.1580352783203125, -0.14988327026367188, -0.14173126220703125, -0.13357925415039062, -0.12542724609375, -0.11727523803710938, -0.10912322998046875, -0.10097122192382812, -0.0928192138671875, -0.08466720581054688, -0.07651519775390625, -0.06836318969726562, -0.060211181640625, -0.052059173583984375, -0.04390716552734375, -0.035755157470703125, -0.0276031494140625, -0.019451141357421875, -0.01129913330078125, -0.003147125244140625, 0.0050048828125, 0.013156890869140625, 0.02130889892578125, 0.029460906982421875, 0.0376129150390625, 0.045764923095703125, 0.05391693115234375, 0.062068939208984375, 0.070220947265625, 0.07837295532226562, 0.08652496337890625, 0.09467697143554688, 0.1028289794921875, 0.11098098754882812, 0.11913299560546875, 0.12728500366210938, 0.13543701171875, 0.14358901977539062, 0.15174102783203125, 0.15989303588867188, 0.1680450439453125, 0.17619705200195312, 0.18434906005859375, 0.19250106811523438, 0.200653076171875, 0.20880508422851562, 0.21695709228515625, 0.22510910034179688, 0.2332611083984375, 0.24141311645507812, 0.24956512451171875, 0.2577171325683594, 0.265869140625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 12.0, 32.0, 30.0, 53.0, 82.0, 133.0, 229.0, 319.0, 477.0, 790.0, 1206.0, 1920.0, 3177.0, 5110.0, 8531.0, 14446.0, 24476.0, 43595.0, 80998.0, 162526.0, 360165.0, 1021028.0, 1501234.0, 515460.0, 214380.0, 104194.0, 54910.0, 30402.0, 17498.0, 10446.0, 6166.0, 3944.0, 2384.0, 1390.0, 883.0, 598.0, 379.0, 223.0, 157.0, 104.0, 61.0, 51.0, 28.0, 18.0, 13.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5881729125976562, -0.5699005126953125, -0.5516281127929688, -0.533355712890625, -0.5150833129882812, -0.4968109130859375, -0.47853851318359375, -0.46026611328125, -0.44199371337890625, -0.4237213134765625, -0.40544891357421875, -0.387176513671875, -0.36890411376953125, -0.3506317138671875, -0.33235931396484375, -0.3140869140625, -0.29581451416015625, -0.2775421142578125, -0.25926971435546875, -0.240997314453125, -0.22272491455078125, -0.2044525146484375, -0.18618011474609375, -0.16790771484375, -0.14963531494140625, -0.1313629150390625, -0.11309051513671875, -0.094818115234375, -0.07654571533203125, -0.0582733154296875, -0.04000091552734375, -0.021728515625, -0.00345611572265625, 0.0148162841796875, 0.03308868408203125, 0.051361083984375, 0.06963348388671875, 0.0879058837890625, 0.10617828369140625, 0.12445068359375, 0.14272308349609375, 0.1609954833984375, 0.17926788330078125, 0.197540283203125, 0.21581268310546875, 0.2340850830078125, 0.25235748291015625, 0.2706298828125, 0.28890228271484375, 0.3071746826171875, 0.32544708251953125, 0.343719482421875, 0.36199188232421875, 0.3802642822265625, 0.39853668212890625, 0.41680908203125, 0.43508148193359375, 0.4533538818359375, 0.47162628173828125, 0.489898681640625, 0.5081710815429688, 0.5264434814453125, 0.5447158813476562, 0.56298828125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 9.0, 10.0, 21.0, 18.0, 16.0, 40.0, 33.0, 45.0, 50.0, 61.0, 101.0, 89.0, 102.0, 126.0, 163.0, 197.0, 204.0, 216.0, 262.0, 281.0, 280.0, 267.0, 241.0, 202.0, 164.0, 136.0, 136.0, 97.0, 89.0, 80.0, 66.0, 42.0, 46.0, 31.0, 27.0, 22.0, 15.0, 23.0, 10.0, 7.0, 7.0, 15.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.15771484375, -0.1527729034423828, -0.14783096313476562, -0.14288902282714844, -0.13794708251953125, -0.13300514221191406, -0.12806320190429688, -0.12312126159667969, -0.1181793212890625, -0.11323738098144531, -0.10829544067382812, -0.10335350036621094, -0.09841156005859375, -0.09346961975097656, -0.08852767944335938, -0.08358573913574219, -0.078643798828125, -0.07370185852050781, -0.06875991821289062, -0.06381797790527344, -0.05887603759765625, -0.05393409729003906, -0.048992156982421875, -0.04405021667480469, -0.0391082763671875, -0.03416633605957031, -0.029224395751953125, -0.024282455444335938, -0.01934051513671875, -0.014398574829101562, -0.009456634521484375, -0.0045146942138671875, 0.00042724609375, 0.0053691864013671875, 0.010311126708984375, 0.015253067016601562, 0.02019500732421875, 0.025136947631835938, 0.030078887939453125, 0.03502082824707031, 0.0399627685546875, 0.04490470886230469, 0.049846649169921875, 0.05478858947753906, 0.05973052978515625, 0.06467247009277344, 0.06961441040039062, 0.07455635070800781, 0.079498291015625, 0.08444023132324219, 0.08938217163085938, 0.09432411193847656, 0.09926605224609375, 0.10420799255371094, 0.10914993286132812, 0.11409187316894531, 0.1190338134765625, 0.12397575378417969, 0.12891769409179688, 0.13385963439941406, 0.13880157470703125, 0.14374351501464844, 0.14868545532226562, 0.1536273956298828, 0.1585693359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 10.0, 7.0, 5.0, 9.0, 12.0, 14.0, 21.0, 18.0, 35.0, 43.0, 47.0, 56.0, 72.0, 86.0, 111.0, 80.0, 88.0, 43.0, 42.0, 41.0, 24.0, 25.0, 17.0, 20.0, 6.0, 18.0, 6.0, 5.0, 8.0, 6.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4045407772064209, -0.3903734087944031, -0.37620604038238525, -0.36203867197036743, -0.3478713035583496, -0.3337039351463318, -0.31953656673431396, -0.30536919832229614, -0.2912018299102783, -0.2770344614982605, -0.2628670930862427, -0.24869972467422485, -0.23453235626220703, -0.2203649878501892, -0.2061976194381714, -0.19203025102615356, -0.17786286771297455, -0.16369549930095673, -0.1495281308889389, -0.13536076247692108, -0.12119339406490326, -0.10702601820230484, -0.09285864979028702, -0.0786912813782692, -0.06452391296625137, -0.05035654455423355, -0.03618917614221573, -0.022021804004907608, -0.007854435592889786, 0.006312936544418335, 0.020480304956436157, 0.03464767336845398, 0.0488150417804718, 0.06298241019248962, 0.07714977860450745, 0.09131714701652527, 0.10548451542854309, 0.11965189129114151, 0.13381925225257874, 0.14798662066459656, 0.16215398907661438, 0.1763213574886322, 0.19048872590065002, 0.20465609431266785, 0.21882346272468567, 0.2329908311367035, 0.2471581995487213, 0.26132556796073914, 0.27549296617507935, 0.28966033458709717, 0.303827702999115, 0.3179950714111328, 0.33216243982315063, 0.34632980823516846, 0.3604971766471863, 0.3746645450592041, 0.3888319134712219, 0.40299928188323975, 0.41716665029525757, 0.4313340187072754, 0.4455013871192932, 0.45966875553131104, 0.47383612394332886, 0.4880034923553467, 0.5021708607673645]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 8.0, 10.0, 9.0, 11.0, 15.0, 21.0, 17.0, 20.0, 22.0, 26.0, 30.0, 28.0, 25.0, 27.0, 32.0, 34.0, 36.0, 45.0, 39.0, 30.0, 29.0, 36.0, 33.0, 39.0, 38.0, 30.0, 37.0, 39.0, 42.0, 21.0, 31.0, 25.0, 22.0, 12.0, 11.0, 11.0, 14.0, 12.0, 6.0, 5.0, 2.0, 3.0, 6.0, 2.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34295332431793213, -0.332820862531662, -0.32268840074539185, -0.3125559687614441, -0.30242350697517395, -0.2922910451889038, -0.28215858340263367, -0.2720261216163635, -0.2618936598300934, -0.25176119804382324, -0.2416287511587143, -0.23149628937244415, -0.221363827586174, -0.21123138070106506, -0.20109891891479492, -0.19096645712852478, -0.18083401024341583, -0.1707015484571457, -0.16056910157203674, -0.1504366397857666, -0.14030417799949646, -0.13017171621322632, -0.12003926932811737, -0.10990680754184723, -0.09977435320615768, -0.08964189887046814, -0.079509437084198, -0.06937698274850845, -0.05924452468752861, -0.04911206662654877, -0.03897961229085922, -0.02884715050458908, -0.018714696168899536, -0.008582239039242268, 0.001550218090415001, 0.011682674288749695, 0.021815132349729538, 0.03194759041070938, 0.042080044746398926, 0.05221250653266907, 0.06234496086835861, 0.07247741520404816, 0.0826098769903183, 0.09274233132600784, 0.10287478566169739, 0.11300724744796753, 0.12313970178365707, 0.1332721710205078, 0.14340461790561676, 0.1535370796918869, 0.16366952657699585, 0.173801988363266, 0.18393445014953613, 0.19406691193580627, 0.20419935882091522, 0.21433182060718536, 0.2244642674922943, 0.23459672927856445, 0.2447291761636734, 0.25486165285110474, 0.2649940848350525, 0.27512654662132263, 0.2852590084075928, 0.2953914701938629, 0.30552393198013306]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 13.0, 11.0, 12.0, 16.0, 34.0, 43.0, 61.0, 87.0, 119.0, 197.0, 270.0, 388.0, 530.0, 863.0, 1254.0, 1950.0, 3077.0, 4732.0, 7404.0, 11642.0, 18952.0, 31720.0, 56523.0, 112819.0, 280803.0, 269237.0, 109335.0, 54857.0, 31084.0, 18592.0, 11310.0, 7208.0, 4645.0, 2994.0, 1888.0, 1302.0, 805.0, 571.0, 370.0, 259.0, 188.0, 121.0, 94.0, 58.0, 41.0, 28.0, 23.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.2841796875, -0.2755622863769531, -0.26694488525390625, -0.2583274841308594, -0.2497100830078125, -0.24109268188476562, -0.23247528076171875, -0.22385787963867188, -0.215240478515625, -0.20662307739257812, -0.19800567626953125, -0.18938827514648438, -0.1807708740234375, -0.17215347290039062, -0.16353607177734375, -0.15491867065429688, -0.14630126953125, -0.13768386840820312, -0.12906646728515625, -0.12044906616210938, -0.1118316650390625, -0.10321426391601562, -0.09459686279296875, -0.08597946166992188, -0.077362060546875, -0.06874465942382812, -0.06012725830078125, -0.051509857177734375, -0.0428924560546875, -0.034275054931640625, -0.02565765380859375, -0.017040252685546875, -0.0084228515625, 0.000194549560546875, 0.00881195068359375, 0.017429351806640625, 0.0260467529296875, 0.034664154052734375, 0.04328155517578125, 0.051898956298828125, 0.060516357421875, 0.06913375854492188, 0.07775115966796875, 0.08636856079101562, 0.0949859619140625, 0.10360336303710938, 0.11222076416015625, 0.12083816528320312, 0.12945556640625, 0.13807296752929688, 0.14669036865234375, 0.15530776977539062, 0.1639251708984375, 0.17254257202148438, 0.18115997314453125, 0.18977737426757812, 0.198394775390625, 0.20701217651367188, 0.21562957763671875, 0.22424697875976562, 0.2328643798828125, 0.24148178100585938, 0.25009918212890625, 0.2587165832519531, 0.267333984375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 13.0, 15.0, 18.0, 9.0, 16.0, 28.0, 28.0, 28.0, 16.0, 26.0, 26.0, 29.0, 25.0, 32.0, 45.0, 30.0, 38.0, 29.0, 32.0, 41.0, 35.0, 34.0, 38.0, 29.0, 37.0, 35.0, 28.0, 26.0, 31.0, 31.0, 18.0, 17.0, 11.0, 3.0, 14.0, 13.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.3203125, -0.31081390380859375, -0.3013153076171875, -0.29181671142578125, -0.282318115234375, -0.27281951904296875, -0.2633209228515625, -0.25382232666015625, -0.24432373046875, -0.23482513427734375, -0.2253265380859375, -0.21582794189453125, -0.206329345703125, -0.19683074951171875, -0.1873321533203125, -0.17783355712890625, -0.1683349609375, -0.15883636474609375, -0.1493377685546875, -0.13983917236328125, -0.130340576171875, -0.12084197998046875, -0.1113433837890625, -0.10184478759765625, -0.09234619140625, -0.08284759521484375, -0.0733489990234375, -0.06385040283203125, -0.054351806640625, -0.04485321044921875, -0.0353546142578125, -0.02585601806640625, -0.016357421875, -0.00685882568359375, 0.0026397705078125, 0.01213836669921875, 0.021636962890625, 0.03113555908203125, 0.0406341552734375, 0.05013275146484375, 0.05963134765625, 0.06912994384765625, 0.0786285400390625, 0.08812713623046875, 0.097625732421875, 0.10712432861328125, 0.1166229248046875, 0.12612152099609375, 0.1356201171875, 0.14511871337890625, 0.1546173095703125, 0.16411590576171875, 0.173614501953125, 0.18311309814453125, 0.1926116943359375, 0.20211029052734375, 0.21160888671875, 0.22110748291015625, 0.2306060791015625, 0.24010467529296875, 0.249603271484375, 0.25910186767578125, 0.2686004638671875, 0.27809906005859375, 0.28759765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 5.0, 10.0, 9.0, 13.0, 10.0, 22.0, 26.0, 40.0, 51.0, 55.0, 93.0, 125.0, 184.0, 224.0, 330.0, 460.0, 657.0, 939.0, 1298.0, 1912.0, 2744.0, 4335.0, 6970.0, 12102.0, 24455.0, 65429.0, 561610.0, 268413.0, 47678.0, 20074.0, 10230.0, 6100.0, 3740.0, 2458.0, 1642.0, 1171.0, 809.0, 589.0, 425.0, 287.0, 229.0, 174.0, 125.0, 97.0, 63.0, 43.0, 40.0, 20.0, 12.0, 8.0, 13.0, 6.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.45458984375, -0.4398612976074219, -0.42513275146484375, -0.4104042053222656, -0.3956756591796875, -0.3809471130371094, -0.36621856689453125, -0.3514900207519531, -0.336761474609375, -0.3220329284667969, -0.30730438232421875, -0.2925758361816406, -0.2778472900390625, -0.2631187438964844, -0.24839019775390625, -0.23366165161132812, -0.21893310546875, -0.20420455932617188, -0.18947601318359375, -0.17474746704101562, -0.1600189208984375, -0.14529037475585938, -0.13056182861328125, -0.11583328247070312, -0.101104736328125, -0.08637619018554688, -0.07164764404296875, -0.056919097900390625, -0.0421905517578125, -0.027462005615234375, -0.01273345947265625, 0.001995086669921875, 0.0167236328125, 0.031452178955078125, 0.04618072509765625, 0.060909271240234375, 0.0756378173828125, 0.09036636352539062, 0.10509490966796875, 0.11982345581054688, 0.134552001953125, 0.14928054809570312, 0.16400909423828125, 0.17873764038085938, 0.1934661865234375, 0.20819473266601562, 0.22292327880859375, 0.23765182495117188, 0.25238037109375, 0.2671089172363281, 0.28183746337890625, 0.2965660095214844, 0.3112945556640625, 0.3260231018066406, 0.34075164794921875, 0.3554801940917969, 0.370208740234375, 0.3849372863769531, 0.39966583251953125, 0.4143943786621094, 0.4291229248046875, 0.4438514709472656, 0.45858001708984375, 0.4733085632324219, 0.488037109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 5.0, 7.0, 9.0, 18.0, 11.0, 10.0, 20.0, 23.0, 23.0, 19.0, 32.0, 20.0, 35.0, 35.0, 21.0, 33.0, 40.0, 42.0, 55.0, 38.0, 52.0, 31.0, 25.0, 29.0, 32.0, 35.0, 25.0, 32.0, 30.0, 11.0, 22.0, 32.0, 13.0, 16.0, 14.0, 14.0, 21.0, 13.0, 7.0, 9.0, 3.0, 7.0, 12.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.19677734375, -0.19060897827148438, -0.18444061279296875, -0.17827224731445312, -0.1721038818359375, -0.16593551635742188, -0.15976715087890625, -0.15359878540039062, -0.147430419921875, -0.14126205444335938, -0.13509368896484375, -0.12892532348632812, -0.1227569580078125, -0.11658859252929688, -0.11042022705078125, -0.10425186157226562, -0.09808349609375, -0.09191513061523438, -0.08574676513671875, -0.07957839965820312, -0.0734100341796875, -0.06724166870117188, -0.06107330322265625, -0.054904937744140625, -0.048736572265625, -0.042568206787109375, -0.03639984130859375, -0.030231475830078125, -0.0240631103515625, -0.017894744873046875, -0.01172637939453125, -0.005558013916015625, 0.0006103515625, 0.006778717041015625, 0.01294708251953125, 0.019115447998046875, 0.0252838134765625, 0.031452178955078125, 0.03762054443359375, 0.043788909912109375, 0.049957275390625, 0.056125640869140625, 0.06229400634765625, 0.06846237182617188, 0.0746307373046875, 0.08079910278320312, 0.08696746826171875, 0.09313583374023438, 0.09930419921875, 0.10547256469726562, 0.11164093017578125, 0.11780929565429688, 0.1239776611328125, 0.13014602661132812, 0.13631439208984375, 0.14248275756835938, 0.148651123046875, 0.15481948852539062, 0.16098785400390625, 0.16715621948242188, 0.1733245849609375, 0.17949295043945312, 0.18566131591796875, 0.19182968139648438, 0.197998046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 12.0, 12.0, 8.0, 15.0, 20.0, 25.0, 36.0, 45.0, 54.0, 53.0, 78.0, 123.0, 130.0, 192.0, 247.0, 323.0, 475.0, 712.0, 1136.0, 1808.0, 3080.0, 5899.0, 14006.0, 50561.0, 779155.0, 147121.0, 23801.0, 8568.0, 4257.0, 2326.0, 1294.0, 848.0, 553.0, 356.0, 287.0, 215.0, 147.0, 120.0, 106.0, 78.0, 61.0, 44.0, 43.0, 25.0, 23.0, 23.0, 20.0, 6.0, 8.0, 4.0, 2.0, 10.0, 2.0, 0.0, 3.0, 3.0], "bins": [-0.11767578125, -0.11408138275146484, -0.11048698425292969, -0.10689258575439453, -0.10329818725585938, -0.09970378875732422, -0.09610939025878906, -0.0925149917602539, -0.08892059326171875, -0.0853261947631836, -0.08173179626464844, -0.07813739776611328, -0.07454299926757812, -0.07094860076904297, -0.06735420227050781, -0.06375980377197266, -0.0601654052734375, -0.056571006774902344, -0.05297660827636719, -0.04938220977783203, -0.045787811279296875, -0.04219341278076172, -0.03859901428222656, -0.035004615783691406, -0.03141021728515625, -0.027815818786621094, -0.024221420288085938, -0.02062702178955078, -0.017032623291015625, -0.013438224792480469, -0.009843826293945312, -0.006249427795410156, -0.002655029296875, 0.0009393692016601562, 0.0045337677001953125, 0.008128166198730469, 0.011722564697265625, 0.015316963195800781, 0.018911361694335938, 0.022505760192871094, 0.02610015869140625, 0.029694557189941406, 0.03328895568847656, 0.03688335418701172, 0.040477752685546875, 0.04407215118408203, 0.04766654968261719, 0.051260948181152344, 0.0548553466796875, 0.058449745178222656, 0.06204414367675781, 0.06563854217529297, 0.06923294067382812, 0.07282733917236328, 0.07642173767089844, 0.0800161361694336, 0.08361053466796875, 0.0872049331665039, 0.09079933166503906, 0.09439373016357422, 0.09798812866210938, 0.10158252716064453, 0.10517692565917969, 0.10877132415771484, 0.11236572265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 3.0, 10.0, 15.0, 16.0, 30.0, 28.0, 20.0, 57.0, 71.0, 33.0, 85.0, 74.0, 33.0, 101.0, 77.0, 29.0, 75.0, 37.0, 21.0, 19.0, 29.0, 15.0, 13.0, 23.0, 7.0, 11.0, 11.0, 2.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.337860107421875e-06, -3.238208591938019e-06, -3.1385570764541626e-06, -3.0389055609703064e-06, -2.93925404548645e-06, -2.839602530002594e-06, -2.739951014518738e-06, -2.6402994990348816e-06, -2.5406479835510254e-06, -2.440996468067169e-06, -2.341344952583313e-06, -2.2416934370994568e-06, -2.1420419216156006e-06, -2.0423904061317444e-06, -1.942738890647888e-06, -1.843087375164032e-06, -1.7434358596801758e-06, -1.6437843441963196e-06, -1.5441328287124634e-06, -1.4444813132286072e-06, -1.344829797744751e-06, -1.2451782822608948e-06, -1.1455267667770386e-06, -1.0458752512931824e-06, -9.462237358093262e-07, -8.4657222032547e-07, -7.469207048416138e-07, -6.472691893577576e-07, -5.476176738739014e-07, -4.4796615839004517e-07, -3.4831464290618896e-07, -2.4866312742233276e-07, -1.4901161193847656e-07, -4.936009645462036e-08, 5.029141902923584e-08, 1.4994293451309204e-07, 2.4959444999694824e-07, 3.4924596548080444e-07, 4.4889748096466064e-07, 5.485489964485168e-07, 6.48200511932373e-07, 7.478520274162292e-07, 8.475035429000854e-07, 9.471550583839417e-07, 1.0468065738677979e-06, 1.146458089351654e-06, 1.2461096048355103e-06, 1.3457611203193665e-06, 1.4454126358032227e-06, 1.5450641512870789e-06, 1.644715666770935e-06, 1.7443671822547913e-06, 1.8440186977386475e-06, 1.9436702132225037e-06, 2.04332172870636e-06, 2.142973244190216e-06, 2.2426247596740723e-06, 2.3422762751579285e-06, 2.4419277906417847e-06, 2.541579306125641e-06, 2.641230821609497e-06, 2.7408823370933533e-06, 2.8405338525772095e-06, 2.9401853680610657e-06, 3.039836883544922e-06]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 10.0, 6.0, 18.0, 13.0, 28.0, 32.0, 56.0, 69.0, 113.0, 155.0, 212.0, 284.0, 414.0, 585.0, 857.0, 1192.0, 1939.0, 3117.0, 4910.0, 8706.0, 16125.0, 34633.0, 96432.0, 515809.0, 243459.0, 62671.0, 25379.0, 12542.0, 6909.0, 4104.0, 2546.0, 1691.0, 1070.0, 744.0, 537.0, 317.0, 237.0, 189.0, 146.0, 93.0, 62.0, 48.0, 36.0, 26.0, 11.0, 5.0, 12.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0841064453125, -0.08154296875, -0.0789794921875, -0.076416015625, -0.0738525390625, -0.0712890625, -0.0687255859375, -0.066162109375, -0.0635986328125, -0.06103515625, -0.0584716796875, -0.055908203125, -0.0533447265625, -0.05078125, -0.0482177734375, -0.045654296875, -0.0430908203125, -0.04052734375, -0.0379638671875, -0.035400390625, -0.0328369140625, -0.0302734375, -0.0277099609375, -0.025146484375, -0.0225830078125, -0.02001953125, -0.0174560546875, -0.014892578125, -0.0123291015625, -0.009765625, -0.0072021484375, -0.004638671875, -0.0020751953125, 0.00048828125, 0.0030517578125, 0.005615234375, 0.0081787109375, 0.0107421875, 0.0133056640625, 0.015869140625, 0.0184326171875, 0.02099609375, 0.0235595703125, 0.026123046875, 0.0286865234375, 0.03125, 0.0338134765625, 0.036376953125, 0.0389404296875, 0.04150390625, 0.0440673828125, 0.046630859375, 0.0491943359375, 0.0517578125, 0.0543212890625, 0.056884765625, 0.0594482421875, 0.06201171875, 0.0645751953125, 0.067138671875, 0.0697021484375, 0.072265625, 0.0748291015625, 0.077392578125, 0.0799560546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 7.0, 8.0, 14.0, 11.0, 14.0, 17.0, 14.0, 18.0, 25.0, 33.0, 40.0, 63.0, 84.0, 125.0, 141.0, 78.0, 56.0, 60.0, 41.0, 26.0, 19.0, 15.0, 21.0, 15.0, 5.0, 11.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.015106201171875, -0.014635562896728516, -0.014164924621582031, -0.013694286346435547, -0.013223648071289062, -0.012753009796142578, -0.012282371520996094, -0.01181173324584961, -0.011341094970703125, -0.01087045669555664, -0.010399818420410156, -0.009929180145263672, -0.009458541870117188, -0.008987903594970703, -0.008517265319824219, -0.008046627044677734, -0.00757598876953125, -0.007105350494384766, -0.006634712219238281, -0.006164073944091797, -0.0056934356689453125, -0.005222797393798828, -0.004752159118652344, -0.004281520843505859, -0.003810882568359375, -0.0033402442932128906, -0.0028696060180664062, -0.002398967742919922, -0.0019283294677734375, -0.0014576911926269531, -0.0009870529174804688, -0.0005164146423339844, -4.57763671875e-05, 0.0004248619079589844, 0.0008955001831054688, 0.0013661384582519531, 0.0018367767333984375, 0.002307415008544922, 0.0027780532836914062, 0.0032486915588378906, 0.003719329833984375, 0.004189968109130859, 0.004660606384277344, 0.005131244659423828, 0.0056018829345703125, 0.006072521209716797, 0.006543159484863281, 0.007013797760009766, 0.00748443603515625, 0.007955074310302734, 0.008425712585449219, 0.008896350860595703, 0.009366989135742188, 0.009837627410888672, 0.010308265686035156, 0.01077890396118164, 0.011249542236328125, 0.01172018051147461, 0.012190818786621094, 0.012661457061767578, 0.013132095336914062, 0.013602733612060547, 0.014073371887207031, 0.014544010162353516, 0.0150146484375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 11.0, 9.0, 9.0, 6.0, 11.0, 19.0, 16.0, 27.0, 33.0, 47.0, 58.0, 49.0, 74.0, 98.0, 96.0, 90.0, 72.0, 47.0, 34.0, 34.0, 37.0, 19.0, 11.0, 16.0, 13.0, 12.0, 6.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38890865445137024, -0.37509986758232117, -0.3612910509109497, -0.34748226404190063, -0.3336734473705292, -0.3198646605014801, -0.30605584383010864, -0.29224705696105957, -0.2784382402896881, -0.26462945342063904, -0.2508206367492676, -0.2370118349790573, -0.22320303320884705, -0.20939424633979797, -0.1955854296684265, -0.18177664279937744, -0.16796784102916718, -0.1541590392589569, -0.14035023748874664, -0.12654143571853638, -0.11273263394832611, -0.09892383962869644, -0.08511503785848618, -0.07130623608827591, -0.05749743431806564, -0.04368863254785538, -0.02987983264029026, -0.016071032732725143, -0.0022622309625148773, 0.01154656708240509, 0.025355368852615356, 0.03916417062282562, 0.05297297239303589, 0.06678177416324615, 0.08059057593345642, 0.09439937770366669, 0.10820817947387695, 0.12201697379350662, 0.13582578301429749, 0.14963456988334656, 0.16344338655471802, 0.17725218832492828, 0.19106099009513855, 0.20486979186534882, 0.21867859363555908, 0.23248738050460815, 0.24629619717597961, 0.2601049840450287, 0.27391380071640015, 0.2877225875854492, 0.3015314042568207, 0.31534019112586975, 0.3291490077972412, 0.3429577946662903, 0.35676661133766174, 0.3705753982067108, 0.3843841850757599, 0.39819297194480896, 0.4120017886161804, 0.4258105754852295, 0.43961939215660095, 0.45342817902565, 0.4672369956970215, 0.48104578256607056, 0.494854599237442]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 3.0, 5.0, 9.0, 6.0, 12.0, 11.0, 15.0, 21.0, 16.0, 20.0, 22.0, 24.0, 27.0, 28.0, 28.0, 29.0, 21.0, 42.0, 33.0, 47.0, 34.0, 35.0, 31.0, 34.0, 30.0, 37.0, 43.0, 28.0, 40.0, 34.0, 39.0, 27.0, 34.0, 19.0, 24.0, 14.0, 13.0, 8.0, 15.0, 12.0, 10.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3349111080169678, -0.3250650465488434, -0.315218985080719, -0.3053729236125946, -0.2955268621444702, -0.2856808006763458, -0.27583473920822144, -0.26598864793777466, -0.25614261627197266, -0.24629655480384827, -0.23645049333572388, -0.2266044318675995, -0.2167583703994751, -0.2069123089313507, -0.19706623256206512, -0.18722017109394073, -0.17737409472465515, -0.16752803325653076, -0.15768197178840637, -0.14783591032028198, -0.1379898488521576, -0.1281437873840332, -0.11829771101474762, -0.10845164954662323, -0.09860558807849884, -0.08875952661037445, -0.07891346514225006, -0.06906739622354507, -0.059221334755420685, -0.049375273287296295, -0.03952920809388161, -0.02968314290046692, -0.01983705163002014, -0.009990988299250603, -0.00014492496848106384, 0.009701138362288475, 0.019547201693058014, 0.029393263161182404, 0.03923932835459709, 0.04908539354801178, 0.05893145501613617, 0.06877751648426056, 0.07862357795238495, 0.08846964687108994, 0.09831570833921432, 0.10816176980733871, 0.1180078387260437, 0.1278539001941681, 0.13769996166229248, 0.14754602313041687, 0.15739208459854126, 0.16723814606666565, 0.17708420753479004, 0.18693026900291443, 0.1967763453722, 0.2066224068403244, 0.2164684683084488, 0.22631452977657318, 0.23616059124469757, 0.24600665271282196, 0.25585272908210754, 0.26569879055023193, 0.2755448520183563, 0.2853909134864807, 0.2952369749546051]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 12.0, 12.0, 20.0, 29.0, 46.0, 81.0, 98.0, 151.0, 295.0, 437.0, 708.0, 1147.0, 1895.0, 3095.0, 5290.0, 8812.0, 15128.0, 26636.0, 49716.0, 97333.0, 204638.0, 296789.0, 162885.0, 78781.0, 40686.0, 22257.0, 12653.0, 7453.0, 4535.0, 2666.0, 1642.0, 998.0, 595.0, 378.0, 238.0, 163.0, 96.0, 48.0, 44.0, 23.0, 15.0, 20.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59814453125, -0.5762710571289062, -0.5543975830078125, -0.5325241088867188, -0.510650634765625, -0.48877716064453125, -0.4669036865234375, -0.44503021240234375, -0.42315673828125, -0.40128326416015625, -0.3794097900390625, -0.35753631591796875, -0.335662841796875, -0.31378936767578125, -0.2919158935546875, -0.27004241943359375, -0.2481689453125, -0.22629547119140625, -0.2044219970703125, -0.18254852294921875, -0.160675048828125, -0.13880157470703125, -0.1169281005859375, -0.09505462646484375, -0.07318115234375, -0.05130767822265625, -0.0294342041015625, -0.00756072998046875, 0.014312744140625, 0.03618621826171875, 0.0580596923828125, 0.07993316650390625, 0.101806640625, 0.12368011474609375, 0.1455535888671875, 0.16742706298828125, 0.189300537109375, 0.21117401123046875, 0.2330474853515625, 0.25492095947265625, 0.27679443359375, 0.29866790771484375, 0.3205413818359375, 0.34241485595703125, 0.364288330078125, 0.38616180419921875, 0.4080352783203125, 0.42990875244140625, 0.4517822265625, 0.47365570068359375, 0.4955291748046875, 0.5174026489257812, 0.539276123046875, 0.5611495971679688, 0.5830230712890625, 0.6048965454101562, 0.62677001953125, 0.6486434936523438, 0.6705169677734375, 0.6923904418945312, 0.714263916015625, 0.7361373901367188, 0.7580108642578125, 0.7798843383789062, 0.8017578125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 4.0, 9.0, 10.0, 11.0, 12.0, 8.0, 18.0, 21.0, 20.0, 12.0, 31.0, 32.0, 22.0, 29.0, 30.0, 40.0, 34.0, 37.0, 47.0, 37.0, 39.0, 30.0, 43.0, 34.0, 39.0, 32.0, 43.0, 41.0, 37.0, 23.0, 21.0, 20.0, 27.0, 21.0, 12.0, 18.0, 10.0, 12.0, 8.0, 8.0, 3.0, 8.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.317138671875, -0.3077545166015625, -0.298370361328125, -0.2889862060546875, -0.27960205078125, -0.2702178955078125, -0.260833740234375, -0.2514495849609375, -0.2420654296875, -0.2326812744140625, -0.223297119140625, -0.2139129638671875, -0.20452880859375, -0.1951446533203125, -0.185760498046875, -0.1763763427734375, -0.1669921875, -0.1576080322265625, -0.148223876953125, -0.1388397216796875, -0.12945556640625, -0.1200714111328125, -0.110687255859375, -0.1013031005859375, -0.0919189453125, -0.0825347900390625, -0.073150634765625, -0.0637664794921875, -0.05438232421875, -0.0449981689453125, -0.035614013671875, -0.0262298583984375, -0.016845703125, -0.0074615478515625, 0.001922607421875, 0.0113067626953125, 0.02069091796875, 0.0300750732421875, 0.039459228515625, 0.0488433837890625, 0.0582275390625, 0.0676116943359375, 0.076995849609375, 0.0863800048828125, 0.09576416015625, 0.1051483154296875, 0.114532470703125, 0.1239166259765625, 0.13330078125, 0.1426849365234375, 0.152069091796875, 0.1614532470703125, 0.17083740234375, 0.1802215576171875, 0.189605712890625, 0.1989898681640625, 0.2083740234375, 0.2177581787109375, 0.227142333984375, 0.2365264892578125, 0.24591064453125, 0.2552947998046875, 0.264678955078125, 0.2740631103515625, 0.283447265625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 11.0, 21.0, 22.0, 35.0, 54.0, 67.0, 96.0, 150.0, 241.0, 336.0, 567.0, 846.0, 1358.0, 2155.0, 3537.0, 6375.0, 10802.0, 19876.0, 38313.0, 77756.0, 166300.0, 331421.0, 200099.0, 90729.0, 44316.0, 22977.0, 12392.0, 6918.0, 4123.0, 2492.0, 1440.0, 969.0, 610.0, 370.0, 254.0, 208.0, 86.0, 68.0, 52.0, 40.0, 21.0, 15.0, 13.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7473526000976562, -0.7237091064453125, -0.7000656127929688, -0.676422119140625, -0.6527786254882812, -0.6291351318359375, -0.6054916381835938, -0.58184814453125, -0.5582046508789062, -0.5345611572265625, -0.5109176635742188, -0.487274169921875, -0.46363067626953125, -0.4399871826171875, -0.41634368896484375, -0.3927001953125, -0.36905670166015625, -0.3454132080078125, -0.32176971435546875, -0.298126220703125, -0.27448272705078125, -0.2508392333984375, -0.22719573974609375, -0.20355224609375, -0.17990875244140625, -0.1562652587890625, -0.13262176513671875, -0.108978271484375, -0.08533477783203125, -0.0616912841796875, -0.03804779052734375, -0.014404296875, 0.00923919677734375, 0.0328826904296875, 0.05652618408203125, 0.080169677734375, 0.10381317138671875, 0.1274566650390625, 0.15110015869140625, 0.17474365234375, 0.19838714599609375, 0.2220306396484375, 0.24567413330078125, 0.269317626953125, 0.29296112060546875, 0.3166046142578125, 0.34024810791015625, 0.3638916015625, 0.38753509521484375, 0.4111785888671875, 0.43482208251953125, 0.458465576171875, 0.48210906982421875, 0.5057525634765625, 0.5293960571289062, 0.55303955078125, 0.5766830444335938, 0.6003265380859375, 0.6239700317382812, 0.647613525390625, 0.6712570190429688, 0.6949005126953125, 0.7185440063476562, 0.7421875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 10.0, 10.0, 9.0, 10.0, 19.0, 17.0, 28.0, 27.0, 17.0, 34.0, 33.0, 43.0, 42.0, 42.0, 47.0, 48.0, 34.0, 52.0, 48.0, 35.0, 44.0, 38.0, 41.0, 45.0, 33.0, 25.0, 32.0, 18.0, 26.0, 12.0, 11.0, 17.0, 14.0, 8.0, 6.0, 6.0, 6.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2335205078125, -0.22669410705566406, -0.21986770629882812, -0.2130413055419922, -0.20621490478515625, -0.1993885040283203, -0.19256210327148438, -0.18573570251464844, -0.1789093017578125, -0.17208290100097656, -0.16525650024414062, -0.1584300994873047, -0.15160369873046875, -0.1447772979736328, -0.13795089721679688, -0.13112449645996094, -0.124298095703125, -0.11747169494628906, -0.11064529418945312, -0.10381889343261719, -0.09699249267578125, -0.09016609191894531, -0.08333969116210938, -0.07651329040527344, -0.0696868896484375, -0.06286048889160156, -0.056034088134765625, -0.04920768737792969, -0.04238128662109375, -0.03555488586425781, -0.028728485107421875, -0.021902084350585938, -0.01507568359375, -0.008249282836914062, -0.001422882080078125, 0.0054035186767578125, 0.01222991943359375, 0.019056320190429688, 0.025882720947265625, 0.03270912170410156, 0.0395355224609375, 0.04636192321777344, 0.053188323974609375, 0.06001472473144531, 0.06684112548828125, 0.07366752624511719, 0.08049392700195312, 0.08732032775878906, 0.094146728515625, 0.10097312927246094, 0.10779953002929688, 0.11462593078613281, 0.12145233154296875, 0.1282787322998047, 0.13510513305664062, 0.14193153381347656, 0.1487579345703125, 0.15558433532714844, 0.16241073608398438, 0.1692371368408203, 0.17606353759765625, 0.1828899383544922, 0.18971633911132812, 0.19654273986816406, 0.203369140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 7.0, 9.0, 12.0, 11.0, 22.0, 23.0, 33.0, 48.0, 65.0, 92.0, 153.0, 168.0, 261.0, 298.0, 447.0, 620.0, 803.0, 1115.0, 1532.0, 2050.0, 2751.0, 3952.0, 5518.0, 8024.0, 12207.0, 19044.0, 31720.0, 60678.0, 699964.0, 89388.0, 38846.0, 22788.0, 13959.0, 9370.0, 6331.0, 4483.0, 3132.0, 2291.0, 1657.0, 1218.0, 941.0, 678.0, 510.0, 356.0, 253.0, 214.0, 132.0, 101.0, 86.0, 62.0, 43.0, 28.0, 29.0, 17.0, 10.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.162841796875, -0.1577014923095703, -0.15256118774414062, -0.14742088317871094, -0.14228057861328125, -0.13714027404785156, -0.13199996948242188, -0.1268596649169922, -0.1217193603515625, -0.11657905578613281, -0.11143875122070312, -0.10629844665527344, -0.10115814208984375, -0.09601783752441406, -0.09087753295898438, -0.08573722839355469, -0.080596923828125, -0.07545661926269531, -0.07031631469726562, -0.06517601013183594, -0.06003570556640625, -0.05489540100097656, -0.049755096435546875, -0.04461479187011719, -0.0394744873046875, -0.03433418273925781, -0.029193878173828125, -0.024053573608398438, -0.01891326904296875, -0.013772964477539062, -0.008632659912109375, -0.0034923553466796875, 0.00164794921875, 0.0067882537841796875, 0.011928558349609375, 0.017068862915039062, 0.02220916748046875, 0.027349472045898438, 0.032489776611328125, 0.03763008117675781, 0.0427703857421875, 0.04791069030761719, 0.053050994873046875, 0.05819129943847656, 0.06333160400390625, 0.06847190856933594, 0.07361221313476562, 0.07875251770019531, 0.083892822265625, 0.08903312683105469, 0.09417343139648438, 0.09931373596191406, 0.10445404052734375, 0.10959434509277344, 0.11473464965820312, 0.11987495422363281, 0.1250152587890625, 0.1301555633544922, 0.13529586791992188, 0.14043617248535156, 0.14557647705078125, 0.15071678161621094, 0.15585708618164062, 0.1609973907470703, 0.1661376953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 15.0, 15.0, 20.0, 27.0, 41.0, 89.0, 340.0, 235.0, 80.0, 31.0, 29.0, 20.0, 10.0, 11.0, 4.0, 5.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5407800674438477e-05, -1.5020370483398438e-05, -1.4632940292358398e-05, -1.424551010131836e-05, -1.385807991027832e-05, -1.3470649719238281e-05, -1.3083219528198242e-05, -1.2695789337158203e-05, -1.2308359146118164e-05, -1.1920928955078125e-05, -1.1533498764038086e-05, -1.1146068572998047e-05, -1.0758638381958008e-05, -1.0371208190917969e-05, -9.98377799987793e-06, -9.59634780883789e-06, -9.208917617797852e-06, -8.821487426757812e-06, -8.434057235717773e-06, -8.046627044677734e-06, -7.659196853637695e-06, -7.271766662597656e-06, -6.884336471557617e-06, -6.496906280517578e-06, -6.109476089477539e-06, -5.7220458984375e-06, -5.334615707397461e-06, -4.947185516357422e-06, -4.559755325317383e-06, -4.172325134277344e-06, -3.7848949432373047e-06, -3.3974647521972656e-06, -3.0100345611572266e-06, -2.6226043701171875e-06, -2.2351741790771484e-06, -1.8477439880371094e-06, -1.4603137969970703e-06, -1.0728836059570312e-06, -6.854534149169922e-07, -2.980232238769531e-07, 8.940696716308594e-08, 4.76837158203125e-07, 8.642673492431641e-07, 1.2516975402832031e-06, 1.6391277313232422e-06, 2.0265579223632812e-06, 2.4139881134033203e-06, 2.8014183044433594e-06, 3.1888484954833984e-06, 3.5762786865234375e-06, 3.9637088775634766e-06, 4.351139068603516e-06, 4.738569259643555e-06, 5.125999450683594e-06, 5.513429641723633e-06, 5.900859832763672e-06, 6.288290023803711e-06, 6.67572021484375e-06, 7.063150405883789e-06, 7.450580596923828e-06, 7.838010787963867e-06, 8.225440979003906e-06, 8.612871170043945e-06, 9.000301361083984e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 13.0, 17.0, 32.0, 27.0, 43.0, 69.0, 82.0, 116.0, 161.0, 188.0, 264.0, 402.0, 488.0, 712.0, 960.0, 1352.0, 1955.0, 2822.0, 4243.0, 6563.0, 10490.0, 18110.0, 34109.0, 77087.0, 750941.0, 62990.0, 29867.0, 16063.0, 9408.0, 5888.0, 3911.0, 2687.0, 1797.0, 1305.0, 883.0, 724.0, 448.0, 366.0, 244.0, 193.0, 137.0, 102.0, 78.0, 64.0, 34.0, 27.0, 27.0, 16.0, 13.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.2462158203125, -0.2383747100830078, -0.23053359985351562, -0.22269248962402344, -0.21485137939453125, -0.20701026916503906, -0.19916915893554688, -0.1913280487060547, -0.1834869384765625, -0.1756458282470703, -0.16780471801757812, -0.15996360778808594, -0.15212249755859375, -0.14428138732910156, -0.13644027709960938, -0.1285991668701172, -0.120758056640625, -0.11291694641113281, -0.10507583618164062, -0.09723472595214844, -0.08939361572265625, -0.08155250549316406, -0.07371139526367188, -0.06587028503417969, -0.0580291748046875, -0.05018806457519531, -0.042346954345703125, -0.03450584411621094, -0.02666473388671875, -0.018823623657226562, -0.010982513427734375, -0.0031414031982421875, 0.00469970703125, 0.012540817260742188, 0.020381927490234375, 0.028223037719726562, 0.03606414794921875, 0.04390525817871094, 0.051746368408203125, 0.05958747863769531, 0.0674285888671875, 0.07526969909667969, 0.08311080932617188, 0.09095191955566406, 0.09879302978515625, 0.10663414001464844, 0.11447525024414062, 0.12231636047363281, 0.130157470703125, 0.1379985809326172, 0.14583969116210938, 0.15368080139160156, 0.16152191162109375, 0.16936302185058594, 0.17720413208007812, 0.1850452423095703, 0.1928863525390625, 0.2007274627685547, 0.20856857299804688, 0.21640968322753906, 0.22425079345703125, 0.23209190368652344, 0.23993301391601562, 0.2477741241455078, 0.255615234375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 6.0, 12.0, 16.0, 13.0, 16.0, 25.0, 37.0, 21.0, 43.0, 556.0, 48.0, 22.0, 15.0, 22.0, 20.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0823974609375, -0.07986640930175781, -0.07733535766601562, -0.07480430603027344, -0.07227325439453125, -0.06974220275878906, -0.06721115112304688, -0.06468009948730469, -0.0621490478515625, -0.05961799621582031, -0.057086944580078125, -0.05455589294433594, -0.05202484130859375, -0.04949378967285156, -0.046962738037109375, -0.04443168640136719, -0.041900634765625, -0.03936958312988281, -0.036838531494140625, -0.03430747985839844, -0.03177642822265625, -0.029245376586914062, -0.026714324951171875, -0.024183273315429688, -0.0216522216796875, -0.019121170043945312, -0.016590118408203125, -0.014059066772460938, -0.01152801513671875, -0.008996963500976562, -0.006465911865234375, -0.0039348602294921875, -0.00140380859375, 0.0011272430419921875, 0.003658294677734375, 0.0061893463134765625, 0.00872039794921875, 0.011251449584960938, 0.013782501220703125, 0.016313552856445312, 0.0188446044921875, 0.021375656127929688, 0.023906707763671875, 0.026437759399414062, 0.02896881103515625, 0.03149986267089844, 0.034030914306640625, 0.03656196594238281, 0.039093017578125, 0.04162406921386719, 0.044155120849609375, 0.04668617248535156, 0.04921722412109375, 0.05174827575683594, 0.054279327392578125, 0.05681037902832031, 0.0593414306640625, 0.06187248229980469, 0.06440353393554688, 0.06693458557128906, 0.06946563720703125, 0.07199668884277344, 0.07452774047851562, 0.07705879211425781, 0.07958984375]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 3.0, 6.0, 6.0, 11.0, 13.0, 16.0, 19.0, 21.0, 34.0, 38.0, 46.0, 76.0, 105.0, 102.0, 110.0, 82.0, 58.0, 47.0, 41.0, 18.0, 30.0, 23.0, 17.0, 12.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4173910915851593, -0.40293681621551514, -0.38848257064819336, -0.3740282952785492, -0.35957401990890503, -0.34511977434158325, -0.3306654989719391, -0.3162112236022949, -0.30175697803497314, -0.287302702665329, -0.2728484570980072, -0.25839418172836304, -0.24393990635871887, -0.2294856458902359, -0.21503138542175293, -0.20057711005210876, -0.1861228346824646, -0.17166857421398163, -0.15721429884433746, -0.1427600383758545, -0.12830576300621033, -0.11385150253772736, -0.09939724206924438, -0.08494297415018082, -0.07048870623111725, -0.05603443831205368, -0.04158017411828041, -0.02712590992450714, -0.012671642005443573, 0.0017826259136199951, 0.016236886382102966, 0.030691154301166534, 0.04514545202255249, 0.05959971994161606, 0.07405398786067963, 0.0885082483291626, 0.10296251624822617, 0.11741678416728973, 0.1318710446357727, 0.14632532000541687, 0.16077958047389984, 0.1752338409423828, 0.18968811631202698, 0.20414237678050995, 0.21859663724899292, 0.23305091261863708, 0.24750517308712006, 0.261959433555603, 0.2764137089252472, 0.29086798429489136, 0.30532222986221313, 0.3197765052318573, 0.33423078060150146, 0.34868502616882324, 0.3631393015384674, 0.3775935769081116, 0.39204782247543335, 0.4065020978450775, 0.4209563434123993, 0.43541061878204346, 0.4498648941516876, 0.4643191695213318, 0.47877341508865356, 0.49322769045829773, 0.5076819658279419]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 8.0, 3.0, 5.0, 11.0, 16.0, 14.0, 17.0, 20.0, 15.0, 24.0, 19.0, 29.0, 33.0, 30.0, 33.0, 44.0, 40.0, 25.0, 35.0, 40.0, 26.0, 39.0, 43.0, 33.0, 43.0, 38.0, 26.0, 33.0, 28.0, 41.0, 24.0, 27.0, 19.0, 23.0, 15.0, 13.0, 13.0, 8.0, 12.0, 9.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.30924877524375916, -0.29950910806655884, -0.2897694408893585, -0.2800297737121582, -0.2702901065349579, -0.26055043935775757, -0.25081077218055725, -0.24107110500335693, -0.23133143782615662, -0.2215917706489563, -0.21185210347175598, -0.20211243629455566, -0.19237276911735535, -0.18263310194015503, -0.1728934347629547, -0.1631537675857544, -0.15341410040855408, -0.14367443323135376, -0.13393476605415344, -0.12419509887695312, -0.11445543169975281, -0.10471576452255249, -0.09497609734535217, -0.08523643016815186, -0.07549676299095154, -0.06575709581375122, -0.0560174286365509, -0.046277761459350586, -0.03653809428215027, -0.02679842710494995, -0.017058759927749634, -0.007319092750549316, 0.0024205446243286133, 0.01216021180152893, 0.021899878978729248, 0.031639546155929565, 0.04137921333312988, 0.0511188805103302, 0.06085854768753052, 0.07059821486473083, 0.08033788204193115, 0.09007754921913147, 0.09981721639633179, 0.1095568835735321, 0.11929655075073242, 0.12903621792793274, 0.13877588510513306, 0.14851555228233337, 0.1582552194595337, 0.167994886636734, 0.17773455381393433, 0.18747422099113464, 0.19721388816833496, 0.20695355534553528, 0.2166932225227356, 0.2264328896999359, 0.23617255687713623, 0.24591222405433655, 0.25565189123153687, 0.2653915584087372, 0.2751312255859375, 0.2848708927631378, 0.29461055994033813, 0.30435022711753845, 0.31408989429473877]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 6.0, 14.0, 13.0, 18.0, 30.0, 71.0, 94.0, 133.0, 232.0, 393.0, 648.0, 1087.0, 1774.0, 2974.0, 4988.0, 8500.0, 14579.0, 25476.0, 46905.0, 91702.0, 195657.0, 556398.0, 1880694.0, 874088.0, 253392.0, 109996.0, 54293.0, 29479.0, 16508.0, 9685.0, 5939.0, 3550.0, 2033.0, 1248.0, 726.0, 401.0, 223.0, 118.0, 71.0, 51.0, 36.0, 21.0, 22.0, 11.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.4167366027832031, -0.40110015869140625, -0.3854637145996094, -0.3698272705078125, -0.3541908264160156, -0.33855438232421875, -0.3229179382324219, -0.307281494140625, -0.2916450500488281, -0.27600860595703125, -0.2603721618652344, -0.2447357177734375, -0.22909927368164062, -0.21346282958984375, -0.19782638549804688, -0.18218994140625, -0.16655349731445312, -0.15091705322265625, -0.13528060913085938, -0.1196441650390625, -0.10400772094726562, -0.08837127685546875, -0.07273483276367188, -0.057098388671875, -0.041461944580078125, -0.02582550048828125, -0.010189056396484375, 0.0054473876953125, 0.021083831787109375, 0.03672027587890625, 0.052356719970703125, 0.0679931640625, 0.08362960815429688, 0.09926605224609375, 0.11490249633789062, 0.1305389404296875, 0.14617538452148438, 0.16181182861328125, 0.17744827270507812, 0.193084716796875, 0.20872116088867188, 0.22435760498046875, 0.23999404907226562, 0.2556304931640625, 0.2712669372558594, 0.28690338134765625, 0.3025398254394531, 0.31817626953125, 0.3338127136230469, 0.34944915771484375, 0.3650856018066406, 0.3807220458984375, 0.3963584899902344, 0.41199493408203125, 0.4276313781738281, 0.443267822265625, 0.4589042663574219, 0.47454071044921875, 0.4901771545410156, 0.5058135986328125, 0.5214500427246094, 0.5370864868164062, 0.5527229309082031, 0.568359375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 11.0, 8.0, 20.0, 16.0, 11.0, 19.0, 20.0, 19.0, 26.0, 39.0, 33.0, 34.0, 34.0, 48.0, 41.0, 46.0, 38.0, 36.0, 56.0, 38.0, 35.0, 49.0, 34.0, 35.0, 31.0, 35.0, 29.0, 19.0, 22.0, 21.0, 10.0, 16.0, 12.0, 11.0, 4.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.18994712829589844, -0.18348312377929688, -0.1770191192626953, -0.17055511474609375, -0.1640911102294922, -0.15762710571289062, -0.15116310119628906, -0.1446990966796875, -0.13823509216308594, -0.13177108764648438, -0.1253070831298828, -0.11884307861328125, -0.11237907409667969, -0.10591506958007812, -0.09945106506347656, -0.092987060546875, -0.08652305603027344, -0.08005905151367188, -0.07359504699707031, -0.06713104248046875, -0.06066703796386719, -0.054203033447265625, -0.04773902893066406, -0.0412750244140625, -0.03481101989746094, -0.028347015380859375, -0.021883010864257812, -0.01541900634765625, -0.008955001831054688, -0.002490997314453125, 0.0039730072021484375, 0.01043701171875, 0.016901016235351562, 0.023365020751953125, 0.029829025268554688, 0.03629302978515625, 0.04275703430175781, 0.049221038818359375, 0.05568504333496094, 0.0621490478515625, 0.06861305236816406, 0.07507705688476562, 0.08154106140136719, 0.08800506591796875, 0.09446907043457031, 0.10093307495117188, 0.10739707946777344, 0.113861083984375, 0.12032508850097656, 0.12678909301757812, 0.1332530975341797, 0.13971710205078125, 0.1461811065673828, 0.15264511108398438, 0.15910911560058594, 0.1655731201171875, 0.17203712463378906, 0.17850112915039062, 0.1849651336669922, 0.19142913818359375, 0.1978931427001953, 0.20435714721679688, 0.21082115173339844, 0.21728515625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 13.0, 13.0, 20.0, 40.0, 41.0, 69.0, 118.0, 179.0, 314.0, 500.0, 834.0, 1504.0, 2576.0, 4406.0, 7492.0, 13016.0, 22825.0, 40263.0, 75189.0, 148170.0, 320659.0, 854228.0, 1593315.0, 603994.0, 246066.0, 118600.0, 61511.0, 33146.0, 18927.0, 10830.0, 6350.0, 3725.0, 2090.0, 1238.0, 783.0, 445.0, 262.0, 176.0, 105.0, 67.0, 48.0, 26.0, 28.0, 15.0, 16.0, 5.0, 12.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.401123046875, -0.38909149169921875, -0.3770599365234375, -0.36502838134765625, -0.352996826171875, -0.34096527099609375, -0.3289337158203125, -0.31690216064453125, -0.30487060546875, -0.29283905029296875, -0.2808074951171875, -0.26877593994140625, -0.256744384765625, -0.24471282958984375, -0.2326812744140625, -0.22064971923828125, -0.2086181640625, -0.19658660888671875, -0.1845550537109375, -0.17252349853515625, -0.160491943359375, -0.14846038818359375, -0.1364288330078125, -0.12439727783203125, -0.11236572265625, -0.10033416748046875, -0.0883026123046875, -0.07627105712890625, -0.064239501953125, -0.05220794677734375, -0.0401763916015625, -0.02814483642578125, -0.01611328125, -0.00408172607421875, 0.0079498291015625, 0.01998138427734375, 0.032012939453125, 0.04404449462890625, 0.0560760498046875, 0.06810760498046875, 0.08013916015625, 0.09217071533203125, 0.1042022705078125, 0.11623382568359375, 0.128265380859375, 0.14029693603515625, 0.1523284912109375, 0.16436004638671875, 0.1763916015625, 0.18842315673828125, 0.2004547119140625, 0.21248626708984375, 0.224517822265625, 0.23654937744140625, 0.2485809326171875, 0.26061248779296875, 0.27264404296875, 0.28467559814453125, 0.2967071533203125, 0.30873870849609375, 0.320770263671875, 0.33280181884765625, 0.3448333740234375, 0.35686492919921875, 0.368896484375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 12.0, 17.0, 25.0, 18.0, 38.0, 32.0, 53.0, 69.0, 61.0, 86.0, 114.0, 144.0, 175.0, 218.0, 238.0, 245.0, 324.0, 347.0, 294.0, 277.0, 236.0, 229.0, 175.0, 133.0, 119.0, 98.0, 71.0, 60.0, 35.0, 38.0, 27.0, 17.0, 15.0, 7.0, 10.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10736083984375, -0.10346317291259766, -0.09956550598144531, -0.09566783905029297, -0.09177017211914062, -0.08787250518798828, -0.08397483825683594, -0.0800771713256836, -0.07617950439453125, -0.0722818374633789, -0.06838417053222656, -0.06448650360107422, -0.060588836669921875, -0.05669116973876953, -0.05279350280761719, -0.048895835876464844, -0.0449981689453125, -0.041100502014160156, -0.03720283508300781, -0.03330516815185547, -0.029407501220703125, -0.02550983428955078, -0.021612167358398438, -0.017714500427246094, -0.01381683349609375, -0.009919166564941406, -0.0060214996337890625, -0.0021238327026367188, 0.001773834228515625, 0.005671501159667969, 0.009569168090820312, 0.013466835021972656, 0.017364501953125, 0.021262168884277344, 0.025159835815429688, 0.02905750274658203, 0.032955169677734375, 0.03685283660888672, 0.04075050354003906, 0.044648170471191406, 0.04854583740234375, 0.052443504333496094, 0.05634117126464844, 0.06023883819580078, 0.06413650512695312, 0.06803417205810547, 0.07193183898925781, 0.07582950592041016, 0.0797271728515625, 0.08362483978271484, 0.08752250671386719, 0.09142017364501953, 0.09531784057617188, 0.09921550750732422, 0.10311317443847656, 0.1070108413696289, 0.11090850830078125, 0.1148061752319336, 0.11870384216308594, 0.12260150909423828, 0.12649917602539062, 0.13039684295654297, 0.1342945098876953, 0.13819217681884766, 0.14208984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 11.0, 9.0, 8.0, 9.0, 9.0, 22.0, 21.0, 27.0, 39.0, 43.0, 58.0, 62.0, 98.0, 104.0, 103.0, 84.0, 60.0, 50.0, 43.0, 31.0, 28.0, 20.0, 12.0, 10.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.4097573757171631, -0.3989008069038391, -0.38804423809051514, -0.37718766927719116, -0.3663311004638672, -0.3554745614528656, -0.3446179926395416, -0.33376142382621765, -0.3229048550128937, -0.3120482861995697, -0.3011917173862457, -0.29033514857292175, -0.27947860956192017, -0.2686220407485962, -0.2577654719352722, -0.24690890312194824, -0.23605233430862427, -0.2251957654953003, -0.21433919668197632, -0.20348264276981354, -0.19262607395648956, -0.1817695051431656, -0.1709129512310028, -0.16005638241767883, -0.14919981360435486, -0.13834324479103088, -0.1274866759777069, -0.11663012206554413, -0.10577355325222015, -0.09491698443889618, -0.0840604230761528, -0.07320386171340942, -0.06234732270240784, -0.05149075761437416, -0.040634192526340485, -0.02977762743830681, -0.018921062350273132, -0.008064497262239456, 0.00279206782579422, 0.013648629188537598, 0.024505198001861572, 0.03536176308989525, 0.046218328177928925, 0.0570748932659626, 0.06793145835399628, 0.07878802716732025, 0.08964458853006363, 0.100501149892807, 0.11135771870613098, 0.12221428751945496, 0.13307085633277893, 0.1439274102449417, 0.15478397905826569, 0.16564054787158966, 0.17649710178375244, 0.18735367059707642, 0.1982102394104004, 0.20906680822372437, 0.21992337703704834, 0.23077993094921112, 0.2416364997625351, 0.2524930536746979, 0.26334962248802185, 0.2742061913013458, 0.2850627601146698]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 1.0, 2.0, 5.0, 2.0, 12.0, 13.0, 9.0, 17.0, 18.0, 20.0, 19.0, 22.0, 31.0, 27.0, 28.0, 33.0, 28.0, 34.0, 35.0, 34.0, 41.0, 35.0, 39.0, 36.0, 33.0, 36.0, 45.0, 35.0, 40.0, 23.0, 24.0, 30.0, 36.0, 15.0, 25.0, 21.0, 14.0, 12.0, 9.0, 10.0, 9.0, 10.0, 10.0, 5.0, 2.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20034931600093842, -0.19382792711257935, -0.18730653822422028, -0.1807851493358612, -0.17426376044750214, -0.16774237155914307, -0.1612209975719452, -0.15469959378242493, -0.14817821979522705, -0.14165683090686798, -0.1351354420185089, -0.12861405313014984, -0.12209266424179077, -0.1155712753534317, -0.10904989391565323, -0.10252850502729416, -0.09600710868835449, -0.08948571979999542, -0.08296433091163635, -0.07644294202327728, -0.06992155313491821, -0.06340016424655914, -0.05687878280878067, -0.0503573939204216, -0.04383600503206253, -0.03731461614370346, -0.03079322911798954, -0.02427184209227562, -0.01775045320391655, -0.01122906431555748, -0.0047076791524887085, 0.0018137097358703613, 0.008335113525390625, 0.01485650148242712, 0.021377889439463615, 0.027899276465177536, 0.034420665353536606, 0.040942054241895676, 0.04746343940496445, 0.05398482829332352, 0.06050621718168259, 0.06702760607004166, 0.07354899495840073, 0.0800703763961792, 0.08659176528453827, 0.09311315417289734, 0.09963454306125641, 0.10615593194961548, 0.11267732083797455, 0.11919870972633362, 0.1257200986146927, 0.13224148750305176, 0.13876287639141083, 0.1452842652797699, 0.15180563926696777, 0.15832704305648804, 0.1648484170436859, 0.17136980593204498, 0.17789119482040405, 0.18441258370876312, 0.1909339725971222, 0.19745536148548126, 0.20397675037384033, 0.2104981243610382, 0.21701952815055847]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 4.0, 15.0, 13.0, 19.0, 25.0, 51.0, 64.0, 107.0, 155.0, 269.0, 484.0, 690.0, 1195.0, 1856.0, 3166.0, 5264.0, 9227.0, 16368.0, 30339.0, 62674.0, 170256.0, 452341.0, 164648.0, 61053.0, 29824.0, 16119.0, 8973.0, 5290.0, 3080.0, 1945.0, 1152.0, 703.0, 416.0, 285.0, 179.0, 94.0, 62.0, 45.0, 38.0, 19.0, 8.0, 6.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2327880859375, -0.22562217712402344, -0.21845626831054688, -0.2112903594970703, -0.20412445068359375, -0.1969585418701172, -0.18979263305664062, -0.18262672424316406, -0.1754608154296875, -0.16829490661621094, -0.16112899780273438, -0.1539630889892578, -0.14679718017578125, -0.1396312713623047, -0.13246536254882812, -0.12529945373535156, -0.118133544921875, -0.11096763610839844, -0.10380172729492188, -0.09663581848144531, -0.08946990966796875, -0.08230400085449219, -0.07513809204101562, -0.06797218322753906, -0.0608062744140625, -0.05364036560058594, -0.046474456787109375, -0.03930854797363281, -0.03214263916015625, -0.024976730346679688, -0.017810821533203125, -0.010644912719726562, -0.00347900390625, 0.0036869049072265625, 0.010852813720703125, 0.018018722534179688, 0.02518463134765625, 0.03235054016113281, 0.039516448974609375, 0.04668235778808594, 0.0538482666015625, 0.06101417541503906, 0.06818008422851562, 0.07534599304199219, 0.08251190185546875, 0.08967781066894531, 0.09684371948242188, 0.10400962829589844, 0.111175537109375, 0.11834144592285156, 0.12550735473632812, 0.1326732635498047, 0.13983917236328125, 0.1470050811767578, 0.15417098999023438, 0.16133689880371094, 0.1685028076171875, 0.17566871643066406, 0.18283462524414062, 0.1900005340576172, 0.19716644287109375, 0.2043323516845703, 0.21149826049804688, 0.21866416931152344, 0.225830078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 12.0, 6.0, 13.0, 7.0, 16.0, 17.0, 17.0, 23.0, 20.0, 26.0, 28.0, 26.0, 44.0, 34.0, 36.0, 29.0, 34.0, 40.0, 30.0, 39.0, 35.0, 37.0, 40.0, 33.0, 38.0, 42.0, 32.0, 30.0, 39.0, 28.0, 22.0, 18.0, 16.0, 13.0, 14.0, 8.0, 10.0, 11.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2086181640625, -0.2018299102783203, -0.19504165649414062, -0.18825340270996094, -0.18146514892578125, -0.17467689514160156, -0.16788864135742188, -0.1611003875732422, -0.1543121337890625, -0.1475238800048828, -0.14073562622070312, -0.13394737243652344, -0.12715911865234375, -0.12037086486816406, -0.11358261108398438, -0.10679435729980469, -0.100006103515625, -0.09321784973144531, -0.08642959594726562, -0.07964134216308594, -0.07285308837890625, -0.06606483459472656, -0.059276580810546875, -0.05248832702636719, -0.0457000732421875, -0.03891181945800781, -0.032123565673828125, -0.025335311889648438, -0.01854705810546875, -0.011758804321289062, -0.004970550537109375, 0.0018177032470703125, 0.00860595703125, 0.015394210815429688, 0.022182464599609375, 0.028970718383789062, 0.03575897216796875, 0.04254722595214844, 0.049335479736328125, 0.05612373352050781, 0.0629119873046875, 0.06970024108886719, 0.07648849487304688, 0.08327674865722656, 0.09006500244140625, 0.09685325622558594, 0.10364151000976562, 0.11042976379394531, 0.117218017578125, 0.12400627136230469, 0.13079452514648438, 0.13758277893066406, 0.14437103271484375, 0.15115928649902344, 0.15794754028320312, 0.1647357940673828, 0.1715240478515625, 0.1783123016357422, 0.18510055541992188, 0.19188880920410156, 0.19867706298828125, 0.20546531677246094, 0.21225357055664062, 0.2190418243408203, 0.225830078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 8.0, 6.0, 7.0, 22.0, 20.0, 36.0, 31.0, 66.0, 84.0, 131.0, 159.0, 233.0, 350.0, 524.0, 751.0, 1137.0, 1646.0, 2659.0, 4377.0, 7484.0, 14900.0, 37470.0, 234837.0, 642954.0, 56074.0, 19148.0, 9344.0, 5169.0, 3046.0, 1868.0, 1223.0, 843.0, 609.0, 378.0, 257.0, 204.0, 128.0, 98.0, 86.0, 42.0, 43.0, 29.0, 18.0, 18.0, 6.0, 9.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.370849609375, -0.35894775390625, -0.3470458984375, -0.33514404296875, -0.3232421875, -0.31134033203125, -0.2994384765625, -0.28753662109375, -0.275634765625, -0.26373291015625, -0.2518310546875, -0.23992919921875, -0.22802734375, -0.21612548828125, -0.2042236328125, -0.19232177734375, -0.180419921875, -0.16851806640625, -0.1566162109375, -0.14471435546875, -0.1328125, -0.12091064453125, -0.1090087890625, -0.09710693359375, -0.085205078125, -0.07330322265625, -0.0614013671875, -0.04949951171875, -0.03759765625, -0.02569580078125, -0.0137939453125, -0.00189208984375, 0.010009765625, 0.02191162109375, 0.0338134765625, 0.04571533203125, 0.0576171875, 0.06951904296875, 0.0814208984375, 0.09332275390625, 0.105224609375, 0.11712646484375, 0.1290283203125, 0.14093017578125, 0.15283203125, 0.16473388671875, 0.1766357421875, 0.18853759765625, 0.200439453125, 0.21234130859375, 0.2242431640625, 0.23614501953125, 0.248046875, 0.25994873046875, 0.2718505859375, 0.28375244140625, 0.295654296875, 0.30755615234375, 0.3194580078125, 0.33135986328125, 0.34326171875, 0.35516357421875, 0.3670654296875, 0.37896728515625, 0.390869140625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 7.0, 3.0, 7.0, 16.0, 19.0, 12.0, 24.0, 20.0, 22.0, 31.0, 24.0, 22.0, 42.0, 46.0, 42.0, 41.0, 47.0, 44.0, 46.0, 40.0, 46.0, 55.0, 45.0, 36.0, 30.0, 33.0, 29.0, 26.0, 23.0, 21.0, 15.0, 13.0, 15.0, 12.0, 17.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173095703125, -0.1680736541748047, -0.16305160522460938, -0.15802955627441406, -0.15300750732421875, -0.14798545837402344, -0.14296340942382812, -0.1379413604736328, -0.1329193115234375, -0.1278972625732422, -0.12287521362304688, -0.11785316467285156, -0.11283111572265625, -0.10780906677246094, -0.10278701782226562, -0.09776496887207031, -0.092742919921875, -0.08772087097167969, -0.08269882202148438, -0.07767677307128906, -0.07265472412109375, -0.06763267517089844, -0.06261062622070312, -0.05758857727050781, -0.0525665283203125, -0.04754447937011719, -0.042522430419921875, -0.03750038146972656, -0.03247833251953125, -0.027456283569335938, -0.022434234619140625, -0.017412185668945312, -0.01239013671875, -0.0073680877685546875, -0.002346038818359375, 0.0026760101318359375, 0.00769805908203125, 0.012720108032226562, 0.017742156982421875, 0.022764205932617188, 0.0277862548828125, 0.03280830383300781, 0.037830352783203125, 0.04285240173339844, 0.04787445068359375, 0.05289649963378906, 0.057918548583984375, 0.06294059753417969, 0.067962646484375, 0.07298469543457031, 0.07800674438476562, 0.08302879333496094, 0.08805084228515625, 0.09307289123535156, 0.09809494018554688, 0.10311698913574219, 0.1081390380859375, 0.11316108703613281, 0.11818313598632812, 0.12320518493652344, 0.12822723388671875, 0.13324928283691406, 0.13827133178710938, 0.1432933807373047, 0.1483154296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 10.0, 6.0, 13.0, 13.0, 16.0, 22.0, 41.0, 53.0, 68.0, 65.0, 103.0, 133.0, 141.0, 220.0, 322.0, 376.0, 553.0, 768.0, 1121.0, 1712.0, 2643.0, 4193.0, 7551.0, 15571.0, 45142.0, 438701.0, 448323.0, 44697.0, 15725.0, 7576.0, 4258.0, 2601.0, 1701.0, 1156.0, 746.0, 560.0, 408.0, 302.0, 231.0, 170.0, 127.0, 108.0, 71.0, 65.0, 47.0, 32.0, 26.0, 20.0, 13.0, 10.0, 8.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0], "bins": [-0.047760009765625, -0.046312808990478516, -0.04486560821533203, -0.04341840744018555, -0.04197120666503906, -0.04052400588989258, -0.039076805114746094, -0.03762960433959961, -0.036182403564453125, -0.03473520278930664, -0.033288002014160156, -0.03184080123901367, -0.030393600463867188, -0.028946399688720703, -0.02749919891357422, -0.026051998138427734, -0.02460479736328125, -0.023157596588134766, -0.02171039581298828, -0.020263195037841797, -0.018815994262695312, -0.017368793487548828, -0.015921592712402344, -0.01447439193725586, -0.013027191162109375, -0.01157999038696289, -0.010132789611816406, -0.008685588836669922, -0.0072383880615234375, -0.005791187286376953, -0.004343986511230469, -0.0028967857360839844, -0.0014495849609375, -2.384185791015625e-06, 0.0014448165893554688, 0.002892017364501953, 0.0043392181396484375, 0.005786418914794922, 0.007233619689941406, 0.00868082046508789, 0.010128021240234375, 0.01157522201538086, 0.013022422790527344, 0.014469623565673828, 0.015916824340820312, 0.017364025115966797, 0.01881122589111328, 0.020258426666259766, 0.02170562744140625, 0.023152828216552734, 0.02460002899169922, 0.026047229766845703, 0.027494430541992188, 0.028941631317138672, 0.030388832092285156, 0.03183603286743164, 0.033283233642578125, 0.03473043441772461, 0.036177635192871094, 0.03762483596801758, 0.03907203674316406, 0.04051923751831055, 0.04196643829345703, 0.043413639068603516, 0.04486083984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 11.0, 7.0, 8.0, 6.0, 18.0, 11.0, 21.0, 20.0, 24.0, 67.0, 41.0, 39.0, 68.0, 54.0, 138.0, 67.0, 66.0, 56.0, 92.0, 30.0, 17.0, 19.0, 12.0, 26.0, 7.0, 9.0, 12.0, 15.0, 10.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.3115426301956177e-06, -2.2388994693756104e-06, -2.166256308555603e-06, -2.0936131477355957e-06, -2.0209699869155884e-06, -1.948326826095581e-06, -1.8756836652755737e-06, -1.8030405044555664e-06, -1.730397343635559e-06, -1.6577541828155518e-06, -1.5851110219955444e-06, -1.5124678611755371e-06, -1.4398247003555298e-06, -1.3671815395355225e-06, -1.2945383787155151e-06, -1.2218952178955078e-06, -1.1492520570755005e-06, -1.0766088962554932e-06, -1.0039657354354858e-06, -9.313225746154785e-07, -8.586794137954712e-07, -7.860362529754639e-07, -7.133930921554565e-07, -6.407499313354492e-07, -5.681067705154419e-07, -4.954636096954346e-07, -4.2282044887542725e-07, -3.501772880554199e-07, -2.775341272354126e-07, -2.0489096641540527e-07, -1.3224780559539795e-07, -5.960464477539063e-08, 1.30385160446167e-08, 8.568167686462402e-08, 1.5832483768463135e-07, 2.3096799850463867e-07, 3.03611159324646e-07, 3.762543201446533e-07, 4.4889748096466064e-07, 5.21540641784668e-07, 5.941838026046753e-07, 6.668269634246826e-07, 7.394701242446899e-07, 8.121132850646973e-07, 8.847564458847046e-07, 9.57399606704712e-07, 1.0300427675247192e-06, 1.1026859283447266e-06, 1.1753290891647339e-06, 1.2479722499847412e-06, 1.3206154108047485e-06, 1.3932585716247559e-06, 1.4659017324447632e-06, 1.5385448932647705e-06, 1.6111880540847778e-06, 1.6838312149047852e-06, 1.7564743757247925e-06, 1.8291175365447998e-06, 1.9017606973648071e-06, 1.9744038581848145e-06, 2.0470470190048218e-06, 2.119690179824829e-06, 2.1923333406448364e-06, 2.2649765014648438e-06]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 6.0, 15.0, 7.0, 21.0, 28.0, 37.0, 36.0, 50.0, 70.0, 122.0, 142.0, 181.0, 284.0, 381.0, 536.0, 739.0, 936.0, 1275.0, 1737.0, 2509.0, 3422.0, 5068.0, 7616.0, 11575.0, 19850.0, 34829.0, 75192.0, 296157.0, 400982.0, 86285.0, 38169.0, 21082.0, 12696.0, 8088.0, 5219.0, 3705.0, 2523.0, 1853.0, 1351.0, 997.0, 753.0, 516.0, 423.0, 289.0, 246.0, 132.0, 146.0, 81.0, 66.0, 46.0, 27.0, 23.0, 17.0, 9.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.03460693359375, -0.03352785110473633, -0.032448768615722656, -0.031369686126708984, -0.030290603637695312, -0.02921152114868164, -0.02813243865966797, -0.027053356170654297, -0.025974273681640625, -0.024895191192626953, -0.02381610870361328, -0.02273702621459961, -0.021657943725585938, -0.020578861236572266, -0.019499778747558594, -0.018420696258544922, -0.01734161376953125, -0.016262531280517578, -0.015183448791503906, -0.014104366302490234, -0.013025283813476562, -0.01194620132446289, -0.010867118835449219, -0.009788036346435547, -0.008708953857421875, -0.007629871368408203, -0.006550788879394531, -0.005471706390380859, -0.0043926239013671875, -0.0033135414123535156, -0.0022344589233398438, -0.0011553764343261719, -7.62939453125e-05, 0.0010027885437011719, 0.0020818710327148438, 0.0031609535217285156, 0.0042400360107421875, 0.005319118499755859, 0.006398200988769531, 0.007477283477783203, 0.008556365966796875, 0.009635448455810547, 0.010714530944824219, 0.01179361343383789, 0.012872695922851562, 0.013951778411865234, 0.015030860900878906, 0.016109943389892578, 0.01718902587890625, 0.018268108367919922, 0.019347190856933594, 0.020426273345947266, 0.021505355834960938, 0.02258443832397461, 0.02366352081298828, 0.024742603302001953, 0.025821685791015625, 0.026900768280029297, 0.02797985076904297, 0.02905893325805664, 0.030138015747070312, 0.031217098236083984, 0.032296180725097656, 0.03337526321411133, 0.034454345703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 5.0, 4.0, 11.0, 10.0, 4.0, 21.0, 15.0, 19.0, 27.0, 34.0, 44.0, 76.0, 93.0, 169.0, 144.0, 77.0, 38.0, 52.0, 28.0, 25.0, 21.0, 16.0, 19.0, 15.0, 7.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.0114593505859375, -0.01109933853149414, -0.010739326477050781, -0.010379314422607422, -0.010019302368164062, -0.009659290313720703, -0.009299278259277344, -0.008939266204833984, -0.008579254150390625, -0.008219242095947266, -0.007859230041503906, -0.007499217987060547, -0.0071392059326171875, -0.006779193878173828, -0.006419181823730469, -0.006059169769287109, -0.00569915771484375, -0.005339145660400391, -0.004979133605957031, -0.004619121551513672, -0.0042591094970703125, -0.003899097442626953, -0.0035390853881835938, -0.0031790733337402344, -0.002819061279296875, -0.0024590492248535156, -0.0020990371704101562, -0.0017390251159667969, -0.0013790130615234375, -0.0010190010070800781, -0.0006589889526367188, -0.0002989768981933594, 6.103515625e-05, 0.0004210472106933594, 0.0007810592651367188, 0.0011410713195800781, 0.0015010833740234375, 0.0018610954284667969, 0.0022211074829101562, 0.0025811195373535156, 0.002941131591796875, 0.0033011436462402344, 0.0036611557006835938, 0.004021167755126953, 0.0043811798095703125, 0.004741191864013672, 0.005101203918457031, 0.005461215972900391, 0.00582122802734375, 0.006181240081787109, 0.006541252136230469, 0.006901264190673828, 0.0072612762451171875, 0.007621288299560547, 0.007981300354003906, 0.008341312408447266, 0.008701324462890625, 0.009061336517333984, 0.009421348571777344, 0.009781360626220703, 0.010141372680664062, 0.010501384735107422, 0.010861396789550781, 0.01122140884399414, 0.0115814208984375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 12.0, 12.0, 12.0, 14.0, 27.0, 29.0, 38.0, 53.0, 61.0, 79.0, 113.0, 96.0, 99.0, 73.0, 56.0, 43.0, 40.0, 28.0, 19.0, 20.0, 13.0, 11.0, 7.0, 9.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.40748143196105957, -0.39656150341033936, -0.38564157485961914, -0.3747216761112213, -0.3638017475605011, -0.3528818190097809, -0.34196192026138306, -0.33104199171066284, -0.3201220631599426, -0.3092021346092224, -0.2982822060585022, -0.28736230731010437, -0.27644237875938416, -0.26552245020866394, -0.2546025514602661, -0.2436826229095459, -0.23276269435882568, -0.22184276580810547, -0.21092285215854645, -0.20000293850898743, -0.1890830099582672, -0.178163081407547, -0.16724316775798798, -0.15632325410842896, -0.14540332555770874, -0.13448339700698853, -0.1235634833574295, -0.11264356225728989, -0.10172364115715027, -0.09080372005701065, -0.07988379895687103, -0.06896387785673141, -0.058043986558914185, -0.04712406545877457, -0.03620414435863495, -0.02528422325849533, -0.014364302158355713, -0.003444381058216095, 0.007475540041923523, 0.01839546114206314, 0.02931538224220276, 0.04023530334234238, 0.051155224442481995, 0.06207514554262161, 0.07299506664276123, 0.08391498774290085, 0.09483490884304047, 0.10575482994318008, 0.1166747510433197, 0.12759467959403992, 0.13851459324359894, 0.14943450689315796, 0.16035443544387817, 0.1712743639945984, 0.1821942776441574, 0.19311419129371643, 0.20403411984443665, 0.21495404839515686, 0.22587396204471588, 0.2367938756942749, 0.24771380424499512, 0.25863373279571533, 0.26955366134643555, 0.2804735600948334, 0.2913934886455536]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 5.0, 1.0, 5.0, 10.0, 13.0, 7.0, 16.0, 18.0, 21.0, 22.0, 20.0, 29.0, 32.0, 20.0, 38.0, 25.0, 34.0, 36.0, 36.0, 37.0, 38.0, 35.0, 39.0, 33.0, 39.0, 36.0, 45.0, 38.0, 23.0, 23.0, 31.0, 30.0, 22.0, 20.0, 26.0, 13.0, 13.0, 8.0, 10.0, 10.0, 9.0, 11.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1973443478345871, -0.19091796875, -0.1844916045665741, -0.178065225481987, -0.1716388463973999, -0.1652124673128128, -0.1587860882282257, -0.1523597240447998, -0.1459333449602127, -0.1395069658756256, -0.1330806016921997, -0.1266542226076126, -0.12022784352302551, -0.11380146443843842, -0.10737509280443192, -0.10094872117042542, -0.09452234208583832, -0.08809596300125122, -0.08166959136724472, -0.07524321973323822, -0.06881684064865112, -0.062390465289354324, -0.055964089930057526, -0.04953771457076073, -0.04311133921146393, -0.03668496385216713, -0.03025858849287033, -0.023832213133573532, -0.017405837774276733, -0.010979462414979935, -0.004553087055683136, 0.0018732883036136627, 0.008299678564071655, 0.014726053923368454, 0.021152429282665253, 0.02757880464196205, 0.03400518000125885, 0.04043155536055565, 0.04685793071985245, 0.053284306079149246, 0.059710681438446045, 0.06613706052303314, 0.07256343215703964, 0.07898980379104614, 0.08541618287563324, 0.09184256196022034, 0.09826893359422684, 0.10469530522823334, 0.11112168431282043, 0.11754806339740753, 0.12397443503141403, 0.13040080666542053, 0.13682718575000763, 0.14325356483459473, 0.14967992901802063, 0.15610630810260773, 0.16253268718719482, 0.16895906627178192, 0.17538544535636902, 0.18181180953979492, 0.18823818862438202, 0.19466456770896912, 0.20109093189239502, 0.20751731097698212, 0.2139436900615692]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 6.0, 9.0, 12.0, 19.0, 20.0, 32.0, 49.0, 75.0, 110.0, 141.0, 196.0, 289.0, 387.0, 678.0, 880.0, 1312.0, 2022.0, 3046.0, 4763.0, 7119.0, 11000.0, 17654.0, 27817.0, 44829.0, 76776.0, 140441.0, 244609.0, 199076.0, 106098.0, 59695.0, 36057.0, 22462.0, 14215.0, 9056.0, 5911.0, 3867.0, 2564.0, 1663.0, 1140.0, 779.0, 555.0, 359.0, 228.0, 159.0, 120.0, 93.0, 50.0, 46.0, 23.0, 13.0, 14.0, 6.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.376953125, -0.3647041320800781, -0.35245513916015625, -0.3402061462402344, -0.3279571533203125, -0.3157081604003906, -0.30345916748046875, -0.2912101745605469, -0.278961181640625, -0.2667121887207031, -0.25446319580078125, -0.24221420288085938, -0.2299652099609375, -0.21771621704101562, -0.20546722412109375, -0.19321823120117188, -0.18096923828125, -0.16872024536132812, -0.15647125244140625, -0.14422225952148438, -0.1319732666015625, -0.11972427368164062, -0.10747528076171875, -0.09522628784179688, -0.082977294921875, -0.07072830200195312, -0.05847930908203125, -0.046230316162109375, -0.0339813232421875, -0.021732330322265625, -0.00948333740234375, 0.002765655517578125, 0.0150146484375, 0.027263641357421875, 0.03951263427734375, 0.051761627197265625, 0.0640106201171875, 0.07625961303710938, 0.08850860595703125, 0.10075759887695312, 0.113006591796875, 0.12525558471679688, 0.13750457763671875, 0.14975357055664062, 0.1620025634765625, 0.17425155639648438, 0.18650054931640625, 0.19874954223632812, 0.21099853515625, 0.22324752807617188, 0.23549652099609375, 0.24774551391601562, 0.2599945068359375, 0.2722434997558594, 0.28449249267578125, 0.2967414855957031, 0.308990478515625, 0.3212394714355469, 0.33348846435546875, 0.3457374572753906, 0.3579864501953125, 0.3702354431152344, 0.38248443603515625, 0.3947334289550781, 0.406982421875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 2.0, 17.0, 15.0, 17.0, 25.0, 12.0, 32.0, 30.0, 28.0, 34.0, 37.0, 39.0, 24.0, 42.0, 37.0, 39.0, 35.0, 45.0, 50.0, 37.0, 49.0, 38.0, 37.0, 27.0, 23.0, 26.0, 30.0, 22.0, 25.0, 15.0, 14.0, 22.0, 17.0, 5.0, 9.0, 6.0, 4.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20458984375, -0.19836807250976562, -0.19214630126953125, -0.18592453002929688, -0.1797027587890625, -0.17348098754882812, -0.16725921630859375, -0.16103744506835938, -0.154815673828125, -0.14859390258789062, -0.14237213134765625, -0.13615036010742188, -0.1299285888671875, -0.12370681762695312, -0.11748504638671875, -0.11126327514648438, -0.10504150390625, -0.09881973266601562, -0.09259796142578125, -0.08637619018554688, -0.0801544189453125, -0.07393264770507812, -0.06771087646484375, -0.061489105224609375, -0.055267333984375, -0.049045562744140625, -0.04282379150390625, -0.036602020263671875, -0.0303802490234375, -0.024158477783203125, -0.01793670654296875, -0.011714935302734375, -0.0054931640625, 0.000728607177734375, 0.00695037841796875, 0.013172149658203125, 0.0193939208984375, 0.025615692138671875, 0.03183746337890625, 0.038059234619140625, 0.044281005859375, 0.050502777099609375, 0.05672454833984375, 0.06294631958007812, 0.0691680908203125, 0.07538986206054688, 0.08161163330078125, 0.08783340454101562, 0.09405517578125, 0.10027694702148438, 0.10649871826171875, 0.11272048950195312, 0.1189422607421875, 0.12516403198242188, 0.13138580322265625, 0.13760757446289062, 0.143829345703125, 0.15005111694335938, 0.15627288818359375, 0.16249465942382812, 0.1687164306640625, 0.17493820190429688, 0.18115997314453125, 0.18738174438476562, 0.193603515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 11.0, 17.0, 23.0, 31.0, 55.0, 86.0, 124.0, 182.0, 255.0, 399.0, 620.0, 946.0, 1495.0, 2294.0, 3725.0, 5830.0, 9652.0, 16596.0, 28929.0, 52298.0, 98119.0, 202300.0, 300450.0, 149071.0, 76058.0, 40976.0, 23014.0, 13598.0, 8025.0, 4774.0, 3017.0, 1984.0, 1232.0, 814.0, 510.0, 334.0, 259.0, 153.0, 104.0, 68.0, 35.0, 28.0, 22.0, 13.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.47119140625, -0.45660400390625, -0.4420166015625, -0.42742919921875, -0.412841796875, -0.39825439453125, -0.3836669921875, -0.36907958984375, -0.3544921875, -0.33990478515625, -0.3253173828125, -0.31072998046875, -0.296142578125, -0.28155517578125, -0.2669677734375, -0.25238037109375, -0.23779296875, -0.22320556640625, -0.2086181640625, -0.19403076171875, -0.179443359375, -0.16485595703125, -0.1502685546875, -0.13568115234375, -0.12109375, -0.10650634765625, -0.0919189453125, -0.07733154296875, -0.062744140625, -0.04815673828125, -0.0335693359375, -0.01898193359375, -0.00439453125, 0.01019287109375, 0.0247802734375, 0.03936767578125, 0.053955078125, 0.06854248046875, 0.0831298828125, 0.09771728515625, 0.1123046875, 0.12689208984375, 0.1414794921875, 0.15606689453125, 0.170654296875, 0.18524169921875, 0.1998291015625, 0.21441650390625, 0.22900390625, 0.24359130859375, 0.2581787109375, 0.27276611328125, 0.287353515625, 0.30194091796875, 0.3165283203125, 0.33111572265625, 0.345703125, 0.36029052734375, 0.3748779296875, 0.38946533203125, 0.404052734375, 0.41864013671875, 0.4332275390625, 0.44781494140625, 0.46240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 8.0, 12.0, 10.0, 11.0, 24.0, 23.0, 22.0, 21.0, 30.0, 26.0, 31.0, 37.0, 44.0, 40.0, 29.0, 51.0, 47.0, 43.0, 33.0, 45.0, 30.0, 31.0, 41.0, 33.0, 31.0, 36.0, 26.0, 26.0, 28.0, 15.0, 16.0, 12.0, 11.0, 12.0, 16.0, 10.0, 6.0, 8.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.141357421875, -0.13730430603027344, -0.13325119018554688, -0.1291980743408203, -0.12514495849609375, -0.12109184265136719, -0.11703872680664062, -0.11298561096191406, -0.1089324951171875, -0.10487937927246094, -0.10082626342773438, -0.09677314758300781, -0.09272003173828125, -0.08866691589355469, -0.08461380004882812, -0.08056068420410156, -0.076507568359375, -0.07245445251464844, -0.06840133666992188, -0.06434822082519531, -0.06029510498046875, -0.05624198913574219, -0.052188873291015625, -0.04813575744628906, -0.0440826416015625, -0.04002952575683594, -0.035976409912109375, -0.03192329406738281, -0.02787017822265625, -0.023817062377929688, -0.019763946533203125, -0.015710830688476562, -0.01165771484375, -0.0076045989990234375, -0.003551483154296875, 0.0005016326904296875, 0.00455474853515625, 0.008607864379882812, 0.012660980224609375, 0.016714096069335938, 0.0207672119140625, 0.024820327758789062, 0.028873443603515625, 0.03292655944824219, 0.03697967529296875, 0.04103279113769531, 0.045085906982421875, 0.04913902282714844, 0.053192138671875, 0.05724525451660156, 0.061298370361328125, 0.06535148620605469, 0.06940460205078125, 0.07345771789550781, 0.07751083374023438, 0.08156394958496094, 0.0856170654296875, 0.08967018127441406, 0.09372329711914062, 0.09777641296386719, 0.10182952880859375, 0.10588264465332031, 0.10993576049804688, 0.11398887634277344, 0.1180419921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 10.0, 11.0, 19.0, 19.0, 30.0, 43.0, 50.0, 68.0, 84.0, 130.0, 125.0, 177.0, 229.0, 300.0, 399.0, 483.0, 591.0, 767.0, 1030.0, 1289.0, 1946.0, 3047.0, 5493.0, 13517.0, 89203.0, 883030.0, 25379.0, 8133.0, 3862.0, 2363.0, 1543.0, 1163.0, 911.0, 644.0, 556.0, 414.0, 342.0, 266.0, 216.0, 149.0, 124.0, 105.0, 71.0, 56.0, 46.0, 35.0, 15.0, 15.0, 16.0, 9.0, 9.0, 11.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.1900634765625, -0.18416786193847656, -0.17827224731445312, -0.1723766326904297, -0.16648101806640625, -0.1605854034423828, -0.15468978881835938, -0.14879417419433594, -0.1428985595703125, -0.13700294494628906, -0.13110733032226562, -0.1252117156982422, -0.11931610107421875, -0.11342048645019531, -0.10752487182617188, -0.10162925720214844, -0.095733642578125, -0.08983802795410156, -0.08394241333007812, -0.07804679870605469, -0.07215118408203125, -0.06625556945800781, -0.060359954833984375, -0.05446434020996094, -0.0485687255859375, -0.04267311096191406, -0.036777496337890625, -0.030881881713867188, -0.02498626708984375, -0.019090652465820312, -0.013195037841796875, -0.0072994232177734375, -0.00140380859375, 0.0044918060302734375, 0.010387420654296875, 0.016283035278320312, 0.02217864990234375, 0.028074264526367188, 0.033969879150390625, 0.03986549377441406, 0.0457611083984375, 0.05165672302246094, 0.057552337646484375, 0.06344795227050781, 0.06934356689453125, 0.07523918151855469, 0.08113479614257812, 0.08703041076660156, 0.092926025390625, 0.09882164001464844, 0.10471725463867188, 0.11061286926269531, 0.11650848388671875, 0.12240409851074219, 0.12829971313476562, 0.13419532775878906, 0.1400909423828125, 0.14598655700683594, 0.15188217163085938, 0.1577777862548828, 0.16367340087890625, 0.1695690155029297, 0.17546463012695312, 0.18136024475097656, 0.187255859375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 6.0, 9.0, 20.0, 22.0, 48.0, 106.0, 220.0, 263.0, 134.0, 38.0, 54.0, 27.0, 10.0, 12.0, 10.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.268732249736786e-06, -6.100162863731384e-06, -5.931593477725983e-06, -5.763024091720581e-06, -5.5944547057151794e-06, -5.425885319709778e-06, -5.257315933704376e-06, -5.088746547698975e-06, -4.920177161693573e-06, -4.751607775688171e-06, -4.58303838968277e-06, -4.414469003677368e-06, -4.2458996176719666e-06, -4.077330231666565e-06, -3.908760845661163e-06, -3.7401914596557617e-06, -3.57162207365036e-06, -3.4030526876449585e-06, -3.234483301639557e-06, -3.0659139156341553e-06, -2.8973445296287537e-06, -2.728775143623352e-06, -2.5602057576179504e-06, -2.391636371612549e-06, -2.2230669856071472e-06, -2.0544975996017456e-06, -1.885928213596344e-06, -1.7173588275909424e-06, -1.5487894415855408e-06, -1.3802200555801392e-06, -1.2116506695747375e-06, -1.043081283569336e-06, -8.745118975639343e-07, -7.059425115585327e-07, -5.373731255531311e-07, -3.688037395477295e-07, -2.0023435354232788e-07, -3.166496753692627e-08, 1.3690441846847534e-07, 3.0547380447387695e-07, 4.7404319047927856e-07, 6.426125764846802e-07, 8.111819624900818e-07, 9.797513484954834e-07, 1.148320734500885e-06, 1.3168901205062866e-06, 1.4854595065116882e-06, 1.6540288925170898e-06, 1.8225982785224915e-06, 1.991167664527893e-06, 2.1597370505332947e-06, 2.3283064365386963e-06, 2.496875822544098e-06, 2.6654452085494995e-06, 2.834014594554901e-06, 3.0025839805603027e-06, 3.1711533665657043e-06, 3.339722752571106e-06, 3.5082921385765076e-06, 3.676861524581909e-06, 3.845430910587311e-06, 4.014000296592712e-06, 4.182569682598114e-06, 4.351139068603516e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 3.0, 2.0, 4.0, 18.0, 11.0, 22.0, 34.0, 47.0, 70.0, 91.0, 140.0, 168.0, 271.0, 390.0, 496.0, 742.0, 1100.0, 1577.0, 2488.0, 4606.0, 11267.0, 58059.0, 913224.0, 34190.0, 8717.0, 3801.0, 2276.0, 1416.0, 996.0, 661.0, 488.0, 337.0, 246.0, 178.0, 116.0, 84.0, 58.0, 50.0, 27.0, 24.0, 15.0, 6.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.229248046875, -0.22276878356933594, -0.21628952026367188, -0.2098102569580078, -0.20333099365234375, -0.1968517303466797, -0.19037246704101562, -0.18389320373535156, -0.1774139404296875, -0.17093467712402344, -0.16445541381835938, -0.1579761505126953, -0.15149688720703125, -0.1450176239013672, -0.13853836059570312, -0.13205909729003906, -0.125579833984375, -0.11910057067871094, -0.11262130737304688, -0.10614204406738281, -0.09966278076171875, -0.09318351745605469, -0.08670425415039062, -0.08022499084472656, -0.0737457275390625, -0.06726646423339844, -0.060787200927734375, -0.05430793762207031, -0.04782867431640625, -0.04134941101074219, -0.034870147705078125, -0.028390884399414062, -0.02191162109375, -0.015432357788085938, -0.008953094482421875, -0.0024738311767578125, 0.00400543212890625, 0.010484695434570312, 0.016963958740234375, 0.023443222045898438, 0.0299224853515625, 0.03640174865722656, 0.042881011962890625, 0.04936027526855469, 0.05583953857421875, 0.06231880187988281, 0.06879806518554688, 0.07527732849121094, 0.081756591796875, 0.08823585510253906, 0.09471511840820312, 0.10119438171386719, 0.10767364501953125, 0.11415290832519531, 0.12063217163085938, 0.12711143493652344, 0.1335906982421875, 0.14006996154785156, 0.14654922485351562, 0.1530284881591797, 0.15950775146484375, 0.1659870147705078, 0.17246627807617188, 0.17894554138183594, 0.1854248046875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 11.0, 15.0, 33.0, 165.0, 568.0, 97.0, 29.0, 27.0, 13.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044830322265625, -0.043062686920166016, -0.04129505157470703, -0.03952741622924805, -0.03775978088378906, -0.03599214553833008, -0.034224510192871094, -0.03245687484741211, -0.030689239501953125, -0.02892160415649414, -0.027153968811035156, -0.025386333465576172, -0.023618698120117188, -0.021851062774658203, -0.02008342742919922, -0.018315792083740234, -0.01654815673828125, -0.014780521392822266, -0.013012886047363281, -0.011245250701904297, -0.009477615356445312, -0.007709980010986328, -0.005942344665527344, -0.004174709320068359, -0.002407073974609375, -0.0006394386291503906, 0.0011281967163085938, 0.002895832061767578, 0.0046634674072265625, 0.006431102752685547, 0.008198738098144531, 0.009966373443603516, 0.0117340087890625, 0.013501644134521484, 0.015269279479980469, 0.017036914825439453, 0.018804550170898438, 0.020572185516357422, 0.022339820861816406, 0.02410745620727539, 0.025875091552734375, 0.02764272689819336, 0.029410362243652344, 0.031177997589111328, 0.03294563293457031, 0.0347132682800293, 0.03648090362548828, 0.038248538970947266, 0.04001617431640625, 0.041783809661865234, 0.04355144500732422, 0.0453190803527832, 0.04708671569824219, 0.04885435104370117, 0.050621986389160156, 0.05238962173461914, 0.054157257080078125, 0.05592489242553711, 0.057692527770996094, 0.05946016311645508, 0.06122779846191406, 0.06299543380737305, 0.06476306915283203, 0.06653070449829102, 0.06829833984375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 9.0, 13.0, 16.0, 19.0, 26.0, 33.0, 46.0, 57.0, 96.0, 122.0, 137.0, 96.0, 90.0, 68.0, 39.0, 31.0, 27.0, 12.0, 15.0, 8.0, 12.0, 9.0, 8.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.47175055742263794, -0.4594736099243164, -0.44719669222831726, -0.4349197447299957, -0.4226428270339966, -0.41036587953567505, -0.3980889320373535, -0.38581201434135437, -0.3735350966453552, -0.3612581491470337, -0.34898123145103455, -0.336704283952713, -0.32442736625671387, -0.31215041875839233, -0.2998734712600708, -0.28759655356407166, -0.2753196060657501, -0.2630426585674286, -0.25076574087142944, -0.2384887933731079, -0.22621187567710876, -0.21393492817878723, -0.2016579955816269, -0.18938106298446655, -0.1771041303873062, -0.16482719779014587, -0.15255026519298553, -0.1402733325958252, -0.12799638509750366, -0.11571945995092392, -0.10344251990318298, -0.09116558730602264, -0.07888862490653992, -0.06661169230937958, -0.05433475598692894, -0.0420578196644783, -0.029780887067317963, -0.017503954470157623, -0.005227014422416687, 0.007049918174743652, 0.01932685077190399, 0.03160378336906433, 0.04388071969151497, 0.05615765601396561, 0.06843458861112595, 0.08071152120828629, 0.09298846125602722, 0.10526539385318756, 0.1175423264503479, 0.12981925904750824, 0.14209619164466858, 0.1543731391429901, 0.16665005683898926, 0.1789270043373108, 0.19120393693447113, 0.20348086953163147, 0.2157578021287918, 0.22803473472595215, 0.2403116673231125, 0.2525885999202728, 0.26486554741859436, 0.2771424651145935, 0.28941941261291504, 0.3016963601112366, 0.3139732778072357]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 13.0, 12.0, 9.0, 16.0, 11.0, 17.0, 22.0, 19.0, 24.0, 30.0, 19.0, 40.0, 23.0, 29.0, 39.0, 29.0, 34.0, 34.0, 43.0, 43.0, 37.0, 40.0, 29.0, 34.0, 38.0, 29.0, 24.0, 26.0, 35.0, 28.0, 18.0, 20.0, 18.0, 16.0, 16.0, 8.0, 9.0, 16.0, 7.0, 6.0, 8.0, 6.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.18892674148082733, -0.18307974934577942, -0.1772327721118927, -0.1713857799768448, -0.16553878784179688, -0.15969179570674896, -0.15384481847286224, -0.14799782633781433, -0.14215083420276642, -0.1363038420677185, -0.1304568648338318, -0.12460987269878387, -0.11876288056373596, -0.11291589587926865, -0.10706891119480133, -0.10122191905975342, -0.0953749343752861, -0.08952794969081879, -0.08368095755577087, -0.07783397287130356, -0.07198698073625565, -0.06613999605178833, -0.060293007642030716, -0.0544460192322731, -0.04859903082251549, -0.042752042412757874, -0.03690505400300026, -0.031058067455887794, -0.02521107904613018, -0.019364090636372566, -0.013517104089260101, -0.007670115679502487, -0.001823127269744873, 0.004023860674351454, 0.00987084861844778, 0.01571783609688282, 0.021564824506640434, 0.02741181291639805, 0.03325879946351051, 0.03910578787326813, 0.04495277628302574, 0.050799764692783356, 0.05664675310254097, 0.062493741512298584, 0.0683407261967659, 0.07418771833181381, 0.08003470301628113, 0.08588169515132904, 0.09172867983579636, 0.09757566452026367, 0.10342265665531158, 0.1092696413397789, 0.11511663347482681, 0.12096361815929413, 0.12681061029434204, 0.13265758752822876, 0.13850457966327667, 0.14435157179832458, 0.1501985490322113, 0.15604554116725922, 0.16189253330230713, 0.16773952543735504, 0.17358650267124176, 0.17943349480628967, 0.18528048694133759]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 9.0, 21.0, 14.0, 24.0, 42.0, 84.0, 112.0, 182.0, 341.0, 580.0, 895.0, 1502.0, 2774.0, 4832.0, 8701.0, 15818.0, 28548.0, 54795.0, 111608.0, 258886.0, 1063407.0, 1906032.0, 428425.0, 152746.0, 72556.0, 37045.0, 19593.0, 10696.0, 5990.0, 3329.0, 1860.0, 1112.0, 655.0, 400.0, 252.0, 153.0, 98.0, 57.0, 30.0, 31.0, 19.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.348876953125, -0.33769989013671875, -0.3265228271484375, -0.31534576416015625, -0.304168701171875, -0.29299163818359375, -0.2818145751953125, -0.27063751220703125, -0.25946044921875, -0.24828338623046875, -0.2371063232421875, -0.22592926025390625, -0.214752197265625, -0.20357513427734375, -0.1923980712890625, -0.18122100830078125, -0.1700439453125, -0.15886688232421875, -0.1476898193359375, -0.13651275634765625, -0.125335693359375, -0.11415863037109375, -0.1029815673828125, -0.09180450439453125, -0.08062744140625, -0.06945037841796875, -0.0582733154296875, -0.04709625244140625, -0.035919189453125, -0.02474212646484375, -0.0135650634765625, -0.00238800048828125, 0.0087890625, 0.01996612548828125, 0.0311431884765625, 0.04232025146484375, 0.053497314453125, 0.06467437744140625, 0.0758514404296875, 0.08702850341796875, 0.09820556640625, 0.10938262939453125, 0.1205596923828125, 0.13173675537109375, 0.142913818359375, 0.15409088134765625, 0.1652679443359375, 0.17644500732421875, 0.1876220703125, 0.19879913330078125, 0.2099761962890625, 0.22115325927734375, 0.232330322265625, 0.24350738525390625, 0.2546844482421875, 0.26586151123046875, 0.27703857421875, 0.28821563720703125, 0.2993927001953125, 0.31056976318359375, 0.321746826171875, 0.33292388916015625, 0.3441009521484375, 0.35527801513671875, 0.366455078125]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 9.0, 9.0, 10.0, 16.0, 17.0, 18.0, 28.0, 21.0, 28.0, 27.0, 27.0, 35.0, 29.0, 48.0, 41.0, 36.0, 37.0, 52.0, 52.0, 48.0, 30.0, 27.0, 40.0, 28.0, 39.0, 32.0, 30.0, 28.0, 24.0, 16.0, 15.0, 12.0, 9.0, 12.0, 6.0, 8.0, 9.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11969661712646484, -0.11579704284667969, -0.11189746856689453, -0.10799789428710938, -0.10409832000732422, -0.10019874572753906, -0.0962991714477539, -0.09239959716796875, -0.0885000228881836, -0.08460044860839844, -0.08070087432861328, -0.07680130004882812, -0.07290172576904297, -0.06900215148925781, -0.06510257720947266, -0.0612030029296875, -0.057303428649902344, -0.05340385437011719, -0.04950428009033203, -0.045604705810546875, -0.04170513153076172, -0.03780555725097656, -0.033905982971191406, -0.03000640869140625, -0.026106834411621094, -0.022207260131835938, -0.01830768585205078, -0.014408111572265625, -0.010508537292480469, -0.0066089630126953125, -0.0027093887329101562, 0.001190185546875, 0.005089759826660156, 0.008989334106445312, 0.012888908386230469, 0.016788482666015625, 0.02068805694580078, 0.024587631225585938, 0.028487205505371094, 0.03238677978515625, 0.036286354064941406, 0.04018592834472656, 0.04408550262451172, 0.047985076904296875, 0.05188465118408203, 0.05578422546386719, 0.059683799743652344, 0.0635833740234375, 0.06748294830322266, 0.07138252258300781, 0.07528209686279297, 0.07918167114257812, 0.08308124542236328, 0.08698081970214844, 0.0908803939819336, 0.09477996826171875, 0.0986795425415039, 0.10257911682128906, 0.10647869110107422, 0.11037826538085938, 0.11427783966064453, 0.11817741394042969, 0.12207698822021484, 0.1259765625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 8.0, 25.0, 38.0, 51.0, 70.0, 120.0, 189.0, 265.0, 428.0, 680.0, 1062.0, 1629.0, 2607.0, 4390.0, 6937.0, 11243.0, 18688.0, 30546.0, 51923.0, 89001.0, 161611.0, 324367.0, 775059.0, 1478991.0, 623213.0, 274372.0, 141483.0, 78714.0, 45372.0, 27523.0, 16643.0, 10335.0, 6258.0, 3871.0, 2515.0, 1489.0, 907.0, 607.0, 408.0, 229.0, 136.0, 100.0, 58.0, 44.0, 20.0, 13.0, 14.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0], "bins": [-0.230224609375, -0.22352981567382812, -0.21683502197265625, -0.21014022827148438, -0.2034454345703125, -0.19675064086914062, -0.19005584716796875, -0.18336105346679688, -0.176666259765625, -0.16997146606445312, -0.16327667236328125, -0.15658187866210938, -0.1498870849609375, -0.14319229125976562, -0.13649749755859375, -0.12980270385742188, -0.12310791015625, -0.11641311645507812, -0.10971832275390625, -0.10302352905273438, -0.0963287353515625, -0.08963394165039062, -0.08293914794921875, -0.07624435424804688, -0.069549560546875, -0.06285476684570312, -0.05615997314453125, -0.049465179443359375, -0.0427703857421875, -0.036075592041015625, -0.02938079833984375, -0.022686004638671875, -0.0159912109375, -0.009296417236328125, -0.00260162353515625, 0.004093170166015625, 0.0107879638671875, 0.017482757568359375, 0.02417755126953125, 0.030872344970703125, 0.037567138671875, 0.044261932373046875, 0.05095672607421875, 0.057651519775390625, 0.0643463134765625, 0.07104110717773438, 0.07773590087890625, 0.08443069458007812, 0.09112548828125, 0.09782028198242188, 0.10451507568359375, 0.11120986938476562, 0.1179046630859375, 0.12459945678710938, 0.13129425048828125, 0.13798904418945312, 0.144683837890625, 0.15137863159179688, 0.15807342529296875, 0.16476821899414062, 0.1714630126953125, 0.17815780639648438, 0.18485260009765625, 0.19154739379882812, 0.1982421875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 8.0, 13.0, 23.0, 23.0, 34.0, 42.0, 41.0, 53.0, 74.0, 90.0, 94.0, 110.0, 125.0, 159.0, 181.0, 244.0, 243.0, 309.0, 336.0, 313.0, 278.0, 218.0, 191.0, 170.0, 138.0, 83.0, 72.0, 85.0, 67.0, 66.0, 50.0, 41.0, 28.0, 20.0, 14.0, 11.0, 4.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0704345703125, -0.0681314468383789, -0.06582832336425781, -0.06352519989013672, -0.061222076416015625, -0.05891895294189453, -0.05661582946777344, -0.054312705993652344, -0.05200958251953125, -0.049706459045410156, -0.04740333557128906, -0.04510021209716797, -0.042797088623046875, -0.04049396514892578, -0.03819084167480469, -0.035887718200683594, -0.0335845947265625, -0.031281471252441406, -0.028978347778320312, -0.02667522430419922, -0.024372100830078125, -0.02206897735595703, -0.019765853881835938, -0.017462730407714844, -0.01515960693359375, -0.012856483459472656, -0.010553359985351562, -0.008250236511230469, -0.005947113037109375, -0.0036439895629882812, -0.0013408660888671875, 0.0009622573852539062, 0.003265380859375, 0.005568504333496094, 0.007871627807617188, 0.010174751281738281, 0.012477874755859375, 0.014780998229980469, 0.017084121704101562, 0.019387245178222656, 0.02169036865234375, 0.023993492126464844, 0.026296615600585938, 0.02859973907470703, 0.030902862548828125, 0.03320598602294922, 0.03550910949707031, 0.037812232971191406, 0.0401153564453125, 0.042418479919433594, 0.04472160339355469, 0.04702472686767578, 0.049327850341796875, 0.05163097381591797, 0.05393409729003906, 0.056237220764160156, 0.05854034423828125, 0.060843467712402344, 0.06314659118652344, 0.06544971466064453, 0.06775283813476562, 0.07005596160888672, 0.07235908508300781, 0.0746622085571289, 0.07696533203125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 15.0, 9.0, 17.0, 20.0, 27.0, 30.0, 37.0, 66.0, 82.0, 79.0, 130.0, 103.0, 78.0, 66.0, 55.0, 39.0, 23.0, 21.0, 18.0, 18.0, 11.0, 7.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19987991452217102, -0.19294939935207367, -0.18601888418197632, -0.17908836901187897, -0.17215785384178162, -0.16522735357284546, -0.1582968384027481, -0.15136632323265076, -0.1444358080625534, -0.13750529289245605, -0.1305747777223587, -0.12364427000284195, -0.1167137548327446, -0.10978323966264725, -0.1028527319431305, -0.09592221677303314, -0.08899170160293579, -0.08206118643283844, -0.07513067126274109, -0.06820016354322433, -0.061269648373126984, -0.05433913320302963, -0.04740862175822258, -0.04047811031341553, -0.033547595143318176, -0.026617081835865974, -0.019686568528413773, -0.01275605522096157, -0.005825541913509369, 0.0011049732565879822, 0.008035484701395035, 0.014965996146202087, 0.02189651131629944, 0.02882702462375164, 0.03575753793120384, 0.042688049376010895, 0.049618564546108246, 0.0565490797162056, 0.06347958743572235, 0.0704101026058197, 0.07734061777591705, 0.0842711329460144, 0.09120164811611176, 0.09813215583562851, 0.10506267100572586, 0.11199318617582321, 0.11892369389533997, 0.12585420906543732, 0.13278472423553467, 0.13971523940563202, 0.14664575457572937, 0.15357626974582672, 0.16050678491592407, 0.16743728518486023, 0.17436780035495758, 0.18129831552505493, 0.18822883069515228, 0.19515934586524963, 0.20208986103534698, 0.20902037620544434, 0.2159508764743805, 0.22288140654563904, 0.2298119068145752, 0.23674242198467255, 0.2436729371547699]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 8.0, 6.0, 9.0, 10.0, 8.0, 20.0, 11.0, 17.0, 26.0, 19.0, 28.0, 18.0, 26.0, 36.0, 38.0, 41.0, 38.0, 37.0, 34.0, 38.0, 37.0, 37.0, 37.0, 43.0, 33.0, 34.0, 31.0, 33.0, 30.0, 27.0, 31.0, 25.0, 17.0, 22.0, 14.0, 10.0, 17.0, 6.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 8.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.13533739745616913, -0.1312183290719986, -0.12709924578666687, -0.12298017740249634, -0.1188611090183258, -0.11474203318357468, -0.11062295734882355, -0.10650388896465302, -0.10238481312990189, -0.09826573729515076, -0.09414666891098022, -0.0900275930762291, -0.08590851724147797, -0.08178944885730743, -0.0776703730225563, -0.07355129718780518, -0.06943222880363464, -0.06531315296888351, -0.06119408458471298, -0.05707500874996185, -0.05295593664050102, -0.04883686453104019, -0.04471778869628906, -0.04059871658682823, -0.0364796444773674, -0.03236057236790657, -0.02824149839580059, -0.02412242442369461, -0.02000335231423378, -0.01588428020477295, -0.01176520623266697, -0.007646132260560989, -0.003527045249938965, 0.0005920277908444405, 0.004711100831627846, 0.008830173872411251, 0.012949246913194656, 0.017068319022655487, 0.021187392994761467, 0.025306466966867447, 0.029425539076328278, 0.03354461118578911, 0.03766368329524994, 0.04178275913000107, 0.0459018312394619, 0.05002090334892273, 0.05413997918367386, 0.05825905129313469, 0.06237812340259552, 0.06649719923734665, 0.07061626762151718, 0.07473534345626831, 0.07885441184043884, 0.08297348767518997, 0.0870925635099411, 0.09121163189411163, 0.09533070772886276, 0.09944978356361389, 0.10356885194778442, 0.10768792778253555, 0.11180700361728668, 0.11592607200145721, 0.12004514783620834, 0.12416422367095947, 0.12828329205513]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 7.0, 7.0, 14.0, 12.0, 20.0, 43.0, 71.0, 111.0, 177.0, 281.0, 367.0, 644.0, 1000.0, 1630.0, 2538.0, 4170.0, 6904.0, 11173.0, 19670.0, 35993.0, 70141.0, 160563.0, 390267.0, 177708.0, 75080.0, 38474.0, 20715.0, 11970.0, 7206.0, 4518.0, 2668.0, 1625.0, 1030.0, 632.0, 404.0, 274.0, 152.0, 96.0, 63.0, 49.0, 24.0, 22.0, 18.0, 7.0, 6.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1339111328125, -0.1293792724609375, -0.124847412109375, -0.1203155517578125, -0.11578369140625, -0.1112518310546875, -0.106719970703125, -0.1021881103515625, -0.09765625, -0.0931243896484375, -0.088592529296875, -0.0840606689453125, -0.07952880859375, -0.0749969482421875, -0.070465087890625, -0.0659332275390625, -0.0614013671875, -0.0568695068359375, -0.052337646484375, -0.0478057861328125, -0.04327392578125, -0.0387420654296875, -0.034210205078125, -0.0296783447265625, -0.025146484375, -0.0206146240234375, -0.016082763671875, -0.0115509033203125, -0.00701904296875, -0.0024871826171875, 0.002044677734375, 0.0065765380859375, 0.0111083984375, 0.0156402587890625, 0.020172119140625, 0.0247039794921875, 0.02923583984375, 0.0337677001953125, 0.038299560546875, 0.0428314208984375, 0.04736328125, 0.0518951416015625, 0.056427001953125, 0.0609588623046875, 0.06549072265625, 0.0700225830078125, 0.074554443359375, 0.0790863037109375, 0.0836181640625, 0.0881500244140625, 0.092681884765625, 0.0972137451171875, 0.10174560546875, 0.1062774658203125, 0.110809326171875, 0.1153411865234375, 0.119873046875, 0.1244049072265625, 0.128936767578125, 0.1334686279296875, 0.13800048828125, 0.1425323486328125, 0.147064208984375, 0.1515960693359375, 0.1561279296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 3.0, 4.0, 4.0, 16.0, 5.0, 12.0, 17.0, 16.0, 16.0, 25.0, 21.0, 15.0, 22.0, 34.0, 29.0, 43.0, 42.0, 39.0, 37.0, 45.0, 48.0, 43.0, 32.0, 52.0, 48.0, 37.0, 32.0, 30.0, 32.0, 26.0, 28.0, 29.0, 22.0, 19.0, 12.0, 12.0, 11.0, 11.0, 7.0, 8.0, 6.0, 1.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.15966796875, -0.1551361083984375, -0.150604248046875, -0.1460723876953125, -0.14154052734375, -0.1370086669921875, -0.132476806640625, -0.1279449462890625, -0.1234130859375, -0.1188812255859375, -0.114349365234375, -0.1098175048828125, -0.10528564453125, -0.1007537841796875, -0.096221923828125, -0.0916900634765625, -0.087158203125, -0.0826263427734375, -0.078094482421875, -0.0735626220703125, -0.06903076171875, -0.0644989013671875, -0.059967041015625, -0.0554351806640625, -0.0509033203125, -0.0463714599609375, -0.041839599609375, -0.0373077392578125, -0.03277587890625, -0.0282440185546875, -0.023712158203125, -0.0191802978515625, -0.0146484375, -0.0101165771484375, -0.005584716796875, -0.0010528564453125, 0.00347900390625, 0.0080108642578125, 0.012542724609375, 0.0170745849609375, 0.0216064453125, 0.0261383056640625, 0.030670166015625, 0.0352020263671875, 0.03973388671875, 0.0442657470703125, 0.048797607421875, 0.0533294677734375, 0.057861328125, 0.0623931884765625, 0.066925048828125, 0.0714569091796875, 0.07598876953125, 0.0805206298828125, 0.085052490234375, 0.0895843505859375, 0.0941162109375, 0.0986480712890625, 0.103179931640625, 0.1077117919921875, 0.11224365234375, 0.1167755126953125, 0.121307373046875, 0.1258392333984375, 0.13037109375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 1.0, 9.0, 8.0, 8.0, 21.0, 28.0, 37.0, 39.0, 41.0, 96.0, 122.0, 142.0, 204.0, 342.0, 439.0, 603.0, 816.0, 1272.0, 1990.0, 3100.0, 5097.0, 9106.0, 17931.0, 45952.0, 306173.0, 550969.0, 57468.0, 20677.0, 10226.0, 5548.0, 3387.0, 2113.0, 1370.0, 933.0, 653.0, 446.0, 341.0, 240.0, 172.0, 104.0, 91.0, 65.0, 55.0, 43.0, 26.0, 16.0, 10.0, 3.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2364501953125, -0.2290821075439453, -0.22171401977539062, -0.21434593200683594, -0.20697784423828125, -0.19960975646972656, -0.19224166870117188, -0.1848735809326172, -0.1775054931640625, -0.1701374053955078, -0.16276931762695312, -0.15540122985839844, -0.14803314208984375, -0.14066505432128906, -0.13329696655273438, -0.1259288787841797, -0.118560791015625, -0.11119270324707031, -0.10382461547851562, -0.09645652770996094, -0.08908843994140625, -0.08172035217285156, -0.07435226440429688, -0.06698417663574219, -0.0596160888671875, -0.05224800109863281, -0.044879913330078125, -0.03751182556152344, -0.03014373779296875, -0.022775650024414062, -0.015407562255859375, -0.008039474487304688, -0.00067138671875, 0.0066967010498046875, 0.014064788818359375, 0.021432876586914062, 0.02880096435546875, 0.03616905212402344, 0.043537139892578125, 0.05090522766113281, 0.0582733154296875, 0.06564140319824219, 0.07300949096679688, 0.08037757873535156, 0.08774566650390625, 0.09511375427246094, 0.10248184204101562, 0.10984992980957031, 0.117218017578125, 0.12458610534667969, 0.13195419311523438, 0.13932228088378906, 0.14669036865234375, 0.15405845642089844, 0.16142654418945312, 0.1687946319580078, 0.1761627197265625, 0.1835308074951172, 0.19089889526367188, 0.19826698303222656, 0.20563507080078125, 0.21300315856933594, 0.22037124633789062, 0.2277393341064453, 0.235107421875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 11.0, 10.0, 7.0, 10.0, 12.0, 13.0, 14.0, 11.0, 30.0, 20.0, 28.0, 29.0, 25.0, 31.0, 44.0, 35.0, 39.0, 37.0, 39.0, 37.0, 33.0, 42.0, 43.0, 32.0, 45.0, 46.0, 35.0, 32.0, 27.0, 15.0, 22.0, 12.0, 19.0, 12.0, 16.0, 16.0, 3.0, 10.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.08245849609375, -0.07993698120117188, -0.07741546630859375, -0.07489395141601562, -0.0723724365234375, -0.06985092163085938, -0.06732940673828125, -0.06480789184570312, -0.062286376953125, -0.059764862060546875, -0.05724334716796875, -0.054721832275390625, -0.0522003173828125, -0.049678802490234375, -0.04715728759765625, -0.044635772705078125, -0.0421142578125, -0.039592742919921875, -0.03707122802734375, -0.034549713134765625, -0.0320281982421875, -0.029506683349609375, -0.02698516845703125, -0.024463653564453125, -0.021942138671875, -0.019420623779296875, -0.01689910888671875, -0.014377593994140625, -0.0118560791015625, -0.009334564208984375, -0.00681304931640625, -0.004291534423828125, -0.00177001953125, 0.000751495361328125, 0.00327301025390625, 0.005794525146484375, 0.0083160400390625, 0.010837554931640625, 0.01335906982421875, 0.015880584716796875, 0.018402099609375, 0.020923614501953125, 0.02344512939453125, 0.025966644287109375, 0.0284881591796875, 0.031009674072265625, 0.03353118896484375, 0.036052703857421875, 0.03857421875, 0.041095733642578125, 0.04361724853515625, 0.046138763427734375, 0.0486602783203125, 0.051181793212890625, 0.05370330810546875, 0.056224822998046875, 0.058746337890625, 0.061267852783203125, 0.06378936767578125, 0.06631088256835938, 0.0688323974609375, 0.07135391235351562, 0.07387542724609375, 0.07639694213867188, 0.07891845703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 12.0, 5.0, 15.0, 11.0, 18.0, 35.0, 30.0, 40.0, 56.0, 56.0, 81.0, 128.0, 152.0, 172.0, 294.0, 406.0, 584.0, 944.0, 1399.0, 2244.0, 3863.0, 7151.0, 15765.0, 46931.0, 411690.0, 473630.0, 48510.0, 16250.0, 7270.0, 3975.0, 2284.0, 1492.0, 900.0, 664.0, 388.0, 284.0, 219.0, 161.0, 98.0, 76.0, 71.0, 58.0, 33.0, 25.0, 20.0, 15.0, 15.0, 10.0, 4.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.0184783935546875, -0.017882585525512695, -0.01728677749633789, -0.016690969467163086, -0.01609516143798828, -0.015499353408813477, -0.014903545379638672, -0.014307737350463867, -0.013711929321289062, -0.013116121292114258, -0.012520313262939453, -0.011924505233764648, -0.011328697204589844, -0.010732889175415039, -0.010137081146240234, -0.00954127311706543, -0.008945465087890625, -0.00834965705871582, -0.007753849029541016, -0.007158041000366211, -0.006562232971191406, -0.0059664249420166016, -0.005370616912841797, -0.004774808883666992, -0.0041790008544921875, -0.003583192825317383, -0.002987384796142578, -0.0023915767669677734, -0.0017957687377929688, -0.001199960708618164, -0.0006041526794433594, -8.344650268554688e-06, 0.00058746337890625, 0.0011832714080810547, 0.0017790794372558594, 0.002374887466430664, 0.0029706954956054688, 0.0035665035247802734, 0.004162311553955078, 0.004758119583129883, 0.0053539276123046875, 0.005949735641479492, 0.006545543670654297, 0.0071413516998291016, 0.007737159729003906, 0.008332967758178711, 0.008928775787353516, 0.00952458381652832, 0.010120391845703125, 0.01071619987487793, 0.011312007904052734, 0.011907815933227539, 0.012503623962402344, 0.013099431991577148, 0.013695240020751953, 0.014291048049926758, 0.014886856079101562, 0.015482664108276367, 0.016078472137451172, 0.016674280166625977, 0.01727008819580078, 0.017865896224975586, 0.01846170425415039, 0.019057512283325195, 0.0196533203125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 5.0, 7.0, 9.0, 15.0, 18.0, 12.0, 12.0, 13.0, 35.0, 86.0, 55.0, 53.0, 64.0, 65.0, 73.0, 138.0, 56.0, 47.0, 44.0, 38.0, 49.0, 19.0, 13.0, 13.0, 7.0, 9.0, 6.0, 6.0, 6.0, 1.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.8971040844917297e-06, -1.8272548913955688e-06, -1.757405698299408e-06, -1.687556505203247e-06, -1.6177073121070862e-06, -1.5478581190109253e-06, -1.4780089259147644e-06, -1.4081597328186035e-06, -1.3383105397224426e-06, -1.2684613466262817e-06, -1.1986121535301208e-06, -1.12876296043396e-06, -1.058913767337799e-06, -9.890645742416382e-07, -9.192153811454773e-07, -8.493661880493164e-07, -7.795169949531555e-07, -7.096678018569946e-07, -6.398186087608337e-07, -5.699694156646729e-07, -5.00120222568512e-07, -4.302710294723511e-07, -3.604218363761902e-07, -2.905726432800293e-07, -2.207234501838684e-07, -1.5087425708770752e-07, -8.102506399154663e-08, -1.1175870895385742e-08, 5.8673322200775146e-08, 1.2852251529693604e-07, 1.9837170839309692e-07, 2.682209014892578e-07, 3.380700945854187e-07, 4.079192876815796e-07, 4.777684807777405e-07, 5.476176738739014e-07, 6.174668669700623e-07, 6.873160600662231e-07, 7.57165253162384e-07, 8.270144462585449e-07, 8.968636393547058e-07, 9.667128324508667e-07, 1.0365620255470276e-06, 1.1064112186431885e-06, 1.1762604117393494e-06, 1.2461096048355103e-06, 1.3159587979316711e-06, 1.385807991027832e-06, 1.455657184123993e-06, 1.5255063772201538e-06, 1.5953555703163147e-06, 1.6652047634124756e-06, 1.7350539565086365e-06, 1.8049031496047974e-06, 1.8747523427009583e-06, 1.944601535797119e-06, 2.01445072889328e-06, 2.084299921989441e-06, 2.154149115085602e-06, 2.2239983081817627e-06, 2.2938475012779236e-06, 2.3636966943740845e-06, 2.4335458874702454e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 11.0, 16.0, 26.0, 35.0, 50.0, 80.0, 117.0, 169.0, 246.0, 366.0, 541.0, 861.0, 1430.0, 2436.0, 4170.0, 7692.0, 15507.0, 35306.0, 105479.0, 537098.0, 229614.0, 59384.0, 22996.0, 11024.0, 5690.0, 3181.0, 1852.0, 1100.0, 710.0, 456.0, 299.0, 202.0, 110.0, 84.0, 51.0, 42.0, 31.0, 23.0, 17.0, 16.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019073486328125, -0.018453359603881836, -0.017833232879638672, -0.017213106155395508, -0.016592979431152344, -0.01597285270690918, -0.015352725982666016, -0.014732599258422852, -0.014112472534179688, -0.013492345809936523, -0.01287221908569336, -0.012252092361450195, -0.011631965637207031, -0.011011838912963867, -0.010391712188720703, -0.009771585464477539, -0.009151458740234375, -0.008531332015991211, -0.007911205291748047, -0.007291078567504883, -0.006670951843261719, -0.006050825119018555, -0.005430698394775391, -0.0048105716705322266, -0.0041904449462890625, -0.0035703182220458984, -0.0029501914978027344, -0.0023300647735595703, -0.0017099380493164062, -0.0010898113250732422, -0.0004696846008300781, 0.00015044212341308594, 0.00077056884765625, 0.001390695571899414, 0.002010822296142578, 0.002630949020385742, 0.0032510757446289062, 0.0038712024688720703, 0.004491329193115234, 0.0051114559173583984, 0.0057315826416015625, 0.0063517093658447266, 0.006971836090087891, 0.007591962814331055, 0.008212089538574219, 0.008832216262817383, 0.009452342987060547, 0.010072469711303711, 0.010692596435546875, 0.011312723159790039, 0.011932849884033203, 0.012552976608276367, 0.013173103332519531, 0.013793230056762695, 0.01441335678100586, 0.015033483505249023, 0.015653610229492188, 0.01627373695373535, 0.016893863677978516, 0.01751399040222168, 0.018134117126464844, 0.018754243850708008, 0.019374370574951172, 0.019994497299194336, 0.0206146240234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 10.0, 7.0, 10.0, 12.0, 16.0, 37.0, 36.0, 93.0, 150.0, 211.0, 152.0, 87.0, 40.0, 27.0, 21.0, 17.0, 15.0, 5.0, 7.0, 6.0, 5.0, 4.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0110931396484375, -0.010818719863891602, -0.010544300079345703, -0.010269880294799805, -0.009995460510253906, -0.009721040725708008, -0.00944662094116211, -0.009172201156616211, -0.008897781372070312, -0.008623361587524414, -0.008348941802978516, -0.008074522018432617, -0.007800102233886719, -0.00752568244934082, -0.007251262664794922, -0.0069768428802490234, -0.006702423095703125, -0.0064280033111572266, -0.006153583526611328, -0.00587916374206543, -0.005604743957519531, -0.005330324172973633, -0.005055904388427734, -0.004781484603881836, -0.0045070648193359375, -0.004232645034790039, -0.003958225250244141, -0.003683805465698242, -0.0034093856811523438, -0.0031349658966064453, -0.002860546112060547, -0.0025861263275146484, -0.00231170654296875, -0.0020372867584228516, -0.0017628669738769531, -0.0014884471893310547, -0.0012140274047851562, -0.0009396076202392578, -0.0006651878356933594, -0.00039076805114746094, -0.0001163482666015625, 0.00015807151794433594, 0.0004324913024902344, 0.0007069110870361328, 0.0009813308715820312, 0.0012557506561279297, 0.0015301704406738281, 0.0018045902252197266, 0.002079010009765625, 0.0023534297943115234, 0.002627849578857422, 0.0029022693634033203, 0.0031766891479492188, 0.003451108932495117, 0.0037255287170410156, 0.003999948501586914, 0.0042743682861328125, 0.004548788070678711, 0.004823207855224609, 0.005097627639770508, 0.005372047424316406, 0.005646467208862305, 0.005920886993408203, 0.0061953067779541016, 0.0064697265625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 9.0, 11.0, 12.0, 23.0, 17.0, 32.0, 42.0, 50.0, 67.0, 85.0, 112.0, 121.0, 92.0, 79.0, 54.0, 48.0, 29.0, 25.0, 14.0, 18.0, 8.0, 7.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20207804441452026, -0.19492216408252716, -0.18776626884937286, -0.18061038851737976, -0.17345449328422546, -0.16629861295223236, -0.15914273262023926, -0.15198683738708496, -0.14483095705509186, -0.13767507672309875, -0.13051918148994446, -0.12336330115795135, -0.11620741337537766, -0.10905152559280396, -0.10189563781023026, -0.09473975002765656, -0.08758386224508286, -0.08042797446250916, -0.07327208667993546, -0.06611619889736176, -0.05896031856536865, -0.05180443078279495, -0.04464854300022125, -0.03749265894293785, -0.03033677116036415, -0.0231808852404356, -0.01602499932050705, -0.00886911153793335, -0.0017132256180047989, 0.005442660301923752, 0.012598548084497452, 0.019754432141780853, 0.026910319924354553, 0.03406620770692825, 0.041222091764211655, 0.048377979546785355, 0.055533863604068756, 0.06268975138664246, 0.06984563916921616, 0.07700152695178986, 0.08415740728378296, 0.09131329506635666, 0.09846918284893036, 0.10562506318092346, 0.11278095096349716, 0.11993683874607086, 0.12709271907806396, 0.13424861431121826, 0.14140450954437256, 0.14856038987636566, 0.15571628510951996, 0.16287216544151306, 0.17002806067466736, 0.17718394100666046, 0.18433982133865356, 0.19149571657180786, 0.19865159690380096, 0.20580747723579407, 0.21296337246894836, 0.22011925280094147, 0.22727514803409576, 0.23443102836608887, 0.24158692359924316, 0.24874280393123627, 0.25589868426322937]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 8.0, 5.0, 10.0, 13.0, 19.0, 14.0, 23.0, 21.0, 27.0, 22.0, 27.0, 31.0, 42.0, 37.0, 39.0, 38.0, 35.0, 38.0, 35.0, 33.0, 40.0, 45.0, 31.0, 36.0, 33.0, 34.0, 33.0, 22.0, 31.0, 27.0, 22.0, 20.0, 14.0, 10.0, 20.0, 5.0, 7.0, 9.0, 8.0, 3.0, 0.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1353679746389389, -0.13127759099006653, -0.12718720734119415, -0.12309681624174118, -0.1190064325928688, -0.11491604894399643, -0.11082565784454346, -0.10673527419567108, -0.1026448905467987, -0.09855450689792633, -0.09446412324905396, -0.09037373214960098, -0.08628334850072861, -0.08219296485185623, -0.07810257375240326, -0.07401219010353088, -0.06992180645465851, -0.06583142280578613, -0.06174103543162346, -0.057650648057460785, -0.05356026440858841, -0.049469880759716034, -0.04537949338555336, -0.041289106011390686, -0.03719872236251831, -0.033108338713645935, -0.02901795133948326, -0.024927565827965736, -0.02083718031644821, -0.016746794804930687, -0.012656409293413162, -0.008566023781895638, -0.004475638270378113, -0.0003852527588605881, 0.0037051327526569366, 0.007795518264174461, 0.011885903775691986, 0.01597628928720951, 0.020066674798727036, 0.02415706031024456, 0.028247445821762085, 0.03233782947063446, 0.036428216844797134, 0.04051860421895981, 0.044608987867832184, 0.04869937151670456, 0.05278975889086723, 0.05688014626502991, 0.06097052991390228, 0.06506091356277466, 0.06915129721164703, 0.0732416883111, 0.07733207195997238, 0.08142245560884476, 0.08551284670829773, 0.0896032303571701, 0.09369361400604248, 0.09778399765491486, 0.10187438130378723, 0.1059647724032402, 0.11005515605211258, 0.11414553970098495, 0.11823593080043793, 0.1223263144493103, 0.12641669809818268]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 14.0, 17.0, 28.0, 42.0, 78.0, 119.0, 169.0, 262.0, 384.0, 666.0, 1033.0, 1735.0, 2754.0, 4624.0, 7969.0, 13626.0, 24331.0, 44029.0, 82154.0, 164024.0, 295303.0, 193152.0, 95509.0, 50754.0, 27756.0, 15490.0, 9053.0, 5412.0, 3048.0, 1943.0, 1188.0, 760.0, 427.0, 274.0, 165.0, 100.0, 67.0, 32.0, 21.0, 14.0, 10.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.33154296875, -0.3219642639160156, -0.31238555908203125, -0.3028068542480469, -0.2932281494140625, -0.2836494445800781, -0.27407073974609375, -0.2644920349121094, -0.254913330078125, -0.24533462524414062, -0.23575592041015625, -0.22617721557617188, -0.2165985107421875, -0.20701980590820312, -0.19744110107421875, -0.18786239624023438, -0.17828369140625, -0.16870498657226562, -0.15912628173828125, -0.14954757690429688, -0.1399688720703125, -0.13039016723632812, -0.12081146240234375, -0.11123275756835938, -0.101654052734375, -0.09207534790039062, -0.08249664306640625, -0.07291793823242188, -0.0633392333984375, -0.053760528564453125, -0.04418182373046875, -0.034603118896484375, -0.0250244140625, -0.015445709228515625, -0.00586700439453125, 0.003711700439453125, 0.0132904052734375, 0.022869110107421875, 0.03244781494140625, 0.042026519775390625, 0.051605224609375, 0.061183929443359375, 0.07076263427734375, 0.08034133911132812, 0.0899200439453125, 0.09949874877929688, 0.10907745361328125, 0.11865615844726562, 0.12823486328125, 0.13781356811523438, 0.14739227294921875, 0.15697097778320312, 0.1665496826171875, 0.17612838745117188, 0.18570709228515625, 0.19528579711914062, 0.204864501953125, 0.21444320678710938, 0.22402191162109375, 0.23360061645507812, 0.2431793212890625, 0.2527580261230469, 0.26233673095703125, 0.2719154357910156, 0.281494140625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 11.0, 4.0, 7.0, 6.0, 15.0, 14.0, 11.0, 16.0, 18.0, 22.0, 20.0, 35.0, 31.0, 36.0, 25.0, 32.0, 43.0, 27.0, 40.0, 39.0, 31.0, 32.0, 27.0, 39.0, 42.0, 36.0, 32.0, 34.0, 26.0, 36.0, 23.0, 24.0, 24.0, 21.0, 13.0, 19.0, 11.0, 10.0, 12.0, 8.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.109375, -0.10590553283691406, -0.10243606567382812, -0.09896659851074219, -0.09549713134765625, -0.09202766418457031, -0.08855819702148438, -0.08508872985839844, -0.0816192626953125, -0.07814979553222656, -0.07468032836914062, -0.07121086120605469, -0.06774139404296875, -0.06427192687988281, -0.060802459716796875, -0.05733299255371094, -0.053863525390625, -0.05039405822753906, -0.046924591064453125, -0.04345512390136719, -0.03998565673828125, -0.03651618957519531, -0.033046722412109375, -0.029577255249023438, -0.0261077880859375, -0.022638320922851562, -0.019168853759765625, -0.015699386596679688, -0.01222991943359375, -0.008760452270507812, -0.005290985107421875, -0.0018215179443359375, 0.00164794921875, 0.0051174163818359375, 0.008586883544921875, 0.012056350708007812, 0.01552581787109375, 0.018995285034179688, 0.022464752197265625, 0.025934219360351562, 0.0294036865234375, 0.03287315368652344, 0.036342620849609375, 0.03981208801269531, 0.04328155517578125, 0.04675102233886719, 0.050220489501953125, 0.05368995666503906, 0.057159423828125, 0.06062889099121094, 0.06409835815429688, 0.06756782531738281, 0.07103729248046875, 0.07450675964355469, 0.07797622680664062, 0.08144569396972656, 0.0849151611328125, 0.08838462829589844, 0.09185409545898438, 0.09532356262207031, 0.09879302978515625, 0.10226249694824219, 0.10573196411132812, 0.10920143127441406, 0.1126708984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 11.0, 16.0, 21.0, 26.0, 38.0, 45.0, 67.0, 88.0, 148.0, 219.0, 318.0, 492.0, 699.0, 1039.0, 1608.0, 2307.0, 3678.0, 5750.0, 9067.0, 14004.0, 22630.0, 37533.0, 63445.0, 112059.0, 214750.0, 243755.0, 130290.0, 72185.0, 42594.0, 25646.0, 15637.0, 9915.0, 6345.0, 4085.0, 2635.0, 1809.0, 1173.0, 800.0, 567.0, 340.0, 231.0, 156.0, 98.0, 71.0, 37.0, 42.0, 22.0, 23.0, 12.0, 9.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.26123046875, -0.2530975341796875, -0.244964599609375, -0.2368316650390625, -0.22869873046875, -0.2205657958984375, -0.212432861328125, -0.2042999267578125, -0.1961669921875, -0.1880340576171875, -0.179901123046875, -0.1717681884765625, -0.16363525390625, -0.1555023193359375, -0.147369384765625, -0.1392364501953125, -0.131103515625, -0.1229705810546875, -0.114837646484375, -0.1067047119140625, -0.09857177734375, -0.0904388427734375, -0.082305908203125, -0.0741729736328125, -0.0660400390625, -0.0579071044921875, -0.049774169921875, -0.0416412353515625, -0.03350830078125, -0.0253753662109375, -0.017242431640625, -0.0091094970703125, -0.0009765625, 0.0071563720703125, 0.015289306640625, 0.0234222412109375, 0.03155517578125, 0.0396881103515625, 0.047821044921875, 0.0559539794921875, 0.0640869140625, 0.0722198486328125, 0.080352783203125, 0.0884857177734375, 0.09661865234375, 0.1047515869140625, 0.112884521484375, 0.1210174560546875, 0.129150390625, 0.1372833251953125, 0.145416259765625, 0.1535491943359375, 0.16168212890625, 0.1698150634765625, 0.177947998046875, 0.1860809326171875, 0.1942138671875, 0.2023468017578125, 0.210479736328125, 0.2186126708984375, 0.22674560546875, 0.2348785400390625, 0.243011474609375, 0.2511444091796875, 0.25927734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 5.0, 9.0, 9.0, 14.0, 18.0, 11.0, 13.0, 20.0, 19.0, 20.0, 21.0, 32.0, 38.0, 31.0, 46.0, 44.0, 36.0, 21.0, 33.0, 35.0, 37.0, 29.0, 36.0, 51.0, 30.0, 38.0, 31.0, 21.0, 29.0, 23.0, 26.0, 17.0, 21.0, 23.0, 19.0, 17.0, 8.0, 8.0, 4.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0679931640625, -0.06567573547363281, -0.06335830688476562, -0.06104087829589844, -0.05872344970703125, -0.05640602111816406, -0.054088592529296875, -0.05177116394042969, -0.0494537353515625, -0.04713630676269531, -0.044818878173828125, -0.04250144958496094, -0.04018402099609375, -0.03786659240722656, -0.035549163818359375, -0.03323173522949219, -0.030914306640625, -0.028596878051757812, -0.026279449462890625, -0.023962020874023438, -0.02164459228515625, -0.019327163696289062, -0.017009735107421875, -0.014692306518554688, -0.0123748779296875, -0.010057449340820312, -0.007740020751953125, -0.0054225921630859375, -0.00310516357421875, -0.0007877349853515625, 0.001529693603515625, 0.0038471221923828125, 0.00616455078125, 0.008481979370117188, 0.010799407958984375, 0.013116836547851562, 0.01543426513671875, 0.017751693725585938, 0.020069122314453125, 0.022386550903320312, 0.0247039794921875, 0.027021408081054688, 0.029338836669921875, 0.03165626525878906, 0.03397369384765625, 0.03629112243652344, 0.038608551025390625, 0.04092597961425781, 0.043243408203125, 0.04556083679199219, 0.047878265380859375, 0.05019569396972656, 0.05251312255859375, 0.05483055114746094, 0.057147979736328125, 0.05946540832519531, 0.0617828369140625, 0.06410026550292969, 0.06641769409179688, 0.06873512268066406, 0.07105255126953125, 0.07336997985839844, 0.07568740844726562, 0.07800483703613281, 0.080322265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 11.0, 14.0, 19.0, 34.0, 41.0, 47.0, 83.0, 111.0, 152.0, 235.0, 322.0, 477.0, 711.0, 959.0, 1413.0, 1958.0, 2948.0, 4428.0, 6519.0, 10007.0, 16032.0, 28993.0, 66419.0, 613081.0, 182621.0, 47646.0, 23287.0, 13550.0, 8522.0, 5593.0, 3764.0, 2680.0, 1770.0, 1242.0, 847.0, 586.0, 425.0, 282.0, 217.0, 144.0, 111.0, 68.0, 53.0, 49.0, 24.0, 15.0, 11.0, 10.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.013031005859375, -0.01260828971862793, -0.01218557357788086, -0.011762857437133789, -0.011340141296386719, -0.010917425155639648, -0.010494709014892578, -0.010071992874145508, -0.009649276733398438, -0.009226560592651367, -0.008803844451904297, -0.008381128311157227, -0.007958412170410156, -0.007535696029663086, -0.007112979888916016, -0.006690263748168945, -0.006267547607421875, -0.005844831466674805, -0.005422115325927734, -0.004999399185180664, -0.004576683044433594, -0.0041539669036865234, -0.003731250762939453, -0.003308534622192383, -0.0028858184814453125, -0.002463102340698242, -0.002040386199951172, -0.0016176700592041016, -0.0011949539184570312, -0.0007722377777099609, -0.0003495216369628906, 7.319450378417969e-05, 0.00049591064453125, 0.0009186267852783203, 0.0013413429260253906, 0.001764059066772461, 0.0021867752075195312, 0.0026094913482666016, 0.003032207489013672, 0.003454923629760742, 0.0038776397705078125, 0.004300355911254883, 0.004723072052001953, 0.0051457881927490234, 0.005568504333496094, 0.005991220474243164, 0.006413936614990234, 0.006836652755737305, 0.007259368896484375, 0.007682085037231445, 0.008104801177978516, 0.008527517318725586, 0.008950233459472656, 0.009372949600219727, 0.009795665740966797, 0.010218381881713867, 0.010641098022460938, 0.011063814163208008, 0.011486530303955078, 0.011909246444702148, 0.012331962585449219, 0.012754678726196289, 0.01317739486694336, 0.01360011100769043, 0.0140228271484375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 13.0, 9.0, 11.0, 15.0, 15.0, 15.0, 82.0, 50.0, 54.0, 80.0, 102.0, 198.0, 75.0, 47.0, 41.0, 43.0, 22.0, 31.0, 15.0, 10.0, 8.0, 7.0, 3.0, 16.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.314336597919464e-06, -2.2444874048233032e-06, -2.1746382117271423e-06, -2.1047890186309814e-06, -2.0349398255348206e-06, -1.9650906324386597e-06, -1.8952414393424988e-06, -1.8253922462463379e-06, -1.755543053150177e-06, -1.6856938600540161e-06, -1.6158446669578552e-06, -1.5459954738616943e-06, -1.4761462807655334e-06, -1.4062970876693726e-06, -1.3364478945732117e-06, -1.2665987014770508e-06, -1.1967495083808899e-06, -1.126900315284729e-06, -1.0570511221885681e-06, -9.872019290924072e-07, -9.173527359962463e-07, -8.475035429000854e-07, -7.776543498039246e-07, -7.078051567077637e-07, -6.379559636116028e-07, -5.681067705154419e-07, -4.98257577419281e-07, -4.284083843231201e-07, -3.5855919122695923e-07, -2.8870999813079834e-07, -2.1886080503463745e-07, -1.4901161193847656e-07, -7.916241884231567e-08, -9.313225746154785e-09, 6.05359673500061e-08, 1.30385160446167e-07, 2.0023435354232788e-07, 2.7008354663848877e-07, 3.3993273973464966e-07, 4.0978193283081055e-07, 4.796311259269714e-07, 5.494803190231323e-07, 6.193295121192932e-07, 6.891787052154541e-07, 7.59027898311615e-07, 8.288770914077759e-07, 8.987262845039368e-07, 9.685754776000977e-07, 1.0384246706962585e-06, 1.1082738637924194e-06, 1.1781230568885803e-06, 1.2479722499847412e-06, 1.317821443080902e-06, 1.387670636177063e-06, 1.4575198292732239e-06, 1.5273690223693848e-06, 1.5972182154655457e-06, 1.6670674085617065e-06, 1.7369166016578674e-06, 1.8067657947540283e-06, 1.8766149878501892e-06, 1.94646418094635e-06, 2.016313374042511e-06, 2.086162567138672e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 6.0, 10.0, 6.0, 8.0, 15.0, 17.0, 36.0, 28.0, 64.0, 94.0, 112.0, 167.0, 171.0, 333.0, 485.0, 652.0, 992.0, 1462.0, 2236.0, 3562.0, 5931.0, 10158.0, 19535.0, 45413.0, 229873.0, 619254.0, 56497.0, 22348.0, 11312.0, 6450.0, 3929.0, 2418.0, 1610.0, 1013.0, 716.0, 455.0, 348.0, 236.0, 167.0, 108.0, 61.0, 66.0, 50.0, 45.0, 29.0, 23.0, 14.0, 13.0, 7.0, 11.0, 0.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01445770263671875, -0.013943076133728027, -0.013428449630737305, -0.012913823127746582, -0.01239919662475586, -0.011884570121765137, -0.011369943618774414, -0.010855317115783691, -0.010340690612792969, -0.009826064109802246, -0.009311437606811523, -0.0087968111038208, -0.008282184600830078, -0.0077675580978393555, -0.007252931594848633, -0.00673830509185791, -0.0062236785888671875, -0.005709052085876465, -0.005194425582885742, -0.0046797990798950195, -0.004165172576904297, -0.0036505460739135742, -0.0031359195709228516, -0.002621293067932129, -0.0021066665649414062, -0.0015920400619506836, -0.001077413558959961, -0.0005627870559692383, -4.8160552978515625e-05, 0.00046646595001220703, 0.0009810924530029297, 0.0014957189559936523, 0.002010345458984375, 0.0025249719619750977, 0.0030395984649658203, 0.003554224967956543, 0.004068851470947266, 0.004583477973937988, 0.005098104476928711, 0.005612730979919434, 0.006127357482910156, 0.006641983985900879, 0.0071566104888916016, 0.007671236991882324, 0.008185863494873047, 0.00870048999786377, 0.009215116500854492, 0.009729743003845215, 0.010244369506835938, 0.01075899600982666, 0.011273622512817383, 0.011788249015808105, 0.012302875518798828, 0.01281750202178955, 0.013332128524780273, 0.013846755027770996, 0.014361381530761719, 0.014876008033752441, 0.015390634536743164, 0.015905261039733887, 0.01641988754272461, 0.016934514045715332, 0.017449140548706055, 0.017963767051696777, 0.0184783935546875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 2.0, 7.0, 3.0, 6.0, 9.0, 13.0, 9.0, 11.0, 20.0, 11.0, 26.0, 29.0, 43.0, 84.0, 279.0, 116.0, 79.0, 47.0, 42.0, 24.0, 21.0, 14.0, 19.0, 10.0, 10.0, 9.0, 4.0, 6.0, 2.0, 1.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0038166046142578125, -0.003710329532623291, -0.0036040544509887695, -0.003497779369354248, -0.0033915042877197266, -0.003285229206085205, -0.0031789541244506836, -0.003072679042816162, -0.0029664039611816406, -0.002860128879547119, -0.0027538537979125977, -0.002647578716278076, -0.0025413036346435547, -0.002435028553009033, -0.0023287534713745117, -0.0022224783897399902, -0.0021162033081054688, -0.0020099282264709473, -0.0019036531448364258, -0.0017973780632019043, -0.0016911029815673828, -0.0015848278999328613, -0.0014785528182983398, -0.0013722777366638184, -0.0012660026550292969, -0.0011597275733947754, -0.001053452491760254, -0.0009471774101257324, -0.0008409023284912109, -0.0007346272468566895, -0.000628352165222168, -0.0005220770835876465, -0.000415802001953125, -0.0003095269203186035, -0.00020325183868408203, -9.697675704956055e-05, 9.298324584960938e-06, 0.00011557340621948242, 0.0002218484878540039, 0.0003281235694885254, 0.0004343986511230469, 0.0005406737327575684, 0.0006469488143920898, 0.0007532238960266113, 0.0008594989776611328, 0.0009657740592956543, 0.0010720491409301758, 0.0011783242225646973, 0.0012845993041992188, 0.0013908743858337402, 0.0014971494674682617, 0.0016034245491027832, 0.0017096996307373047, 0.0018159747123718262, 0.0019222497940063477, 0.002028524875640869, 0.0021347999572753906, 0.002241075038909912, 0.0023473501205444336, 0.002453625202178955, 0.0025599002838134766, 0.002666175365447998, 0.0027724504470825195, 0.002878725528717041, 0.0029850006103515625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 12.0, 9.0, 11.0, 16.0, 21.0, 33.0, 35.0, 72.0, 84.0, 103.0, 109.0, 122.0, 86.0, 61.0, 51.0, 37.0, 29.0, 24.0, 20.0, 13.0, 12.0, 6.0, 13.0, 9.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17265063524246216, -0.1657581925392151, -0.1588657647371292, -0.15197333693504333, -0.14508089423179626, -0.1381884515285492, -0.13129602372646332, -0.12440358847379684, -0.11751115322113037, -0.1106187179684639, -0.10372628271579742, -0.09683384746313095, -0.08994141221046448, -0.083048976957798, -0.07615654170513153, -0.06926410645246506, -0.062371671199798584, -0.05547923594713211, -0.04858680069446564, -0.041694365441799164, -0.03480193018913269, -0.027909494936466217, -0.021017059683799744, -0.01412462443113327, -0.007232189178466797, -0.0003397539258003235, 0.00655268132686615, 0.013445116579532623, 0.020337551832199097, 0.02722998708486557, 0.03412242233753204, 0.04101485759019852, 0.04790729284286499, 0.054799728095531464, 0.06169216334819794, 0.06858459860086441, 0.07547703385353088, 0.08236946910619736, 0.08926190435886383, 0.0961543396115303, 0.10304677486419678, 0.10993921011686325, 0.11683164536952972, 0.1237240806221962, 0.13061651587486267, 0.13750895857810974, 0.14440138638019562, 0.1512938141822815, 0.15818625688552856, 0.16507869958877563, 0.1719711273908615, 0.1788635551929474, 0.18575599789619446, 0.19264844059944153, 0.1995408684015274, 0.20643329620361328, 0.21332573890686035, 0.22021818161010742, 0.2271106094121933, 0.23400303721427917, 0.24089547991752625, 0.24778792262077332, 0.254680335521698, 0.26157277822494507, 0.26846522092819214]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 9.0, 5.0, 14.0, 13.0, 12.0, 17.0, 24.0, 26.0, 19.0, 22.0, 37.0, 25.0, 35.0, 45.0, 40.0, 35.0, 48.0, 42.0, 41.0, 36.0, 46.0, 40.0, 38.0, 36.0, 32.0, 26.0, 30.0, 28.0, 28.0, 32.0, 19.0, 14.0, 13.0, 11.0, 17.0, 11.0, 10.0, 9.0, 2.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.13561442494392395, -0.13153374195098877, -0.1274530589580536, -0.12337237596511841, -0.11929168552160263, -0.11521100252866745, -0.11113031953573227, -0.10704963654279709, -0.10296894609928131, -0.09888826310634613, -0.09480758011341095, -0.09072689712047577, -0.08664620667695999, -0.08256552368402481, -0.07848484069108963, -0.07440415769815445, -0.07032347470521927, -0.06624279171228409, -0.06216210499405861, -0.05808142200112343, -0.05400073528289795, -0.04992005228996277, -0.04583936929702759, -0.04175868630409241, -0.03767799958586693, -0.03359731659293175, -0.02951662987470627, -0.025435946881771088, -0.021355262026190758, -0.017274577170610428, -0.013193894177675247, -0.009113209322094917, -0.005032524466514587, -0.0009518400765955448, 0.0031288443133234978, 0.007209528237581253, 0.011290213093161583, 0.015370897948741913, 0.019451580941677094, 0.023532265797257423, 0.027612950652837753, 0.031693633645772934, 0.03577432036399841, 0.039855003356933594, 0.043935686349868774, 0.048016373068094254, 0.052097056061029434, 0.05617774277925491, 0.060258425772190094, 0.06433910876512527, 0.06841979175806046, 0.07250048220157623, 0.07658116519451141, 0.0806618481874466, 0.08474253118038177, 0.08882321417331696, 0.09290389716625214, 0.09698458015918732, 0.1010652631521225, 0.10514594614505768, 0.10922663658857346, 0.11330731958150864, 0.11738800257444382, 0.121468685567379, 0.12554937601089478]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 14.0, 18.0, 27.0, 38.0, 49.0, 79.0, 116.0, 169.0, 280.0, 483.0, 766.0, 1196.0, 1912.0, 3087.0, 4934.0, 8453.0, 14211.0, 24927.0, 44613.0, 83326.0, 167692.0, 457502.0, 1750466.0, 1079334.0, 275135.0, 122749.0, 63905.0, 35755.0, 20613.0, 12227.0, 7358.0, 4588.0, 3035.0, 1832.0, 1166.0, 716.0, 500.0, 352.0, 200.0, 147.0, 93.0, 62.0, 42.0, 37.0, 28.0, 17.0, 10.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1734619140625, -0.16743850708007812, -0.16141510009765625, -0.15539169311523438, -0.1493682861328125, -0.14334487915039062, -0.13732147216796875, -0.13129806518554688, -0.125274658203125, -0.11925125122070312, -0.11322784423828125, -0.10720443725585938, -0.1011810302734375, -0.09515762329101562, -0.08913421630859375, -0.08311080932617188, -0.07708740234375, -0.07106399536132812, -0.06504058837890625, -0.059017181396484375, -0.0529937744140625, -0.046970367431640625, -0.04094696044921875, -0.034923553466796875, -0.028900146484375, -0.022876739501953125, -0.01685333251953125, -0.010829925537109375, -0.0048065185546875, 0.001216888427734375, 0.00724029541015625, 0.013263702392578125, 0.019287109375, 0.025310516357421875, 0.03133392333984375, 0.037357330322265625, 0.0433807373046875, 0.049404144287109375, 0.05542755126953125, 0.061450958251953125, 0.067474365234375, 0.07349777221679688, 0.07952117919921875, 0.08554458618164062, 0.0915679931640625, 0.09759140014648438, 0.10361480712890625, 0.10963821411132812, 0.11566162109375, 0.12168502807617188, 0.12770843505859375, 0.13373184204101562, 0.1397552490234375, 0.14577865600585938, 0.15180206298828125, 0.15782546997070312, 0.163848876953125, 0.16987228393554688, 0.17589569091796875, 0.18191909790039062, 0.1879425048828125, 0.19396591186523438, 0.19998931884765625, 0.20601272583007812, 0.2120361328125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 3.0, 8.0, 11.0, 17.0, 21.0, 21.0, 20.0, 23.0, 22.0, 30.0, 31.0, 35.0, 39.0, 37.0, 32.0, 43.0, 38.0, 33.0, 36.0, 47.0, 39.0, 36.0, 29.0, 36.0, 35.0, 28.0, 35.0, 29.0, 23.0, 12.0, 24.0, 16.0, 10.0, 8.0, 13.0, 17.0, 12.0, 3.0, 6.0, 7.0, 3.0, 4.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.07501220703125, -0.07277679443359375, -0.0705413818359375, -0.06830596923828125, -0.066070556640625, -0.06383514404296875, -0.0615997314453125, -0.05936431884765625, -0.05712890625, -0.05489349365234375, -0.0526580810546875, -0.05042266845703125, -0.048187255859375, -0.04595184326171875, -0.0437164306640625, -0.04148101806640625, -0.03924560546875, -0.03701019287109375, -0.0347747802734375, -0.03253936767578125, -0.030303955078125, -0.02806854248046875, -0.0258331298828125, -0.02359771728515625, -0.0213623046875, -0.01912689208984375, -0.0168914794921875, -0.01465606689453125, -0.012420654296875, -0.01018524169921875, -0.0079498291015625, -0.00571441650390625, -0.00347900390625, -0.00124359130859375, 0.0009918212890625, 0.00322723388671875, 0.005462646484375, 0.00769805908203125, 0.0099334716796875, 0.01216888427734375, 0.014404296875, 0.01663970947265625, 0.0188751220703125, 0.02111053466796875, 0.023345947265625, 0.02558135986328125, 0.0278167724609375, 0.03005218505859375, 0.03228759765625, 0.03452301025390625, 0.0367584228515625, 0.03899383544921875, 0.041229248046875, 0.04346466064453125, 0.0457000732421875, 0.04793548583984375, 0.0501708984375, 0.05240631103515625, 0.0546417236328125, 0.05687713623046875, 0.059112548828125, 0.06134796142578125, 0.0635833740234375, 0.06581878662109375, 0.06805419921875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 2.0, 7.0, 9.0, 14.0, 18.0, 27.0, 41.0, 90.0, 144.0, 250.0, 495.0, 850.0, 1538.0, 2686.0, 4892.0, 8575.0, 15042.0, 27070.0, 51212.0, 102900.0, 217443.0, 523898.0, 1520316.0, 1021068.0, 366258.0, 162286.0, 78504.0, 39717.0, 21276.0, 12010.0, 6668.0, 3772.0, 2243.0, 1268.0, 741.0, 402.0, 236.0, 123.0, 68.0, 45.0, 35.0, 22.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.14039039611816406, -0.13551712036132812, -0.1306438446044922, -0.12577056884765625, -0.12089729309082031, -0.11602401733398438, -0.11115074157714844, -0.1062774658203125, -0.10140419006347656, -0.09653091430664062, -0.09165763854980469, -0.08678436279296875, -0.08191108703613281, -0.07703781127929688, -0.07216453552246094, -0.067291259765625, -0.06241798400878906, -0.057544708251953125, -0.05267143249511719, -0.04779815673828125, -0.04292488098144531, -0.038051605224609375, -0.03317832946777344, -0.0283050537109375, -0.023431777954101562, -0.018558502197265625, -0.013685226440429688, -0.00881195068359375, -0.0039386749267578125, 0.000934600830078125, 0.0058078765869140625, 0.01068115234375, 0.015554428100585938, 0.020427703857421875, 0.025300979614257812, 0.03017425537109375, 0.03504753112792969, 0.039920806884765625, 0.04479408264160156, 0.0496673583984375, 0.05454063415527344, 0.059413909912109375, 0.06428718566894531, 0.06916046142578125, 0.07403373718261719, 0.07890701293945312, 0.08378028869628906, 0.088653564453125, 0.09352684020996094, 0.09840011596679688, 0.10327339172363281, 0.10814666748046875, 0.11301994323730469, 0.11789321899414062, 0.12276649475097656, 0.1276397705078125, 0.13251304626464844, 0.13738632202148438, 0.1422595977783203, 0.14713287353515625, 0.1520061492919922, 0.15687942504882812, 0.16175270080566406, 0.1666259765625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 13.0, 13.0, 16.0, 20.0, 30.0, 31.0, 30.0, 50.0, 62.0, 63.0, 88.0, 111.0, 130.0, 151.0, 198.0, 226.0, 251.0, 301.0, 302.0, 321.0, 290.0, 266.0, 199.0, 188.0, 135.0, 114.0, 99.0, 77.0, 52.0, 64.0, 49.0, 41.0, 22.0, 27.0, 11.0, 13.0, 7.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03912353515625, -0.03771162033081055, -0.036299705505371094, -0.03488779067993164, -0.03347587585449219, -0.032063961029052734, -0.03065204620361328, -0.029240131378173828, -0.027828216552734375, -0.026416301727294922, -0.02500438690185547, -0.023592472076416016, -0.022180557250976562, -0.02076864242553711, -0.019356727600097656, -0.017944812774658203, -0.01653289794921875, -0.015120983123779297, -0.013709068298339844, -0.01229715347290039, -0.010885238647460938, -0.009473323822021484, -0.008061408996582031, -0.006649494171142578, -0.005237579345703125, -0.003825664520263672, -0.0024137496948242188, -0.0010018348693847656, 0.0004100799560546875, 0.0018219947814941406, 0.0032339096069335938, 0.004645824432373047, 0.0060577392578125, 0.007469654083251953, 0.008881568908691406, 0.01029348373413086, 0.011705398559570312, 0.013117313385009766, 0.014529228210449219, 0.015941143035888672, 0.017353057861328125, 0.018764972686767578, 0.02017688751220703, 0.021588802337646484, 0.023000717163085938, 0.02441263198852539, 0.025824546813964844, 0.027236461639404297, 0.02864837646484375, 0.030060291290283203, 0.031472206115722656, 0.03288412094116211, 0.03429603576660156, 0.035707950592041016, 0.03711986541748047, 0.03853178024291992, 0.039943695068359375, 0.04135560989379883, 0.04276752471923828, 0.044179439544677734, 0.04559135437011719, 0.04700326919555664, 0.048415184020996094, 0.04982709884643555, 0.051239013671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 10.0, 14.0, 14.0, 26.0, 32.0, 38.0, 44.0, 67.0, 73.0, 96.0, 122.0, 95.0, 88.0, 57.0, 52.0, 39.0, 31.0, 28.0, 16.0, 6.0, 9.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15770062804222107, -0.15328910946846008, -0.1488776057958603, -0.1444661021232605, -0.1400545835494995, -0.13564306497573853, -0.13123156130313873, -0.12682005763053894, -0.12240853905677795, -0.11799702793359756, -0.11358551681041718, -0.10917400568723679, -0.1047624945640564, -0.10035098344087601, -0.09593947231769562, -0.09152796119451523, -0.08711645007133484, -0.08270493894815445, -0.07829342782497406, -0.07388191670179367, -0.06947040557861328, -0.06505889445543289, -0.0606473833322525, -0.05623587220907211, -0.051824361085891724, -0.047412849962711334, -0.043001338839530945, -0.038589827716350555, -0.034178316593170166, -0.029766805469989777, -0.025355294346809387, -0.020943783223628998, -0.016532257199287415, -0.012120746076107025, -0.007709234952926636, -0.0032977238297462463, 0.001113787293434143, 0.0055252984166145325, 0.009936809539794922, 0.014348320662975311, 0.0187598317861557, 0.02317134290933609, 0.02758285403251648, 0.03199436515569687, 0.03640587627887726, 0.04081738740205765, 0.04522889852523804, 0.049640409648418427, 0.054051920771598816, 0.058463431894779205, 0.0628749430179596, 0.06728645414113998, 0.07169796526432037, 0.07610947638750076, 0.08052098751068115, 0.08493249863386154, 0.08934400975704193, 0.09375552088022232, 0.09816703200340271, 0.1025785431265831, 0.10699005424976349, 0.11140156537294388, 0.11581307649612427, 0.12022458761930466, 0.12463609874248505]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 12.0, 10.0, 18.0, 20.0, 21.0, 26.0, 27.0, 20.0, 30.0, 36.0, 32.0, 33.0, 41.0, 41.0, 46.0, 44.0, 34.0, 31.0, 37.0, 34.0, 48.0, 38.0, 31.0, 33.0, 32.0, 21.0, 25.0, 20.0, 20.0, 19.0, 12.0, 13.0, 11.0, 9.0, 13.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.0746145099401474, -0.07216963171958923, -0.06972475349903107, -0.0672798752784729, -0.06483499705791473, -0.06239011883735657, -0.0599452406167984, -0.057500362396240234, -0.05505548417568207, -0.0526106059551239, -0.050165727734565735, -0.04772084951400757, -0.0452759712934494, -0.042831093072891235, -0.04038621485233307, -0.0379413366317749, -0.035496458411216736, -0.03305158019065857, -0.030606701970100403, -0.028161823749542236, -0.02571694552898407, -0.023272067308425903, -0.020827189087867737, -0.01838231086730957, -0.015937432646751404, -0.013492554426193237, -0.01104767620563507, -0.008602797985076904, -0.006157919764518738, -0.0037130415439605713, -0.0012681633234024048, 0.0011767148971557617, 0.0036215856671333313, 0.006066463887691498, 0.008511342108249664, 0.01095622032880783, 0.013401098549365997, 0.015845976769924164, 0.01829085499048233, 0.020735733211040497, 0.023180611431598663, 0.02562548965215683, 0.028070367872714996, 0.030515246093273163, 0.03296012431383133, 0.035405002534389496, 0.03784988075494766, 0.04029475897550583, 0.042739637196063995, 0.04518451541662216, 0.04762939363718033, 0.050074271857738495, 0.05251915007829666, 0.05496402829885483, 0.057408906519412994, 0.05985378473997116, 0.06229866296052933, 0.0647435411810875, 0.06718841940164566, 0.06963329762220383, 0.072078175842762, 0.07452305406332016, 0.07696793228387833, 0.07941281050443649, 0.08185768872499466]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 8.0, 9.0, 13.0, 26.0, 31.0, 51.0, 67.0, 104.0, 118.0, 170.0, 269.0, 391.0, 526.0, 716.0, 1080.0, 1549.0, 2186.0, 3189.0, 4722.0, 6984.0, 10432.0, 15883.0, 24693.0, 39588.0, 66535.0, 125504.0, 288971.0, 210413.0, 95628.0, 53274.0, 32960.0, 21038.0, 13409.0, 8878.0, 5905.0, 4130.0, 2759.0, 1893.0, 1303.0, 959.0, 641.0, 454.0, 344.0, 215.0, 184.0, 108.0, 73.0, 53.0, 32.0, 30.0, 19.0, 12.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.058197021484375, -0.0562443733215332, -0.054291725158691406, -0.05233907699584961, -0.05038642883300781, -0.048433780670166016, -0.04648113250732422, -0.04452848434448242, -0.042575836181640625, -0.04062318801879883, -0.03867053985595703, -0.036717891693115234, -0.03476524353027344, -0.03281259536743164, -0.030859947204589844, -0.028907299041748047, -0.02695465087890625, -0.025002002716064453, -0.023049354553222656, -0.02109670639038086, -0.019144058227539062, -0.017191410064697266, -0.015238761901855469, -0.013286113739013672, -0.011333465576171875, -0.009380817413330078, -0.007428169250488281, -0.005475521087646484, -0.0035228729248046875, -0.0015702247619628906, 0.00038242340087890625, 0.002335071563720703, 0.0042877197265625, 0.006240367889404297, 0.008193016052246094, 0.01014566421508789, 0.012098312377929688, 0.014050960540771484, 0.01600360870361328, 0.017956256866455078, 0.019908905029296875, 0.021861553192138672, 0.02381420135498047, 0.025766849517822266, 0.027719497680664062, 0.02967214584350586, 0.031624794006347656, 0.03357744216918945, 0.03553009033203125, 0.03748273849487305, 0.039435386657714844, 0.04138803482055664, 0.04334068298339844, 0.045293331146240234, 0.04724597930908203, 0.04919862747192383, 0.051151275634765625, 0.05310392379760742, 0.05505657196044922, 0.057009220123291016, 0.05896186828613281, 0.06091451644897461, 0.0628671646118164, 0.0648198127746582, 0.0667724609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 13.0, 11.0, 14.0, 19.0, 19.0, 17.0, 28.0, 25.0, 16.0, 34.0, 39.0, 30.0, 45.0, 43.0, 46.0, 39.0, 48.0, 41.0, 43.0, 38.0, 47.0, 44.0, 34.0, 33.0, 27.0, 28.0, 25.0, 24.0, 12.0, 24.0, 12.0, 11.0, 14.0, 7.0, 7.0, 11.0, 5.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07819080352783203, -0.07551002502441406, -0.0728292465209961, -0.07014846801757812, -0.06746768951416016, -0.06478691101074219, -0.06210613250732422, -0.05942535400390625, -0.05674457550048828, -0.05406379699707031, -0.051383018493652344, -0.048702239990234375, -0.046021461486816406, -0.04334068298339844, -0.04065990447998047, -0.0379791259765625, -0.03529834747314453, -0.03261756896972656, -0.029936790466308594, -0.027256011962890625, -0.024575233459472656, -0.021894454956054688, -0.01921367645263672, -0.01653289794921875, -0.013852119445800781, -0.011171340942382812, -0.008490562438964844, -0.005809783935546875, -0.0031290054321289062, -0.0004482269287109375, 0.0022325515747070312, 0.004913330078125, 0.007594108581542969, 0.010274887084960938, 0.012955665588378906, 0.015636444091796875, 0.018317222595214844, 0.020998001098632812, 0.02367877960205078, 0.02635955810546875, 0.02904033660888672, 0.03172111511230469, 0.034401893615722656, 0.037082672119140625, 0.039763450622558594, 0.04244422912597656, 0.04512500762939453, 0.0478057861328125, 0.05048656463623047, 0.05316734313964844, 0.055848121643066406, 0.058528900146484375, 0.061209678649902344, 0.06389045715332031, 0.06657123565673828, 0.06925201416015625, 0.07193279266357422, 0.07461357116699219, 0.07729434967041016, 0.07997512817382812, 0.0826559066772461, 0.08533668518066406, 0.08801746368408203, 0.0906982421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 16.0, 27.0, 26.0, 34.0, 51.0, 81.0, 116.0, 149.0, 203.0, 308.0, 451.0, 655.0, 987.0, 1376.0, 2116.0, 3398.0, 5613.0, 10016.0, 19942.0, 50333.0, 447987.0, 410706.0, 49219.0, 19486.0, 9775.0, 5513.0, 3347.0, 2142.0, 1353.0, 954.0, 689.0, 448.0, 323.0, 211.0, 153.0, 106.0, 72.0, 51.0, 31.0, 21.0, 20.0, 13.0, 12.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.14453125, -0.1401500701904297, -0.13576889038085938, -0.13138771057128906, -0.12700653076171875, -0.12262535095214844, -0.11824417114257812, -0.11386299133300781, -0.1094818115234375, -0.10510063171386719, -0.10071945190429688, -0.09633827209472656, -0.09195709228515625, -0.08757591247558594, -0.08319473266601562, -0.07881355285644531, -0.074432373046875, -0.07005119323730469, -0.06567001342773438, -0.06128883361816406, -0.05690765380859375, -0.05252647399902344, -0.048145294189453125, -0.04376411437988281, -0.0393829345703125, -0.03500175476074219, -0.030620574951171875, -0.026239395141601562, -0.02185821533203125, -0.017477035522460938, -0.013095855712890625, -0.008714675903320312, -0.00433349609375, 4.76837158203125e-05, 0.004428863525390625, 0.008810043334960938, 0.01319122314453125, 0.017572402954101562, 0.021953582763671875, 0.026334762573242188, 0.0307159423828125, 0.03509712219238281, 0.039478302001953125, 0.04385948181152344, 0.04824066162109375, 0.05262184143066406, 0.057003021240234375, 0.06138420104980469, 0.065765380859375, 0.07014656066894531, 0.07452774047851562, 0.07890892028808594, 0.08329010009765625, 0.08767127990722656, 0.09205245971679688, 0.09643363952636719, 0.1008148193359375, 0.10519599914550781, 0.10957717895507812, 0.11395835876464844, 0.11833953857421875, 0.12272071838378906, 0.12710189819335938, 0.1314830780029297, 0.1358642578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 5.0, 5.0, 8.0, 9.0, 13.0, 10.0, 8.0, 13.0, 14.0, 20.0, 15.0, 23.0, 34.0, 25.0, 24.0, 27.0, 52.0, 43.0, 31.0, 32.0, 44.0, 33.0, 28.0, 38.0, 37.0, 41.0, 32.0, 34.0, 28.0, 28.0, 31.0, 26.0, 27.0, 15.0, 24.0, 10.0, 16.0, 19.0, 16.0, 13.0, 8.0, 6.0, 7.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.051849365234375, -0.05031299591064453, -0.04877662658691406, -0.047240257263183594, -0.045703887939453125, -0.044167518615722656, -0.04263114929199219, -0.04109477996826172, -0.03955841064453125, -0.03802204132080078, -0.03648567199707031, -0.034949302673339844, -0.033412933349609375, -0.031876564025878906, -0.030340194702148438, -0.02880382537841797, -0.0272674560546875, -0.02573108673095703, -0.024194717407226562, -0.022658348083496094, -0.021121978759765625, -0.019585609436035156, -0.018049240112304688, -0.01651287078857422, -0.01497650146484375, -0.013440132141113281, -0.011903762817382812, -0.010367393493652344, -0.008831024169921875, -0.007294654846191406, -0.0057582855224609375, -0.004221916198730469, -0.002685546875, -0.0011491775512695312, 0.0003871917724609375, 0.0019235610961914062, 0.003459930419921875, 0.004996299743652344, 0.0065326690673828125, 0.008069038391113281, 0.00960540771484375, 0.011141777038574219, 0.012678146362304688, 0.014214515686035156, 0.015750885009765625, 0.017287254333496094, 0.018823623657226562, 0.02035999298095703, 0.0218963623046875, 0.02343273162841797, 0.024969100952148438, 0.026505470275878906, 0.028041839599609375, 0.029578208923339844, 0.031114578247070312, 0.03265094757080078, 0.03418731689453125, 0.03572368621826172, 0.03726005554199219, 0.038796424865722656, 0.040332794189453125, 0.041869163513183594, 0.04340553283691406, 0.04494190216064453, 0.046478271484375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 7.0, 7.0, 20.0, 22.0, 24.0, 26.0, 51.0, 65.0, 89.0, 104.0, 170.0, 230.0, 338.0, 483.0, 729.0, 1171.0, 1960.0, 3414.0, 6722.0, 15035.0, 49372.0, 738534.0, 177888.0, 29041.0, 10621.0, 5086.0, 2683.0, 1625.0, 950.0, 602.0, 419.0, 281.0, 213.0, 150.0, 105.0, 84.0, 77.0, 41.0, 32.0, 24.0, 13.0, 12.0, 7.0, 11.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.024383544921875, -0.023591995239257812, -0.022800445556640625, -0.022008895874023438, -0.02121734619140625, -0.020425796508789062, -0.019634246826171875, -0.018842697143554688, -0.0180511474609375, -0.017259597778320312, -0.016468048095703125, -0.015676498413085938, -0.01488494873046875, -0.014093399047851562, -0.013301849365234375, -0.012510299682617188, -0.01171875, -0.010927200317382812, -0.010135650634765625, -0.009344100952148438, -0.00855255126953125, -0.0077610015869140625, -0.006969451904296875, -0.0061779022216796875, -0.0053863525390625, -0.0045948028564453125, -0.003803253173828125, -0.0030117034912109375, -0.00222015380859375, -0.0014286041259765625, -0.000637054443359375, 0.0001544952392578125, 0.000946044921875, 0.0017375946044921875, 0.002529144287109375, 0.0033206939697265625, 0.00411224365234375, 0.0049037933349609375, 0.005695343017578125, 0.0064868927001953125, 0.0072784423828125, 0.008069992065429688, 0.008861541748046875, 0.009653091430664062, 0.01044464111328125, 0.011236190795898438, 0.012027740478515625, 0.012819290161132812, 0.01361083984375, 0.014402389526367188, 0.015193939208984375, 0.015985488891601562, 0.01677703857421875, 0.017568588256835938, 0.018360137939453125, 0.019151687622070312, 0.0199432373046875, 0.020734786987304688, 0.021526336669921875, 0.022317886352539062, 0.02310943603515625, 0.023900985717773438, 0.024692535400390625, 0.025484085083007812, 0.026275634765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 7.0, 3.0, 3.0, 10.0, 11.0, 9.0, 0.0, 16.0, 19.0, 25.0, 33.0, 53.0, 54.0, 0.0, 79.0, 62.0, 78.0, 81.0, 91.0, 67.0, 0.0, 56.0, 62.0, 36.0, 45.0, 24.0, 15.0, 0.0, 19.0, 12.0, 11.0, 9.0, 4.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6177073121070862e-06, -1.5664845705032349e-06, -1.5152618288993835e-06, -1.4640390872955322e-06, -1.412816345691681e-06, -1.3615936040878296e-06, -1.3103708624839783e-06, -1.259148120880127e-06, -1.2079253792762756e-06, -1.1567026376724243e-06, -1.105479896068573e-06, -1.0542571544647217e-06, -1.0030344128608704e-06, -9.51811671257019e-07, -9.005889296531677e-07, -8.493661880493164e-07, -7.981434464454651e-07, -7.469207048416138e-07, -6.956979632377625e-07, -6.444752216339111e-07, -5.932524800300598e-07, -5.420297384262085e-07, -4.908069968223572e-07, -4.3958425521850586e-07, -3.8836151361465454e-07, -3.371387720108032e-07, -2.859160304069519e-07, -2.3469328880310059e-07, -1.8347054719924927e-07, -1.3224780559539795e-07, -8.102506399154663e-08, -2.9802322387695312e-08, 2.1420419216156006e-08, 7.264316082000732e-08, 1.2386590242385864e-07, 1.7508864402770996e-07, 2.2631138563156128e-07, 2.775341272354126e-07, 3.287568688392639e-07, 3.7997961044311523e-07, 4.3120235204696655e-07, 4.824250936508179e-07, 5.336478352546692e-07, 5.848705768585205e-07, 6.360933184623718e-07, 6.873160600662231e-07, 7.385388016700745e-07, 7.897615432739258e-07, 8.409842848777771e-07, 8.922070264816284e-07, 9.434297680854797e-07, 9.94652509689331e-07, 1.0458752512931824e-06, 1.0970979928970337e-06, 1.148320734500885e-06, 1.1995434761047363e-06, 1.2507662177085876e-06, 1.301988959312439e-06, 1.3532117009162903e-06, 1.4044344425201416e-06, 1.455657184123993e-06, 1.5068799257278442e-06, 1.5581026673316956e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 11.0, 16.0, 22.0, 28.0, 43.0, 43.0, 78.0, 113.0, 130.0, 176.0, 257.0, 347.0, 456.0, 735.0, 996.0, 1495.0, 2182.0, 3590.0, 5763.0, 10035.0, 18632.0, 39298.0, 112001.0, 540392.0, 198547.0, 56671.0, 24407.0, 12511.0, 6987.0, 4249.0, 2632.0, 1741.0, 1147.0, 800.0, 530.0, 441.0, 276.0, 214.0, 158.0, 98.0, 78.0, 60.0, 38.0, 34.0, 31.0, 17.0, 12.0, 9.0, 10.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.01617431640625, -0.015679597854614258, -0.015184879302978516, -0.014690160751342773, -0.014195442199707031, -0.013700723648071289, -0.013206005096435547, -0.012711286544799805, -0.012216567993164062, -0.01172184944152832, -0.011227130889892578, -0.010732412338256836, -0.010237693786621094, -0.009742975234985352, -0.00924825668334961, -0.008753538131713867, -0.008258819580078125, -0.007764101028442383, -0.007269382476806641, -0.0067746639251708984, -0.006279945373535156, -0.005785226821899414, -0.005290508270263672, -0.00479578971862793, -0.0043010711669921875, -0.0038063526153564453, -0.003311634063720703, -0.002816915512084961, -0.0023221969604492188, -0.0018274784088134766, -0.0013327598571777344, -0.0008380413055419922, -0.00034332275390625, 0.0001513957977294922, 0.0006461143493652344, 0.0011408329010009766, 0.0016355514526367188, 0.002130270004272461, 0.002624988555908203, 0.0031197071075439453, 0.0036144256591796875, 0.00410914421081543, 0.004603862762451172, 0.005098581314086914, 0.005593299865722656, 0.0060880184173583984, 0.006582736968994141, 0.007077455520629883, 0.007572174072265625, 0.008066892623901367, 0.00856161117553711, 0.009056329727172852, 0.009551048278808594, 0.010045766830444336, 0.010540485382080078, 0.01103520393371582, 0.011529922485351562, 0.012024641036987305, 0.012519359588623047, 0.013014078140258789, 0.013508796691894531, 0.014003515243530273, 0.014498233795166016, 0.014992952346801758, 0.0154876708984375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 8.0, 3.0, 5.0, 3.0, 7.0, 15.0, 16.0, 26.0, 19.0, 43.0, 35.0, 63.0, 125.0, 198.0, 123.0, 62.0, 55.0, 37.0, 35.0, 17.0, 21.0, 10.0, 15.0, 8.0, 3.0, 11.0, 8.0, 2.0, 4.0, 1.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038089752197265625, -0.0036701858043670654, -0.0035313963890075684, -0.0033926069736480713, -0.0032538175582885742, -0.003115028142929077, -0.00297623872756958, -0.002837449312210083, -0.002698659896850586, -0.002559870481491089, -0.002421081066131592, -0.0022822916507720947, -0.0021435022354125977, -0.0020047128200531006, -0.0018659234046936035, -0.0017271339893341064, -0.0015883445739746094, -0.0014495551586151123, -0.0013107657432556152, -0.0011719763278961182, -0.001033186912536621, -0.000894397497177124, -0.000755608081817627, -0.0006168186664581299, -0.0004780292510986328, -0.00033923983573913574, -0.00020045042037963867, -6.16610050201416e-05, 7.712841033935547e-05, 0.00021591782569885254, 0.0003547072410583496, 0.0004934966564178467, 0.0006322860717773438, 0.0007710754871368408, 0.0009098649024963379, 0.001048654317855835, 0.001187443733215332, 0.001326233148574829, 0.0014650225639343262, 0.0016038119792938232, 0.0017426013946533203, 0.0018813908100128174, 0.0020201802253723145, 0.0021589696407318115, 0.0022977590560913086, 0.0024365484714508057, 0.0025753378868103027, 0.0027141273021698, 0.002852916717529297, 0.002991706132888794, 0.003130495548248291, 0.003269284963607788, 0.003408074378967285, 0.0035468637943267822, 0.0036856532096862793, 0.0038244426250457764, 0.0039632320404052734, 0.0041020214557647705, 0.004240810871124268, 0.004379600286483765, 0.004518389701843262, 0.004657179117202759, 0.004795968532562256, 0.004934757947921753, 0.00507354736328125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 10.0, 11.0, 13.0, 34.0, 19.0, 40.0, 37.0, 65.0, 78.0, 84.0, 128.0, 103.0, 90.0, 51.0, 57.0, 35.0, 34.0, 28.0, 14.0, 11.0, 17.0, 5.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15215714275836945, -0.14779318869113922, -0.1434292495250702, -0.13906529545783997, -0.13470134139060974, -0.13033738732337952, -0.12597344815731049, -0.12160949409008026, -0.11724554747343063, -0.112881600856781, -0.10851764678955078, -0.10415370017290115, -0.09978975355625153, -0.0954257994890213, -0.09106185287237167, -0.08669790625572205, -0.08233395218849182, -0.0779700055718422, -0.07360605150461197, -0.06924210488796234, -0.06487815082073212, -0.06051420420408249, -0.05615025758743286, -0.051786307245492935, -0.04742235690355301, -0.04305840656161308, -0.03869445621967316, -0.03433050960302353, -0.029966559261083603, -0.025602608919143677, -0.0212386604398489, -0.016874711960554123, -0.01251077651977539, -0.008146827109158039, -0.0037828776985406876, 0.000581071712076664, 0.0049450211226940155, 0.009308971464633942, 0.013672919943928719, 0.018036868423223495, 0.02240081876516342, 0.026764769107103348, 0.031128717586398125, 0.0354926660656929, 0.03985661640763283, 0.044220566749572754, 0.04858451336622238, 0.05294846370816231, 0.057312414050102234, 0.06167636439204216, 0.06604031473398209, 0.07040426135063171, 0.07476821541786194, 0.07913216203451157, 0.0834961086511612, 0.08786006271839142, 0.09222400933504105, 0.09658795595169067, 0.1009519100189209, 0.10531585663557053, 0.10967980325222015, 0.11404375731945038, 0.1184077039361, 0.12277165055274963, 0.12713560461997986]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 13.0, 14.0, 17.0, 21.0, 18.0, 25.0, 32.0, 13.0, 34.0, 45.0, 25.0, 35.0, 41.0, 36.0, 54.0, 38.0, 34.0, 36.0, 34.0, 40.0, 43.0, 33.0, 34.0, 31.0, 35.0, 16.0, 29.0, 17.0, 18.0, 22.0, 13.0, 9.0, 13.0, 11.0, 11.0, 4.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0738101676106453, -0.07139213383197784, -0.0689741000533104, -0.06655605882406235, -0.0641380250453949, -0.06171999126672745, -0.05930195748806, -0.05688392370939255, -0.0544658862054348, -0.05204785242676735, -0.0496298149228096, -0.04721178114414215, -0.0447937473654747, -0.04237570986151695, -0.0399576760828495, -0.037539638578891754, -0.035121604800224304, -0.032703571021556854, -0.030285533517599106, -0.027867499738931656, -0.025449464097619057, -0.023031428456306458, -0.020613394677639008, -0.01819535903632641, -0.01577732339501381, -0.01335928775370121, -0.010941253043711185, -0.008523218333721161, -0.006105182692408562, -0.0036871470510959625, -0.001269112341105938, 0.0011489223688840866, 0.003566958010196686, 0.005984993185847998, 0.00840302836149931, 0.010821063071489334, 0.013239098712801933, 0.015657134354114532, 0.018075168132781982, 0.02049320377409458, 0.02291123941540718, 0.02532927505671978, 0.02774731069803238, 0.03016534447669983, 0.03258337825536728, 0.03500141575932503, 0.03741944953799248, 0.039837487041950226, 0.042255520820617676, 0.044673554599285126, 0.047091592103242874, 0.049509625881910324, 0.05192766338586807, 0.05434569716453552, 0.05676373094320297, 0.05918176472187042, 0.06159980222582817, 0.06401783972978592, 0.06643587350845337, 0.06885390728712082, 0.07127194106578827, 0.07368998229503632, 0.07610801607370377, 0.07852604985237122, 0.08094408363103867]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 11.0, 13.0, 26.0, 27.0, 47.0, 78.0, 112.0, 165.0, 251.0, 339.0, 542.0, 727.0, 1104.0, 1662.0, 2405.0, 3494.0, 5021.0, 7391.0, 11305.0, 16828.0, 26332.0, 42945.0, 74577.0, 139964.0, 258417.0, 198415.0, 102063.0, 56690.0, 33999.0, 21174.0, 13857.0, 9113.0, 6076.0, 4289.0, 2937.0, 1908.0, 1351.0, 890.0, 620.0, 423.0, 299.0, 197.0, 137.0, 109.0, 74.0, 47.0, 30.0, 24.0, 21.0, 14.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.15283203125, -0.14816665649414062, -0.14350128173828125, -0.13883590698242188, -0.1341705322265625, -0.12950515747070312, -0.12483978271484375, -0.12017440795898438, -0.115509033203125, -0.11084365844726562, -0.10617828369140625, -0.10151290893554688, -0.0968475341796875, -0.09218215942382812, -0.08751678466796875, -0.08285140991210938, -0.07818603515625, -0.07352066040039062, -0.06885528564453125, -0.06418991088867188, -0.0595245361328125, -0.054859161376953125, -0.05019378662109375, -0.045528411865234375, -0.040863037109375, -0.036197662353515625, -0.03153228759765625, -0.026866912841796875, -0.0222015380859375, -0.017536163330078125, -0.01287078857421875, -0.008205413818359375, -0.0035400390625, 0.001125335693359375, 0.00579071044921875, 0.010456085205078125, 0.0151214599609375, 0.019786834716796875, 0.02445220947265625, 0.029117584228515625, 0.033782958984375, 0.038448333740234375, 0.04311370849609375, 0.047779083251953125, 0.0524444580078125, 0.057109832763671875, 0.06177520751953125, 0.06644058227539062, 0.07110595703125, 0.07577133178710938, 0.08043670654296875, 0.08510208129882812, 0.0897674560546875, 0.09443283081054688, 0.09909820556640625, 0.10376358032226562, 0.108428955078125, 0.11309432983398438, 0.11775970458984375, 0.12242507934570312, 0.1270904541015625, 0.13175582885742188, 0.13642120361328125, 0.14108657836914062, 0.145751953125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 9.0, 4.0, 7.0, 9.0, 12.0, 15.0, 17.0, 17.0, 14.0, 19.0, 29.0, 28.0, 33.0, 29.0, 29.0, 40.0, 30.0, 41.0, 43.0, 34.0, 34.0, 34.0, 30.0, 35.0, 50.0, 35.0, 43.0, 29.0, 26.0, 24.0, 26.0, 23.0, 20.0, 21.0, 17.0, 8.0, 13.0, 21.0, 6.0, 6.0, 5.0, 6.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.060394287109375, -0.05832529067993164, -0.05625629425048828, -0.05418729782104492, -0.05211830139160156, -0.0500493049621582, -0.047980308532714844, -0.045911312103271484, -0.043842315673828125, -0.041773319244384766, -0.039704322814941406, -0.03763532638549805, -0.03556632995605469, -0.03349733352661133, -0.03142833709716797, -0.02935934066772461, -0.02729034423828125, -0.02522134780883789, -0.02315235137939453, -0.021083354949951172, -0.019014358520507812, -0.016945362091064453, -0.014876365661621094, -0.012807369232177734, -0.010738372802734375, -0.008669376373291016, -0.006600379943847656, -0.004531383514404297, -0.0024623870849609375, -0.0003933906555175781, 0.0016756057739257812, 0.0037446022033691406, 0.0058135986328125, 0.00788259506225586, 0.009951591491699219, 0.012020587921142578, 0.014089584350585938, 0.016158580780029297, 0.018227577209472656, 0.020296573638916016, 0.022365570068359375, 0.024434566497802734, 0.026503562927246094, 0.028572559356689453, 0.030641555786132812, 0.03271055221557617, 0.03477954864501953, 0.03684854507446289, 0.03891754150390625, 0.04098653793334961, 0.04305553436279297, 0.04512453079223633, 0.04719352722167969, 0.04926252365112305, 0.051331520080566406, 0.053400516510009766, 0.055469512939453125, 0.057538509368896484, 0.059607505798339844, 0.0616765022277832, 0.06374549865722656, 0.06581449508666992, 0.06788349151611328, 0.06995248794555664, 0.072021484375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 10.0, 5.0, 17.0, 28.0, 27.0, 41.0, 53.0, 82.0, 110.0, 169.0, 251.0, 421.0, 653.0, 969.0, 1359.0, 2187.0, 3418.0, 5212.0, 8300.0, 12996.0, 21035.0, 34087.0, 55117.0, 93511.0, 174342.0, 271348.0, 149019.0, 82978.0, 48885.0, 30310.0, 18872.0, 11792.0, 7349.0, 4754.0, 3052.0, 2005.0, 1278.0, 804.0, 527.0, 368.0, 242.0, 157.0, 110.0, 91.0, 66.0, 44.0, 22.0, 29.0, 15.0, 12.0, 8.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.14013671875, -0.13552474975585938, -0.13091278076171875, -0.12630081176757812, -0.1216888427734375, -0.11707687377929688, -0.11246490478515625, -0.10785293579101562, -0.103240966796875, -0.09862899780273438, -0.09401702880859375, -0.08940505981445312, -0.0847930908203125, -0.08018112182617188, -0.07556915283203125, -0.07095718383789062, -0.06634521484375, -0.061733245849609375, -0.05712127685546875, -0.052509307861328125, -0.0478973388671875, -0.043285369873046875, -0.03867340087890625, -0.034061431884765625, -0.029449462890625, -0.024837493896484375, -0.02022552490234375, -0.015613555908203125, -0.0110015869140625, -0.006389617919921875, -0.00177764892578125, 0.002834320068359375, 0.0074462890625, 0.012058258056640625, 0.01667022705078125, 0.021282196044921875, 0.0258941650390625, 0.030506134033203125, 0.03511810302734375, 0.039730072021484375, 0.044342041015625, 0.048954010009765625, 0.05356597900390625, 0.058177947998046875, 0.0627899169921875, 0.06740188598632812, 0.07201385498046875, 0.07662582397460938, 0.08123779296875, 0.08584976196289062, 0.09046173095703125, 0.09507369995117188, 0.0996856689453125, 0.10429763793945312, 0.10890960693359375, 0.11352157592773438, 0.118133544921875, 0.12274551391601562, 0.12735748291015625, 0.13196945190429688, 0.1365814208984375, 0.14119338989257812, 0.14580535888671875, 0.15041732788085938, 0.155029296875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 10.0, 14.0, 8.0, 12.0, 12.0, 15.0, 11.0, 23.0, 29.0, 30.0, 28.0, 29.0, 30.0, 32.0, 29.0, 37.0, 42.0, 35.0, 40.0, 45.0, 31.0, 33.0, 30.0, 52.0, 34.0, 31.0, 40.0, 50.0, 24.0, 27.0, 23.0, 13.0, 23.0, 16.0, 12.0, 12.0, 10.0, 6.0, 5.0, 8.0, 4.0, 6.0, 0.0, 1.0, 2.0], "bins": [-0.05352783203125, -0.052135467529296875, -0.05074310302734375, -0.049350738525390625, -0.0479583740234375, -0.046566009521484375, -0.04517364501953125, -0.043781280517578125, -0.042388916015625, -0.040996551513671875, -0.03960418701171875, -0.038211822509765625, -0.0368194580078125, -0.035427093505859375, -0.03403472900390625, -0.032642364501953125, -0.03125, -0.029857635498046875, -0.02846527099609375, -0.027072906494140625, -0.0256805419921875, -0.024288177490234375, -0.02289581298828125, -0.021503448486328125, -0.020111083984375, -0.018718719482421875, -0.01732635498046875, -0.015933990478515625, -0.0145416259765625, -0.013149261474609375, -0.01175689697265625, -0.010364532470703125, -0.00897216796875, -0.007579803466796875, -0.00618743896484375, -0.004795074462890625, -0.0034027099609375, -0.002010345458984375, -0.00061798095703125, 0.000774383544921875, 0.002166748046875, 0.003559112548828125, 0.00495147705078125, 0.006343841552734375, 0.0077362060546875, 0.009128570556640625, 0.01052093505859375, 0.011913299560546875, 0.0133056640625, 0.014698028564453125, 0.01609039306640625, 0.017482757568359375, 0.0188751220703125, 0.020267486572265625, 0.02165985107421875, 0.023052215576171875, 0.024444580078125, 0.025836944580078125, 0.02722930908203125, 0.028621673583984375, 0.0300140380859375, 0.031406402587890625, 0.03279876708984375, 0.034191131591796875, 0.03558349609375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 12.0, 10.0, 12.0, 18.0, 24.0, 34.0, 45.0, 61.0, 73.0, 109.0, 125.0, 191.0, 275.0, 345.0, 428.0, 600.0, 824.0, 1202.0, 1690.0, 2525.0, 3894.0, 6400.0, 10692.0, 22999.0, 754571.0, 192073.0, 21070.0, 10114.0, 6002.0, 3813.0, 2476.0, 1572.0, 1176.0, 789.0, 601.0, 438.0, 313.0, 245.0, 173.0, 135.0, 105.0, 82.0, 64.0, 44.0, 35.0, 22.0, 9.0, 13.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.03753662109375, -0.036397457122802734, -0.03525829315185547, -0.0341191291809082, -0.03297996520996094, -0.03184080123901367, -0.030701637268066406, -0.02956247329711914, -0.028423309326171875, -0.02728414535522461, -0.026144981384277344, -0.025005817413330078, -0.023866653442382812, -0.022727489471435547, -0.02158832550048828, -0.020449161529541016, -0.01930999755859375, -0.018170833587646484, -0.01703166961669922, -0.015892505645751953, -0.014753341674804688, -0.013614177703857422, -0.012475013732910156, -0.01133584976196289, -0.010196685791015625, -0.00905752182006836, -0.007918357849121094, -0.006779193878173828, -0.0056400299072265625, -0.004500865936279297, -0.0033617019653320312, -0.0022225379943847656, -0.0010833740234375, 5.5789947509765625e-05, 0.0011949539184570312, 0.002334117889404297, 0.0034732818603515625, 0.004612445831298828, 0.005751609802246094, 0.006890773773193359, 0.008029937744140625, 0.00916910171508789, 0.010308265686035156, 0.011447429656982422, 0.012586593627929688, 0.013725757598876953, 0.014864921569824219, 0.016004085540771484, 0.01714324951171875, 0.018282413482666016, 0.01942157745361328, 0.020560741424560547, 0.021699905395507812, 0.022839069366455078, 0.023978233337402344, 0.02511739730834961, 0.026256561279296875, 0.02739572525024414, 0.028534889221191406, 0.029674053192138672, 0.030813217163085938, 0.0319523811340332, 0.03309154510498047, 0.034230709075927734, 0.035369873046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 4.0, 7.0, 7.0, 5.0, 14.0, 19.0, 16.0, 30.0, 52.0, 69.0, 85.0, 118.0, 127.0, 106.0, 83.0, 79.0, 54.0, 29.0, 35.0, 18.0, 8.0, 7.0, 9.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1324882507324219e-06, -1.0728836059570312e-06, -1.0132789611816406e-06, -9.5367431640625e-07, -8.940696716308594e-07, -8.344650268554688e-07, -7.748603820800781e-07, -7.152557373046875e-07, -6.556510925292969e-07, -5.960464477539062e-07, -5.364418029785156e-07, -4.76837158203125e-07, -4.172325134277344e-07, -3.5762786865234375e-07, -2.980232238769531e-07, -2.384185791015625e-07, -1.7881393432617188e-07, -1.1920928955078125e-07, -5.960464477539063e-08, 0.0, 5.960464477539063e-08, 1.1920928955078125e-07, 1.7881393432617188e-07, 2.384185791015625e-07, 2.980232238769531e-07, 3.5762786865234375e-07, 4.172325134277344e-07, 4.76837158203125e-07, 5.364418029785156e-07, 5.960464477539062e-07, 6.556510925292969e-07, 7.152557373046875e-07, 7.748603820800781e-07, 8.344650268554688e-07, 8.940696716308594e-07, 9.5367431640625e-07, 1.0132789611816406e-06, 1.0728836059570312e-06, 1.1324882507324219e-06, 1.1920928955078125e-06, 1.2516975402832031e-06, 1.3113021850585938e-06, 1.3709068298339844e-06, 1.430511474609375e-06, 1.4901161193847656e-06, 1.5497207641601562e-06, 1.6093254089355469e-06, 1.6689300537109375e-06, 1.7285346984863281e-06, 1.7881393432617188e-06, 1.8477439880371094e-06, 1.9073486328125e-06, 1.9669532775878906e-06, 2.0265579223632812e-06, 2.086162567138672e-06, 2.1457672119140625e-06, 2.205371856689453e-06, 2.2649765014648438e-06, 2.3245811462402344e-06, 2.384185791015625e-06, 2.4437904357910156e-06, 2.5033950805664062e-06, 2.562999725341797e-06, 2.6226043701171875e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 2.0, 2.0, 4.0, 17.0, 17.0, 27.0, 27.0, 41.0, 74.0, 91.0, 94.0, 147.0, 206.0, 315.0, 416.0, 628.0, 925.0, 1172.0, 1758.0, 2562.0, 3815.0, 6016.0, 9907.0, 21196.0, 548224.0, 401435.0, 21188.0, 9925.0, 5927.0, 3877.0, 2494.0, 1837.0, 1198.0, 874.0, 609.0, 442.0, 303.0, 226.0, 140.0, 101.0, 96.0, 60.0, 38.0, 24.0, 23.0, 19.0, 10.0, 7.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033447265625, -0.03236818313598633, -0.031289100646972656, -0.030210018157958984, -0.029130935668945312, -0.02805185317993164, -0.02697277069091797, -0.025893688201904297, -0.024814605712890625, -0.023735523223876953, -0.02265644073486328, -0.02157735824584961, -0.020498275756835938, -0.019419193267822266, -0.018340110778808594, -0.017261028289794922, -0.01618194580078125, -0.015102863311767578, -0.014023780822753906, -0.012944698333740234, -0.011865615844726562, -0.01078653335571289, -0.009707450866699219, -0.008628368377685547, -0.007549285888671875, -0.006470203399658203, -0.005391120910644531, -0.004312038421630859, -0.0032329559326171875, -0.0021538734436035156, -0.0010747909545898438, 4.291534423828125e-06, 0.0010833740234375, 0.002162456512451172, 0.0032415390014648438, 0.004320621490478516, 0.0053997039794921875, 0.006478786468505859, 0.007557868957519531, 0.008636951446533203, 0.009716033935546875, 0.010795116424560547, 0.011874198913574219, 0.01295328140258789, 0.014032363891601562, 0.015111446380615234, 0.016190528869628906, 0.017269611358642578, 0.01834869384765625, 0.019427776336669922, 0.020506858825683594, 0.021585941314697266, 0.022665023803710938, 0.02374410629272461, 0.02482318878173828, 0.025902271270751953, 0.026981353759765625, 0.028060436248779297, 0.02913951873779297, 0.03021860122680664, 0.03129768371582031, 0.032376766204833984, 0.033455848693847656, 0.03453493118286133, 0.035614013671875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 7.0, 12.0, 10.0, 40.0, 493.0, 292.0, 28.0, 22.0, 13.0, 6.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01102447509765625, -0.010689973831176758, -0.010355472564697266, -0.010020971298217773, -0.009686470031738281, -0.009351968765258789, -0.009017467498779297, -0.008682966232299805, -0.008348464965820312, -0.00801396369934082, -0.007679462432861328, -0.007344961166381836, -0.007010459899902344, -0.0066759586334228516, -0.006341457366943359, -0.006006956100463867, -0.005672454833984375, -0.005337953567504883, -0.005003452301025391, -0.0046689510345458984, -0.004334449768066406, -0.003999948501586914, -0.003665447235107422, -0.0033309459686279297, -0.0029964447021484375, -0.0026619434356689453, -0.002327442169189453, -0.001992940902709961, -0.0016584396362304688, -0.0013239383697509766, -0.0009894371032714844, -0.0006549358367919922, -0.0003204345703125, 1.4066696166992188e-05, 0.0003485679626464844, 0.0006830692291259766, 0.0010175704956054688, 0.001352071762084961, 0.0016865730285644531, 0.0020210742950439453, 0.0023555755615234375, 0.0026900768280029297, 0.003024578094482422, 0.003359079360961914, 0.0036935806274414062, 0.0040280818939208984, 0.004362583160400391, 0.004697084426879883, 0.005031585693359375, 0.005366086959838867, 0.005700588226318359, 0.0060350894927978516, 0.006369590759277344, 0.006704092025756836, 0.007038593292236328, 0.00737309455871582, 0.0077075958251953125, 0.008042097091674805, 0.008376598358154297, 0.008711099624633789, 0.009045600891113281, 0.009380102157592773, 0.009714603424072266, 0.010049104690551758, 0.01038360595703125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 16.0, 18.0, 19.0, 18.0, 36.0, 31.0, 53.0, 79.0, 106.0, 106.0, 113.0, 83.0, 72.0, 51.0, 42.0, 27.0, 33.0, 19.0, 13.0, 14.0, 4.0, 6.0, 13.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.145944744348526, -0.14200077950954437, -0.13805681467056274, -0.13411284983158112, -0.1301688849925995, -0.12622492015361786, -0.12228095531463623, -0.1183369904756546, -0.11439302563667297, -0.11044906079769135, -0.10650509595870972, -0.10256113111972809, -0.09861716628074646, -0.09467320144176483, -0.0907292366027832, -0.08678527176380157, -0.08284130692481995, -0.07889734208583832, -0.07495337724685669, -0.07100941240787506, -0.06706544756889343, -0.0631214827299118, -0.059177517890930176, -0.05523355305194855, -0.05128958821296692, -0.04734562337398529, -0.04340165853500366, -0.039457693696022034, -0.035513728857040405, -0.03156976401805878, -0.02762579917907715, -0.02368183434009552, -0.019737862050533295, -0.015793897211551666, -0.011849932372570038, -0.00790596753358841, -0.003962002694606781, -1.8037855625152588e-05, 0.003925926983356476, 0.007869891822338104, 0.011813856661319733, 0.01575782150030136, 0.01970178633928299, 0.023645751178264618, 0.027589716017246246, 0.031533680856227875, 0.0354776456952095, 0.03942161053419113, 0.04336557537317276, 0.04730954021215439, 0.05125350505113602, 0.055197469890117645, 0.059141434729099274, 0.0630853995680809, 0.06702936440706253, 0.07097332924604416, 0.07491729408502579, 0.07886125892400742, 0.08280522376298904, 0.08674918860197067, 0.0906931534409523, 0.09463711827993393, 0.09858108311891556, 0.10252504795789719, 0.10646901279687881]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 5.0, 7.0, 9.0, 15.0, 17.0, 13.0, 22.0, 22.0, 24.0, 35.0, 20.0, 36.0, 34.0, 42.0, 35.0, 36.0, 34.0, 43.0, 32.0, 42.0, 48.0, 43.0, 28.0, 45.0, 28.0, 34.0, 29.0, 20.0, 31.0, 20.0, 21.0, 17.0, 17.0, 19.0, 12.0, 12.0, 9.0, 7.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.06962723284959793, -0.06739553809165955, -0.06516385078430176, -0.06293215602636337, -0.060700464993715286, -0.0584687739610672, -0.056237079203128815, -0.05400538817048073, -0.05177369713783264, -0.049542006105184555, -0.04731031134724617, -0.045078620314598083, -0.04284692928195, -0.04061523824930191, -0.038383543491363525, -0.03615185245871544, -0.033920157700777054, -0.03168846666812897, -0.02945677377283573, -0.027225080877542496, -0.02499338984489441, -0.022761696949601173, -0.020530004054307938, -0.01829831302165985, -0.016066620126366615, -0.013834928162395954, -0.011603236198425293, -0.009371543303132057, -0.007139851339161396, -0.004908159375190735, -0.002676466479897499, -0.0004447745159268379, 0.0017869174480438232, 0.004018609412014484, 0.006250301841646433, 0.008481994271278381, 0.010713686235249043, 0.012945378199219704, 0.01517707109451294, 0.017408762127161026, 0.019640455022454262, 0.021872147917747498, 0.024103838950395584, 0.02633553184568882, 0.028567224740982056, 0.030798915773630142, 0.03303060680627823, 0.035262301564216614, 0.0374939925968647, 0.03972568362951279, 0.04195737838745117, 0.04418906942009926, 0.046420760452747345, 0.04865245521068573, 0.050884146243333817, 0.0531158372759819, 0.05534753203392029, 0.057579223066568375, 0.05981091782450676, 0.062042608857154846, 0.06427430361509323, 0.06650599092245102, 0.0687376856803894, 0.07096938043832779, 0.07320106774568558]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 7.0, 20.0, 17.0, 38.0, 48.0, 67.0, 103.0, 160.0, 196.0, 336.0, 508.0, 767.0, 1131.0, 1605.0, 2481.0, 3761.0, 5748.0, 8795.0, 13722.0, 22019.0, 36605.0, 62027.0, 112830.0, 233546.0, 691462.0, 1717806.0, 741250.0, 241729.0, 119969.0, 66840.0, 39569.0, 24144.0, 15030.0, 9798.0, 6512.0, 4298.0, 2787.0, 1988.0, 1362.0, 906.0, 648.0, 461.0, 352.0, 237.0, 171.0, 141.0, 83.0, 69.0, 55.0, 24.0, 17.0, 15.0, 8.0, 10.0, 4.0, 4.0, 3.0], "bins": [-0.0975341796875, -0.09453678131103516, -0.09153938293457031, -0.08854198455810547, -0.08554458618164062, -0.08254718780517578, -0.07954978942871094, -0.0765523910522461, -0.07355499267578125, -0.0705575942993164, -0.06756019592285156, -0.06456279754638672, -0.061565399169921875, -0.05856800079345703, -0.05557060241699219, -0.052573204040527344, -0.0495758056640625, -0.046578407287597656, -0.04358100891113281, -0.04058361053466797, -0.037586212158203125, -0.03458881378173828, -0.03159141540527344, -0.028594017028808594, -0.02559661865234375, -0.022599220275878906, -0.019601821899414062, -0.01660442352294922, -0.013607025146484375, -0.010609626770019531, -0.0076122283935546875, -0.004614830017089844, -0.001617431640625, 0.0013799667358398438, 0.0043773651123046875, 0.007374763488769531, 0.010372161865234375, 0.013369560241699219, 0.016366958618164062, 0.019364356994628906, 0.02236175537109375, 0.025359153747558594, 0.028356552124023438, 0.03135395050048828, 0.034351348876953125, 0.03734874725341797, 0.04034614562988281, 0.043343544006347656, 0.0463409423828125, 0.049338340759277344, 0.05233573913574219, 0.05533313751220703, 0.058330535888671875, 0.06132793426513672, 0.06432533264160156, 0.0673227310180664, 0.07032012939453125, 0.0733175277709961, 0.07631492614746094, 0.07931232452392578, 0.08230972290039062, 0.08530712127685547, 0.08830451965332031, 0.09130191802978516, 0.09429931640625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 7.0, 6.0, 9.0, 10.0, 11.0, 15.0, 22.0, 23.0, 20.0, 37.0, 31.0, 43.0, 21.0, 49.0, 46.0, 40.0, 51.0, 43.0, 38.0, 45.0, 42.0, 42.0, 30.0, 35.0, 37.0, 48.0, 21.0, 28.0, 21.0, 17.0, 20.0, 14.0, 18.0, 8.0, 10.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046966552734375, -0.04551553726196289, -0.04406452178955078, -0.04261350631713867, -0.04116249084472656, -0.03971147537231445, -0.038260459899902344, -0.036809444427490234, -0.035358428955078125, -0.033907413482666016, -0.032456398010253906, -0.031005382537841797, -0.029554367065429688, -0.028103351593017578, -0.02665233612060547, -0.02520132064819336, -0.02375030517578125, -0.02229928970336914, -0.02084827423095703, -0.019397258758544922, -0.017946243286132812, -0.016495227813720703, -0.015044212341308594, -0.013593196868896484, -0.012142181396484375, -0.010691165924072266, -0.009240150451660156, -0.007789134979248047, -0.0063381195068359375, -0.004887104034423828, -0.0034360885620117188, -0.0019850730895996094, -0.0005340576171875, 0.0009169578552246094, 0.0023679733276367188, 0.003818988800048828, 0.0052700042724609375, 0.006721019744873047, 0.008172035217285156, 0.009623050689697266, 0.011074066162109375, 0.012525081634521484, 0.013976097106933594, 0.015427112579345703, 0.016878128051757812, 0.018329143524169922, 0.01978015899658203, 0.02123117446899414, 0.02268218994140625, 0.02413320541381836, 0.02558422088623047, 0.027035236358642578, 0.028486251831054688, 0.029937267303466797, 0.031388282775878906, 0.032839298248291016, 0.034290313720703125, 0.035741329193115234, 0.037192344665527344, 0.03864336013793945, 0.04009437561035156, 0.04154539108276367, 0.04299640655517578, 0.04444742202758789, 0.0458984375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 7.0, 11.0, 12.0, 13.0, 30.0, 39.0, 55.0, 87.0, 124.0, 195.0, 280.0, 356.0, 581.0, 874.0, 1247.0, 1877.0, 2718.0, 4245.0, 6464.0, 9780.0, 15426.0, 23939.0, 38498.0, 63745.0, 108837.0, 194450.0, 380632.0, 877534.0, 1299523.0, 543932.0, 263314.0, 141957.0, 81345.0, 48432.0, 29786.0, 18861.0, 11946.0, 7804.0, 4974.0, 3372.0, 2246.0, 1520.0, 1033.0, 692.0, 500.0, 314.0, 236.0, 148.0, 98.0, 75.0, 39.0, 35.0, 25.0, 11.0, 7.0, 11.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.06768798828125, -0.06558799743652344, -0.06348800659179688, -0.06138801574707031, -0.05928802490234375, -0.05718803405761719, -0.055088043212890625, -0.05298805236816406, -0.0508880615234375, -0.04878807067871094, -0.046688079833984375, -0.04458808898925781, -0.04248809814453125, -0.04038810729980469, -0.038288116455078125, -0.03618812561035156, -0.034088134765625, -0.03198814392089844, -0.029888153076171875, -0.027788162231445312, -0.02568817138671875, -0.023588180541992188, -0.021488189697265625, -0.019388198852539062, -0.0172882080078125, -0.015188217163085938, -0.013088226318359375, -0.010988235473632812, -0.00888824462890625, -0.0067882537841796875, -0.004688262939453125, -0.0025882720947265625, -0.00048828125, 0.0016117095947265625, 0.003711700439453125, 0.0058116912841796875, 0.00791168212890625, 0.010011672973632812, 0.012111663818359375, 0.014211654663085938, 0.0163116455078125, 0.018411636352539062, 0.020511627197265625, 0.022611618041992188, 0.02471160888671875, 0.026811599731445312, 0.028911590576171875, 0.031011581420898438, 0.033111572265625, 0.03521156311035156, 0.037311553955078125, 0.03941154479980469, 0.04151153564453125, 0.04361152648925781, 0.045711517333984375, 0.04781150817871094, 0.0499114990234375, 0.05201148986816406, 0.054111480712890625, 0.05621147155761719, 0.05831146240234375, 0.06041145324707031, 0.06251144409179688, 0.06461143493652344, 0.06671142578125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 3.0, 7.0, 7.0, 12.0, 15.0, 11.0, 15.0, 37.0, 33.0, 43.0, 55.0, 71.0, 64.0, 105.0, 150.0, 128.0, 156.0, 156.0, 205.0, 233.0, 227.0, 282.0, 282.0, 266.0, 246.0, 180.0, 195.0, 149.0, 150.0, 90.0, 77.0, 73.0, 72.0, 47.0, 53.0, 38.0, 26.0, 27.0, 21.0, 13.0, 13.0, 10.0, 11.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0221099853515625, -0.02139878273010254, -0.020687580108642578, -0.019976377487182617, -0.019265174865722656, -0.018553972244262695, -0.017842769622802734, -0.017131567001342773, -0.016420364379882812, -0.01570916175842285, -0.01499795913696289, -0.01428675651550293, -0.013575553894042969, -0.012864351272583008, -0.012153148651123047, -0.011441946029663086, -0.010730743408203125, -0.010019540786743164, -0.009308338165283203, -0.008597135543823242, -0.007885932922363281, -0.00717473030090332, -0.006463527679443359, -0.0057523250579833984, -0.0050411224365234375, -0.0043299198150634766, -0.0036187171936035156, -0.0029075145721435547, -0.0021963119506835938, -0.0014851093292236328, -0.0007739067077636719, -6.270408630371094e-05, 0.00064849853515625, 0.001359701156616211, 0.002070903778076172, 0.002782106399536133, 0.0034933090209960938, 0.004204511642456055, 0.004915714263916016, 0.0056269168853759766, 0.0063381195068359375, 0.0070493221282958984, 0.007760524749755859, 0.00847172737121582, 0.009182929992675781, 0.009894132614135742, 0.010605335235595703, 0.011316537857055664, 0.012027740478515625, 0.012738943099975586, 0.013450145721435547, 0.014161348342895508, 0.014872550964355469, 0.01558375358581543, 0.01629495620727539, 0.01700615882873535, 0.017717361450195312, 0.018428564071655273, 0.019139766693115234, 0.019850969314575195, 0.020562171936035156, 0.021273374557495117, 0.021984577178955078, 0.02269577980041504, 0.023406982421875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 5.0, 14.0, 36.0, 33.0, 34.0, 43.0, 67.0, 83.0, 113.0, 111.0, 104.0, 57.0, 65.0, 40.0, 39.0, 18.0, 24.0, 19.0, 21.0, 12.0, 11.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0841507539153099, -0.08156321197748184, -0.07897566258907318, -0.07638812065124512, -0.07380057126283646, -0.07121302932500839, -0.06862547993659973, -0.06603793799877167, -0.063450388610363, -0.060862842947244644, -0.05827529728412628, -0.05568775162100792, -0.05310020595788956, -0.050512660294771194, -0.04792511463165283, -0.04533757269382477, -0.042750027030706406, -0.04016248136758804, -0.03757493570446968, -0.03498739004135132, -0.032399844378232956, -0.029812298715114594, -0.02722475491464138, -0.024637209251523018, -0.022049663588404655, -0.019462117925286293, -0.01687457226216793, -0.014287027530372143, -0.01169948186725378, -0.009111936204135418, -0.00652439147233963, -0.003936845809221268, -0.0013493001461029053, 0.0012382452841848135, 0.0038257907144725323, 0.006413335911929607, 0.00900088157504797, 0.011588427238166332, 0.01417597196996212, 0.016763517633080482, 0.019351063296198845, 0.021938608959317207, 0.02452615462243557, 0.027113698422908783, 0.029701244086027145, 0.03228878974914551, 0.03487633541226387, 0.03746388107538223, 0.040051426738500595, 0.04263897240161896, 0.04522651806473732, 0.04781406372785568, 0.050401609390974045, 0.05298915505409241, 0.05557669699192047, 0.05816424638032913, 0.060751788318157196, 0.06333933025598526, 0.06592687964439392, 0.06851442158222198, 0.07110197097063065, 0.07368951290845871, 0.07627706229686737, 0.07886460423469543, 0.0814521536231041]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 7.0, 11.0, 12.0, 16.0, 15.0, 19.0, 16.0, 20.0, 22.0, 21.0, 35.0, 27.0, 41.0, 34.0, 34.0, 31.0, 34.0, 36.0, 48.0, 37.0, 38.0, 31.0, 27.0, 39.0, 36.0, 30.0, 29.0, 27.0, 29.0, 29.0, 23.0, 18.0, 10.0, 21.0, 17.0, 12.0, 5.0, 13.0, 10.0, 2.0, 9.0, 7.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.04850662872195244, -0.04713018238544464, -0.045753732323646545, -0.04437728598713875, -0.04300083592534065, -0.041624389588832855, -0.04024793952703476, -0.03887149319052696, -0.037495046854019165, -0.03611860051751137, -0.03474215045571327, -0.033365704119205475, -0.03198925405740738, -0.030612807720899582, -0.029236359521746635, -0.02785991132259369, -0.026483461260795593, -0.025107013061642647, -0.0237305648624897, -0.022354118525981903, -0.020977668464183807, -0.01960122212767601, -0.018224773928523064, -0.016848325729370117, -0.01547187753021717, -0.014095429331064224, -0.012718981131911278, -0.011342533864080906, -0.00996608566492796, -0.008589637465775013, -0.007213190197944641, -0.005836741998791695, -0.004460293799638748, -0.0030838458333164454, -0.0017073978669941425, -0.00033095013350248337, 0.001045498065650463, 0.0024219462648034096, 0.0037983935326337814, 0.005174841731786728, 0.006551289930939674, 0.00792773813009262, 0.009304186329245567, 0.01068063359707594, 0.012057081796228886, 0.013433529995381832, 0.014809977263212204, 0.01618642546236515, 0.017562873661518097, 0.018939321860671043, 0.02031577005982399, 0.021692216396331787, 0.023068666458129883, 0.02444511279463768, 0.025821560993790627, 0.027198009192943573, 0.02857445739209652, 0.029950905591249466, 0.03132735192775726, 0.03270380198955536, 0.034080248326063156, 0.03545669838786125, 0.03683314472436905, 0.038209594786167145, 0.03958604112267494]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 9.0, 14.0, 22.0, 29.0, 43.0, 58.0, 85.0, 134.0, 188.0, 276.0, 412.0, 657.0, 985.0, 1491.0, 2245.0, 3632.0, 5556.0, 9031.0, 14299.0, 23449.0, 40254.0, 73565.0, 156883.0, 351654.0, 175235.0, 79085.0, 43113.0, 24875.0, 14931.0, 9658.0, 5867.0, 3793.0, 2429.0, 1529.0, 1030.0, 661.0, 463.0, 275.0, 207.0, 136.0, 91.0, 69.0, 53.0, 30.0, 12.0, 9.0, 12.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.04278564453125, -0.04147148132324219, -0.040157318115234375, -0.03884315490722656, -0.03752899169921875, -0.03621482849121094, -0.034900665283203125, -0.03358650207519531, -0.0322723388671875, -0.030958175659179688, -0.029644012451171875, -0.028329849243164062, -0.02701568603515625, -0.025701522827148438, -0.024387359619140625, -0.023073196411132812, -0.021759033203125, -0.020444869995117188, -0.019130706787109375, -0.017816543579101562, -0.01650238037109375, -0.015188217163085938, -0.013874053955078125, -0.012559890747070312, -0.0112457275390625, -0.009931564331054688, -0.008617401123046875, -0.0073032379150390625, -0.00598907470703125, -0.0046749114990234375, -0.003360748291015625, -0.0020465850830078125, -0.000732421875, 0.0005817413330078125, 0.001895904541015625, 0.0032100677490234375, 0.00452423095703125, 0.0058383941650390625, 0.007152557373046875, 0.008466720581054688, 0.0097808837890625, 0.011095046997070312, 0.012409210205078125, 0.013723373413085938, 0.01503753662109375, 0.016351699829101562, 0.017665863037109375, 0.018980026245117188, 0.020294189453125, 0.021608352661132812, 0.022922515869140625, 0.024236679077148438, 0.02555084228515625, 0.026865005493164062, 0.028179168701171875, 0.029493331909179688, 0.0308074951171875, 0.03212165832519531, 0.033435821533203125, 0.03474998474121094, 0.03606414794921875, 0.03737831115722656, 0.038692474365234375, 0.04000663757324219, 0.04132080078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 7.0, 7.0, 9.0, 14.0, 14.0, 22.0, 19.0, 21.0, 20.0, 31.0, 31.0, 32.0, 40.0, 36.0, 38.0, 34.0, 38.0, 37.0, 31.0, 40.0, 45.0, 41.0, 42.0, 39.0, 24.0, 29.0, 30.0, 30.0, 28.0, 29.0, 23.0, 19.0, 19.0, 11.0, 10.0, 12.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.053314208984375, -0.05182504653930664, -0.05033588409423828, -0.04884672164916992, -0.04735755920410156, -0.0458683967590332, -0.044379234313964844, -0.042890071868896484, -0.041400909423828125, -0.039911746978759766, -0.038422584533691406, -0.03693342208862305, -0.03544425964355469, -0.03395509719848633, -0.03246593475341797, -0.03097677230834961, -0.02948760986328125, -0.02799844741821289, -0.02650928497314453, -0.025020122528076172, -0.023530960083007812, -0.022041797637939453, -0.020552635192871094, -0.019063472747802734, -0.017574310302734375, -0.016085147857666016, -0.014595985412597656, -0.013106822967529297, -0.011617660522460938, -0.010128498077392578, -0.008639335632324219, -0.007150173187255859, -0.0056610107421875, -0.004171848297119141, -0.0026826858520507812, -0.0011935234069824219, 0.0002956390380859375, 0.0017848014831542969, 0.0032739639282226562, 0.004763126373291016, 0.006252288818359375, 0.007741451263427734, 0.009230613708496094, 0.010719776153564453, 0.012208938598632812, 0.013698101043701172, 0.015187263488769531, 0.01667642593383789, 0.01816558837890625, 0.01965475082397461, 0.02114391326904297, 0.022633075714111328, 0.024122238159179688, 0.025611400604248047, 0.027100563049316406, 0.028589725494384766, 0.030078887939453125, 0.031568050384521484, 0.033057212829589844, 0.0345463752746582, 0.03603553771972656, 0.03752470016479492, 0.03901386260986328, 0.04050302505493164, 0.0419921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 13.0, 11.0, 20.0, 21.0, 24.0, 17.0, 45.0, 70.0, 105.0, 126.0, 152.0, 232.0, 336.0, 402.0, 604.0, 833.0, 1150.0, 1739.0, 2305.0, 3428.0, 5080.0, 7995.0, 14046.0, 27066.0, 69928.0, 597846.0, 217818.0, 44570.0, 20325.0, 11036.0, 6727.0, 4233.0, 2981.0, 2148.0, 1413.0, 1081.0, 762.0, 496.0, 366.0, 286.0, 222.0, 141.0, 98.0, 76.0, 49.0, 35.0, 35.0, 22.0, 16.0, 8.0, 5.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0], "bins": [-0.06890869140625, -0.06680774688720703, -0.06470680236816406, -0.0626058578491211, -0.060504913330078125, -0.058403968811035156, -0.05630302429199219, -0.05420207977294922, -0.05210113525390625, -0.05000019073486328, -0.04789924621582031, -0.045798301696777344, -0.043697357177734375, -0.041596412658691406, -0.03949546813964844, -0.03739452362060547, -0.0352935791015625, -0.03319263458251953, -0.031091690063476562, -0.028990745544433594, -0.026889801025390625, -0.024788856506347656, -0.022687911987304688, -0.02058696746826172, -0.01848602294921875, -0.01638507843017578, -0.014284133911132812, -0.012183189392089844, -0.010082244873046875, -0.007981300354003906, -0.0058803558349609375, -0.0037794113159179688, -0.001678466796875, 0.00042247772216796875, 0.0025234222412109375, 0.004624366760253906, 0.006725311279296875, 0.008826255798339844, 0.010927200317382812, 0.013028144836425781, 0.01512908935546875, 0.01723003387451172, 0.019330978393554688, 0.021431922912597656, 0.023532867431640625, 0.025633811950683594, 0.027734756469726562, 0.02983570098876953, 0.0319366455078125, 0.03403759002685547, 0.03613853454589844, 0.038239479064941406, 0.040340423583984375, 0.042441368103027344, 0.04454231262207031, 0.04664325714111328, 0.04874420166015625, 0.05084514617919922, 0.05294609069824219, 0.055047035217285156, 0.057147979736328125, 0.059248924255371094, 0.06134986877441406, 0.06345081329345703, 0.0655517578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 4.0, 5.0, 10.0, 12.0, 10.0, 10.0, 13.0, 19.0, 19.0, 17.0, 25.0, 24.0, 20.0, 26.0, 37.0, 35.0, 30.0, 46.0, 51.0, 27.0, 50.0, 33.0, 42.0, 49.0, 34.0, 31.0, 37.0, 37.0, 26.0, 26.0, 33.0, 22.0, 21.0, 18.0, 19.0, 18.0, 9.0, 13.0, 5.0, 9.0, 5.0, 3.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03216552734375, -0.031189441680908203, -0.030213356018066406, -0.02923727035522461, -0.028261184692382812, -0.027285099029541016, -0.02630901336669922, -0.025332927703857422, -0.024356842041015625, -0.023380756378173828, -0.02240467071533203, -0.021428585052490234, -0.020452499389648438, -0.01947641372680664, -0.018500328063964844, -0.017524242401123047, -0.01654815673828125, -0.015572071075439453, -0.014595985412597656, -0.01361989974975586, -0.012643814086914062, -0.011667728424072266, -0.010691642761230469, -0.009715557098388672, -0.008739471435546875, -0.007763385772705078, -0.006787300109863281, -0.005811214447021484, -0.0048351287841796875, -0.0038590431213378906, -0.0028829574584960938, -0.0019068717956542969, -0.0009307861328125, 4.5299530029296875e-05, 0.0010213851928710938, 0.0019974708557128906, 0.0029735565185546875, 0.003949642181396484, 0.004925727844238281, 0.005901813507080078, 0.006877899169921875, 0.007853984832763672, 0.008830070495605469, 0.009806156158447266, 0.010782241821289062, 0.01175832748413086, 0.012734413146972656, 0.013710498809814453, 0.01468658447265625, 0.015662670135498047, 0.016638755798339844, 0.01761484146118164, 0.018590927124023438, 0.019567012786865234, 0.02054309844970703, 0.021519184112548828, 0.022495269775390625, 0.023471355438232422, 0.02444744110107422, 0.025423526763916016, 0.026399612426757812, 0.02737569808959961, 0.028351783752441406, 0.029327869415283203, 0.030303955078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 10.0, 10.0, 12.0, 9.0, 21.0, 25.0, 35.0, 52.0, 75.0, 94.0, 138.0, 200.0, 253.0, 470.0, 653.0, 1091.0, 1844.0, 3213.0, 6180.0, 14754.0, 52389.0, 789888.0, 133710.0, 24005.0, 9061.0, 4310.0, 2276.0, 1339.0, 847.0, 509.0, 334.0, 218.0, 165.0, 101.0, 76.0, 53.0, 40.0, 18.0, 22.0, 17.0, 7.0, 11.0, 10.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01611328125, -0.015588760375976562, -0.015064239501953125, -0.014539718627929688, -0.01401519775390625, -0.013490676879882812, -0.012966156005859375, -0.012441635131835938, -0.0119171142578125, -0.011392593383789062, -0.010868072509765625, -0.010343551635742188, -0.00981903076171875, -0.009294509887695312, -0.008769989013671875, -0.008245468139648438, -0.007720947265625, -0.0071964263916015625, -0.006671905517578125, -0.0061473846435546875, -0.00562286376953125, -0.0050983428955078125, -0.004573822021484375, -0.0040493011474609375, -0.0035247802734375, -0.0030002593994140625, -0.002475738525390625, -0.0019512176513671875, -0.00142669677734375, -0.0009021759033203125, -0.000377655029296875, 0.0001468658447265625, 0.00067138671875, 0.0011959075927734375, 0.001720428466796875, 0.0022449493408203125, 0.00276947021484375, 0.0032939910888671875, 0.003818511962890625, 0.0043430328369140625, 0.0048675537109375, 0.0053920745849609375, 0.005916595458984375, 0.0064411163330078125, 0.00696563720703125, 0.0074901580810546875, 0.008014678955078125, 0.008539199829101562, 0.009063720703125, 0.009588241577148438, 0.010112762451171875, 0.010637283325195312, 0.01116180419921875, 0.011686325073242188, 0.012210845947265625, 0.012735366821289062, 0.0132598876953125, 0.013784408569335938, 0.014308929443359375, 0.014833450317382812, 0.01535797119140625, 0.015882492065429688, 0.016407012939453125, 0.016931533813476562, 0.0174560546875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 1.0, 7.0, 6.0, 5.0, 7.0, 10.0, 19.0, 24.0, 28.0, 25.0, 28.0, 49.0, 49.0, 51.0, 62.0, 67.0, 69.0, 84.0, 0.0, 79.0, 57.0, 55.0, 43.0, 40.0, 30.0, 19.0, 17.0, 19.0, 8.0, 8.0, 7.0, 6.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6707926988601685e-06, -1.6130506992340088e-06, -1.5553086996078491e-06, -1.4975666999816895e-06, -1.4398247003555298e-06, -1.3820827007293701e-06, -1.3243407011032104e-06, -1.2665987014770508e-06, -1.2088567018508911e-06, -1.1511147022247314e-06, -1.0933727025985718e-06, -1.0356307029724121e-06, -9.778887033462524e-07, -9.201467037200928e-07, -8.624047040939331e-07, -8.046627044677734e-07, -7.469207048416138e-07, -6.891787052154541e-07, -6.314367055892944e-07, -5.736947059631348e-07, -5.159527063369751e-07, -4.5821070671081543e-07, -4.0046870708465576e-07, -3.427267074584961e-07, -2.849847078323364e-07, -2.2724270820617676e-07, -1.695007085800171e-07, -1.1175870895385742e-07, -5.4016709327697754e-08, 3.725290298461914e-09, 6.146728992462158e-08, 1.1920928955078125e-07, 1.7695128917694092e-07, 2.3469328880310059e-07, 2.9243528842926025e-07, 3.501772880554199e-07, 4.079192876815796e-07, 4.6566128730773926e-07, 5.234032869338989e-07, 5.811452865600586e-07, 6.388872861862183e-07, 6.966292858123779e-07, 7.543712854385376e-07, 8.121132850646973e-07, 8.698552846908569e-07, 9.275972843170166e-07, 9.853392839431763e-07, 1.043081283569336e-06, 1.1008232831954956e-06, 1.1585652828216553e-06, 1.216307282447815e-06, 1.2740492820739746e-06, 1.3317912817001343e-06, 1.389533281326294e-06, 1.4472752809524536e-06, 1.5050172805786133e-06, 1.562759280204773e-06, 1.6205012798309326e-06, 1.6782432794570923e-06, 1.735985279083252e-06, 1.7937272787094116e-06, 1.8514692783355713e-06, 1.909211277961731e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 18.0, 19.0, 32.0, 49.0, 52.0, 86.0, 122.0, 186.0, 258.0, 343.0, 521.0, 698.0, 1136.0, 1690.0, 2466.0, 4161.0, 7411.0, 14531.0, 33325.0, 110807.0, 641404.0, 151240.0, 40109.0, 16696.0, 8222.0, 4570.0, 2742.0, 1779.0, 1194.0, 784.0, 572.0, 380.0, 289.0, 194.0, 136.0, 101.0, 61.0, 44.0, 32.0, 26.0, 22.0, 14.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0135955810546875, -0.01316523551940918, -0.01273488998413086, -0.012304544448852539, -0.011874198913574219, -0.011443853378295898, -0.011013507843017578, -0.010583162307739258, -0.010152816772460938, -0.009722471237182617, -0.009292125701904297, -0.008861780166625977, -0.008431434631347656, -0.008001089096069336, -0.007570743560791016, -0.007140398025512695, -0.006710052490234375, -0.006279706954956055, -0.005849361419677734, -0.005419015884399414, -0.004988670349121094, -0.0045583248138427734, -0.004127979278564453, -0.003697633743286133, -0.0032672882080078125, -0.002836942672729492, -0.002406597137451172, -0.0019762516021728516, -0.0015459060668945312, -0.001115560531616211, -0.0006852149963378906, -0.0002548694610595703, 0.00017547607421875, 0.0006058216094970703, 0.0010361671447753906, 0.001466512680053711, 0.0018968582153320312, 0.0023272037506103516, 0.002757549285888672, 0.003187894821166992, 0.0036182403564453125, 0.004048585891723633, 0.004478931427001953, 0.0049092769622802734, 0.005339622497558594, 0.005769968032836914, 0.006200313568115234, 0.006630659103393555, 0.007061004638671875, 0.007491350173950195, 0.007921695709228516, 0.008352041244506836, 0.008782386779785156, 0.009212732315063477, 0.009643077850341797, 0.010073423385620117, 0.010503768920898438, 0.010934114456176758, 0.011364459991455078, 0.011794805526733398, 0.012225151062011719, 0.012655496597290039, 0.01308584213256836, 0.01351618766784668, 0.013946533203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 6.0, 9.0, 9.0, 20.0, 35.0, 37.0, 76.0, 164.0, 282.0, 136.0, 81.0, 47.0, 28.0, 15.0, 22.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006641387939453125, -0.006463825702667236, -0.006286263465881348, -0.006108701229095459, -0.00593113899230957, -0.005753576755523682, -0.005576014518737793, -0.005398452281951904, -0.005220890045166016, -0.005043327808380127, -0.004865765571594238, -0.00468820333480835, -0.004510641098022461, -0.004333078861236572, -0.004155516624450684, -0.003977954387664795, -0.0038003921508789062, -0.0036228299140930176, -0.003445267677307129, -0.0032677054405212402, -0.0030901432037353516, -0.002912580966949463, -0.0027350187301635742, -0.0025574564933776855, -0.002379894256591797, -0.002202332019805908, -0.0020247697830200195, -0.0018472075462341309, -0.0016696453094482422, -0.0014920830726623535, -0.0013145208358764648, -0.0011369585990905762, -0.0009593963623046875, -0.0007818341255187988, -0.0006042718887329102, -0.0004267096519470215, -0.0002491474151611328, -7.158517837524414e-05, 0.00010597705841064453, 0.0002835392951965332, 0.0004611015319824219, 0.0006386637687683105, 0.0008162260055541992, 0.0009937882423400879, 0.0011713504791259766, 0.0013489127159118652, 0.001526474952697754, 0.0017040371894836426, 0.0018815994262695312, 0.00205916166305542, 0.0022367238998413086, 0.0024142861366271973, 0.002591848373413086, 0.0027694106101989746, 0.0029469728469848633, 0.003124535083770752, 0.0033020973205566406, 0.0034796595573425293, 0.003657221794128418, 0.0038347840309143066, 0.004012346267700195, 0.004189908504486084, 0.004367470741271973, 0.004545032978057861, 0.00472259521484375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 4.0, 8.0, 8.0, 7.0, 11.0, 15.0, 21.0, 42.0, 33.0, 45.0, 64.0, 76.0, 116.0, 109.0, 110.0, 63.0, 58.0, 42.0, 41.0, 23.0, 23.0, 18.0, 17.0, 13.0, 7.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08309037238359451, -0.08054132014513016, -0.0779922679066658, -0.07544320821762085, -0.0728941559791565, -0.07034510374069214, -0.06779605150222778, -0.06524699926376343, -0.06269793957471848, -0.06014888733625412, -0.057599831372499466, -0.05505077913403511, -0.05250172317028046, -0.0499526709318161, -0.047403618693351746, -0.04485456272959709, -0.042305510491132736, -0.03975645825266838, -0.03720740228891373, -0.03465835005044937, -0.03210929408669472, -0.029560241848230362, -0.027011187747120857, -0.024462133646011353, -0.021913079544901848, -0.019364025443792343, -0.01681497134268284, -0.014265918172895908, -0.011716864071786404, -0.009167809970676899, -0.006618756800889969, -0.004069702699780464, -0.0015206485986709595, 0.0010284052696079016, 0.0035774591378867626, 0.00612651277333498, 0.008675566874444485, 0.01122462097555399, 0.01377367414534092, 0.016322728246450424, 0.01887178234755993, 0.021420836448669434, 0.02396989054977894, 0.026518944650888443, 0.0290679968893528, 0.03161705285310745, 0.03416610509157181, 0.03671515733003616, 0.03926421329379082, 0.04181326553225517, 0.04436232149600983, 0.04691137373447418, 0.049460429698228836, 0.05200948193669319, 0.054558537900447845, 0.0571075901389122, 0.059656642377376556, 0.06220569461584091, 0.06475474685430527, 0.06730380654335022, 0.06985285878181458, 0.07240191102027893, 0.07495096325874329, 0.07750001549720764, 0.0800490751862526]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 14.0, 13.0, 15.0, 19.0, 18.0, 23.0, 21.0, 18.0, 37.0, 26.0, 35.0, 37.0, 36.0, 24.0, 42.0, 30.0, 49.0, 36.0, 40.0, 34.0, 33.0, 36.0, 35.0, 31.0, 20.0, 32.0, 32.0, 25.0, 24.0, 21.0, 12.0, 18.0, 16.0, 14.0, 6.0, 12.0, 6.0, 8.0, 8.0, 7.0, 2.0, 1.0, 4.0, 3.0, 0.0, 4.0], "bins": [-0.04802699387073517, -0.046669792383909225, -0.04531259462237358, -0.04395539313554764, -0.04259819537401199, -0.04124099388718605, -0.03988379240036011, -0.03852659463882446, -0.03716939687728882, -0.035812195390462875, -0.03445499762892723, -0.03309779614210129, -0.03174059838056564, -0.0303833968937397, -0.029026197269558907, -0.027668997645378113, -0.02631179615855217, -0.024954596534371376, -0.023597396910190582, -0.02224019542336464, -0.020882997661828995, -0.019525796175003052, -0.018168596550822258, -0.016811396926641464, -0.01545419730246067, -0.014096997678279877, -0.012739798054099083, -0.011382597498595715, -0.01002539787441492, -0.008668198250234127, -0.007310997694730759, -0.005953798070549965, -0.004596598446369171, -0.0032393985893577337, -0.0018821987323462963, -0.0005249986425042152, 0.0008322009816765785, 0.0021894006058573723, 0.0035466011613607407, 0.004903800785541534, 0.006261000409722328, 0.007618200033903122, 0.008975399658083916, 0.010332600213587284, 0.011689799837768078, 0.013046999461948872, 0.01440420001745224, 0.015761399641633034, 0.017118599265813828, 0.01847579888999462, 0.019832998514175415, 0.021190200001001358, 0.022547397762537003, 0.023904599249362946, 0.02526179887354374, 0.026618998497724533, 0.027976198121905327, 0.02933339774608612, 0.030690597370266914, 0.03204779699444771, 0.03340499848127365, 0.034762196242809296, 0.03611939772963524, 0.03747659921646118, 0.038833796977996826]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 6.0, 8.0, 8.0, 16.0, 20.0, 34.0, 53.0, 72.0, 98.0, 162.0, 237.0, 329.0, 494.0, 672.0, 1012.0, 1511.0, 2255.0, 3443.0, 5034.0, 7904.0, 11917.0, 18486.0, 29381.0, 47827.0, 80739.0, 141791.0, 252644.0, 183487.0, 100467.0, 58899.0, 35640.0, 22076.0, 14319.0, 9238.0, 6003.0, 4104.0, 2609.0, 1795.0, 1194.0, 809.0, 570.0, 364.0, 251.0, 174.0, 136.0, 79.0, 57.0, 48.0, 19.0, 23.0, 16.0, 9.0, 10.0, 5.0, 5.0, 2.0, 1.0], "bins": [-0.0906982421875, -0.08800697326660156, -0.08531570434570312, -0.08262443542480469, -0.07993316650390625, -0.07724189758300781, -0.07455062866210938, -0.07185935974121094, -0.0691680908203125, -0.06647682189941406, -0.06378555297851562, -0.06109428405761719, -0.05840301513671875, -0.05571174621582031, -0.053020477294921875, -0.05032920837402344, -0.047637939453125, -0.04494667053222656, -0.042255401611328125, -0.03956413269042969, -0.03687286376953125, -0.03418159484863281, -0.031490325927734375, -0.028799057006835938, -0.0261077880859375, -0.023416519165039062, -0.020725250244140625, -0.018033981323242188, -0.01534271240234375, -0.012651443481445312, -0.009960174560546875, -0.0072689056396484375, -0.00457763671875, -0.0018863677978515625, 0.000804901123046875, 0.0034961700439453125, 0.00618743896484375, 0.008878707885742188, 0.011569976806640625, 0.014261245727539062, 0.0169525146484375, 0.019643783569335938, 0.022335052490234375, 0.025026321411132812, 0.02771759033203125, 0.030408859252929688, 0.033100128173828125, 0.03579139709472656, 0.038482666015625, 0.04117393493652344, 0.043865203857421875, 0.04655647277832031, 0.04924774169921875, 0.05193901062011719, 0.054630279541015625, 0.05732154846191406, 0.0600128173828125, 0.06270408630371094, 0.06539535522460938, 0.06808662414550781, 0.07077789306640625, 0.07346916198730469, 0.07616043090820312, 0.07885169982910156, 0.08154296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 5.0, 7.0, 10.0, 20.0, 19.0, 24.0, 9.0, 21.0, 20.0, 21.0, 21.0, 43.0, 35.0, 33.0, 34.0, 33.0, 29.0, 44.0, 39.0, 44.0, 45.0, 35.0, 28.0, 39.0, 35.0, 31.0, 30.0, 33.0, 24.0, 28.0, 20.0, 21.0, 19.0, 18.0, 11.0, 7.0, 10.0, 12.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.04443359375, -0.04314279556274414, -0.04185199737548828, -0.04056119918823242, -0.03927040100097656, -0.0379796028137207, -0.036688804626464844, -0.035398006439208984, -0.034107208251953125, -0.032816410064697266, -0.031525611877441406, -0.030234813690185547, -0.028944015502929688, -0.027653217315673828, -0.02636241912841797, -0.02507162094116211, -0.02378082275390625, -0.02249002456665039, -0.02119922637939453, -0.019908428192138672, -0.018617630004882812, -0.017326831817626953, -0.016036033630371094, -0.014745235443115234, -0.013454437255859375, -0.012163639068603516, -0.010872840881347656, -0.009582042694091797, -0.008291244506835938, -0.007000446319580078, -0.005709648132324219, -0.004418849945068359, -0.0031280517578125, -0.0018372535705566406, -0.0005464553833007812, 0.0007443428039550781, 0.0020351409912109375, 0.003325939178466797, 0.004616737365722656, 0.005907535552978516, 0.007198333740234375, 0.008489131927490234, 0.009779930114746094, 0.011070728302001953, 0.012361526489257812, 0.013652324676513672, 0.014943122863769531, 0.01623392105102539, 0.01752471923828125, 0.01881551742553711, 0.02010631561279297, 0.021397113800048828, 0.022687911987304688, 0.023978710174560547, 0.025269508361816406, 0.026560306549072266, 0.027851104736328125, 0.029141902923583984, 0.030432701110839844, 0.0317234992980957, 0.03301429748535156, 0.03430509567260742, 0.03559589385986328, 0.03688669204711914, 0.038177490234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 11.0, 12.0, 11.0, 27.0, 41.0, 36.0, 71.0, 105.0, 139.0, 187.0, 310.0, 425.0, 641.0, 914.0, 1330.0, 1831.0, 2657.0, 3791.0, 5697.0, 8171.0, 12325.0, 18231.0, 28113.0, 43466.0, 70862.0, 122972.0, 232401.0, 203333.0, 108196.0, 63848.0, 39835.0, 26020.0, 16931.0, 11310.0, 7529.0, 5167.0, 3628.0, 2421.0, 1711.0, 1194.0, 819.0, 552.0, 383.0, 274.0, 210.0, 126.0, 102.0, 63.0, 45.0, 28.0, 20.0, 17.0, 9.0, 6.0, 2.0, 9.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07684326171875, -0.0743560791015625, -0.071868896484375, -0.0693817138671875, -0.06689453125, -0.0644073486328125, -0.061920166015625, -0.0594329833984375, -0.05694580078125, -0.0544586181640625, -0.051971435546875, -0.0494842529296875, -0.0469970703125, -0.0445098876953125, -0.042022705078125, -0.0395355224609375, -0.03704833984375, -0.0345611572265625, -0.032073974609375, -0.0295867919921875, -0.027099609375, -0.0246124267578125, -0.022125244140625, -0.0196380615234375, -0.01715087890625, -0.0146636962890625, -0.012176513671875, -0.0096893310546875, -0.0072021484375, -0.0047149658203125, -0.002227783203125, 0.0002593994140625, 0.00274658203125, 0.0052337646484375, 0.007720947265625, 0.0102081298828125, 0.0126953125, 0.0151824951171875, 0.017669677734375, 0.0201568603515625, 0.02264404296875, 0.0251312255859375, 0.027618408203125, 0.0301055908203125, 0.0325927734375, 0.0350799560546875, 0.037567138671875, 0.0400543212890625, 0.04254150390625, 0.0450286865234375, 0.047515869140625, 0.0500030517578125, 0.052490234375, 0.0549774169921875, 0.057464599609375, 0.0599517822265625, 0.06243896484375, 0.0649261474609375, 0.067413330078125, 0.0699005126953125, 0.0723876953125, 0.0748748779296875, 0.077362060546875, 0.0798492431640625, 0.08233642578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 8.0, 9.0, 13.0, 11.0, 7.0, 20.0, 15.0, 16.0, 21.0, 26.0, 24.0, 22.0, 24.0, 31.0, 26.0, 22.0, 28.0, 41.0, 20.0, 37.0, 45.0, 42.0, 32.0, 39.0, 39.0, 32.0, 37.0, 38.0, 28.0, 27.0, 28.0, 17.0, 28.0, 28.0, 21.0, 19.0, 18.0, 13.0, 11.0, 8.0, 6.0, 4.0, 2.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0250396728515625, -0.024225711822509766, -0.02341175079345703, -0.022597789764404297, -0.021783828735351562, -0.020969867706298828, -0.020155906677246094, -0.01934194564819336, -0.018527984619140625, -0.01771402359008789, -0.016900062561035156, -0.016086101531982422, -0.015272140502929688, -0.014458179473876953, -0.013644218444824219, -0.012830257415771484, -0.01201629638671875, -0.011202335357666016, -0.010388374328613281, -0.009574413299560547, -0.008760452270507812, -0.007946491241455078, -0.007132530212402344, -0.006318569183349609, -0.005504608154296875, -0.004690647125244141, -0.0038766860961914062, -0.003062725067138672, -0.0022487640380859375, -0.0014348030090332031, -0.0006208419799804688, 0.00019311904907226562, 0.001007080078125, 0.0018210411071777344, 0.0026350021362304688, 0.003448963165283203, 0.0042629241943359375, 0.005076885223388672, 0.005890846252441406, 0.006704807281494141, 0.007518768310546875, 0.00833272933959961, 0.009146690368652344, 0.009960651397705078, 0.010774612426757812, 0.011588573455810547, 0.012402534484863281, 0.013216495513916016, 0.01403045654296875, 0.014844417572021484, 0.01565837860107422, 0.016472339630126953, 0.017286300659179688, 0.018100261688232422, 0.018914222717285156, 0.01972818374633789, 0.020542144775390625, 0.02135610580444336, 0.022170066833496094, 0.022984027862548828, 0.023797988891601562, 0.024611949920654297, 0.02542591094970703, 0.026239871978759766, 0.0270538330078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 17.0, 11.0, 22.0, 15.0, 31.0, 34.0, 41.0, 67.0, 99.0, 145.0, 197.0, 277.0, 440.0, 697.0, 1159.0, 2087.0, 3937.0, 7622.0, 16049.0, 43339.0, 266025.0, 622205.0, 48128.0, 18089.0, 8038.0, 4090.0, 2185.0, 1269.0, 751.0, 507.0, 284.0, 199.0, 134.0, 95.0, 76.0, 43.0, 48.0, 27.0, 19.0, 10.0, 16.0, 7.0, 7.0, 3.0, 3.0, 0.0, 4.0, 0.0, 5.0, 1.0, 2.0], "bins": [-0.0277252197265625, -0.026911020278930664, -0.026096820831298828, -0.025282621383666992, -0.024468421936035156, -0.02365422248840332, -0.022840023040771484, -0.02202582359313965, -0.021211624145507812, -0.020397424697875977, -0.01958322525024414, -0.018769025802612305, -0.01795482635498047, -0.017140626907348633, -0.016326427459716797, -0.015512228012084961, -0.014698028564453125, -0.013883829116821289, -0.013069629669189453, -0.012255430221557617, -0.011441230773925781, -0.010627031326293945, -0.00981283187866211, -0.008998632431030273, -0.008184432983398438, -0.0073702335357666016, -0.006556034088134766, -0.00574183464050293, -0.004927635192871094, -0.004113435745239258, -0.003299236297607422, -0.002485036849975586, -0.00167083740234375, -0.0008566379547119141, -4.2438507080078125e-05, 0.0007717609405517578, 0.0015859603881835938, 0.0024001598358154297, 0.0032143592834472656, 0.0040285587310791016, 0.0048427581787109375, 0.0056569576263427734, 0.006471157073974609, 0.007285356521606445, 0.008099555969238281, 0.008913755416870117, 0.009727954864501953, 0.010542154312133789, 0.011356353759765625, 0.012170553207397461, 0.012984752655029297, 0.013798952102661133, 0.014613151550292969, 0.015427350997924805, 0.01624155044555664, 0.017055749893188477, 0.017869949340820312, 0.01868414878845215, 0.019498348236083984, 0.02031254768371582, 0.021126747131347656, 0.021940946578979492, 0.022755146026611328, 0.023569345474243164, 0.024383544921875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 10.0, 3.0, 0.0, 10.0, 14.0, 20.0, 0.0, 19.0, 29.0, 30.0, 0.0, 58.0, 66.0, 76.0, 0.0, 94.0, 111.0, 113.0, 0.0, 78.0, 59.0, 53.0, 0.0, 40.0, 32.0, 19.0, 0.0, 22.0, 7.0, 9.0, 0.0, 10.0, 6.0, 5.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1324882507324219e-06, -1.087784767150879e-06, -1.043081283569336e-06, -9.98377799987793e-07, -9.5367431640625e-07, -9.08970832824707e-07, -8.642673492431641e-07, -8.195638656616211e-07, -7.748603820800781e-07, -7.301568984985352e-07, -6.854534149169922e-07, -6.407499313354492e-07, -5.960464477539062e-07, -5.513429641723633e-07, -5.066394805908203e-07, -4.6193599700927734e-07, -4.172325134277344e-07, -3.725290298461914e-07, -3.2782554626464844e-07, -2.8312206268310547e-07, -2.384185791015625e-07, -1.9371509552001953e-07, -1.4901161193847656e-07, -1.043081283569336e-07, -5.960464477539063e-08, -1.4901161193847656e-08, 2.9802322387695312e-08, 7.450580596923828e-08, 1.1920928955078125e-07, 1.6391277313232422e-07, 2.086162567138672e-07, 2.5331974029541016e-07, 2.980232238769531e-07, 3.427267074584961e-07, 3.8743019104003906e-07, 4.3213367462158203e-07, 4.76837158203125e-07, 5.21540641784668e-07, 5.662441253662109e-07, 6.109476089477539e-07, 6.556510925292969e-07, 7.003545761108398e-07, 7.450580596923828e-07, 7.897615432739258e-07, 8.344650268554688e-07, 8.791685104370117e-07, 9.238719940185547e-07, 9.685754776000977e-07, 1.0132789611816406e-06, 1.0579824447631836e-06, 1.1026859283447266e-06, 1.1473894119262695e-06, 1.1920928955078125e-06, 1.2367963790893555e-06, 1.2814998626708984e-06, 1.3262033462524414e-06, 1.3709068298339844e-06, 1.4156103134155273e-06, 1.4603137969970703e-06, 1.5050172805786133e-06, 1.5497207641601562e-06, 1.5944242477416992e-06, 1.6391277313232422e-06, 1.6838312149047852e-06, 1.7285346984863281e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 11.0, 13.0, 14.0, 21.0, 25.0, 46.0, 46.0, 61.0, 107.0, 111.0, 146.0, 225.0, 328.0, 433.0, 589.0, 889.0, 1166.0, 1822.0, 2753.0, 4578.0, 8386.0, 17792.0, 46568.0, 539066.0, 339213.0, 45435.0, 17444.0, 8101.0, 4426.0, 2728.0, 1698.0, 1206.0, 871.0, 590.0, 457.0, 286.0, 265.0, 165.0, 124.0, 102.0, 67.0, 42.0, 34.0, 33.0, 23.0, 14.0, 13.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261383056640625, -0.025294780731201172, -0.024451255798339844, -0.023607730865478516, -0.022764205932617188, -0.02192068099975586, -0.02107715606689453, -0.020233631134033203, -0.019390106201171875, -0.018546581268310547, -0.01770305633544922, -0.01685953140258789, -0.016016006469726562, -0.015172481536865234, -0.014328956604003906, -0.013485431671142578, -0.01264190673828125, -0.011798381805419922, -0.010954856872558594, -0.010111331939697266, -0.009267807006835938, -0.00842428207397461, -0.007580757141113281, -0.006737232208251953, -0.005893707275390625, -0.005050182342529297, -0.004206657409667969, -0.0033631324768066406, -0.0025196075439453125, -0.0016760826110839844, -0.0008325576782226562, 1.0967254638671875e-05, 0.0008544921875, 0.0016980171203613281, 0.0025415420532226562, 0.0033850669860839844, 0.0042285919189453125, 0.005072116851806641, 0.005915641784667969, 0.006759166717529297, 0.007602691650390625, 0.008446216583251953, 0.009289741516113281, 0.01013326644897461, 0.010976791381835938, 0.011820316314697266, 0.012663841247558594, 0.013507366180419922, 0.01435089111328125, 0.015194416046142578, 0.016037940979003906, 0.016881465911865234, 0.017724990844726562, 0.01856851577758789, 0.01941204071044922, 0.020255565643310547, 0.021099090576171875, 0.021942615509033203, 0.02278614044189453, 0.02362966537475586, 0.024473190307617188, 0.025316715240478516, 0.026160240173339844, 0.027003765106201172, 0.0278472900390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 8.0, 15.0, 17.0, 24.0, 34.0, 36.0, 58.0, 190.0, 373.0, 59.0, 47.0, 36.0, 26.0, 16.0, 11.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00820159912109375, -0.007937908172607422, -0.007674217224121094, -0.007410526275634766, -0.0071468353271484375, -0.006883144378662109, -0.006619453430175781, -0.006355762481689453, -0.006092071533203125, -0.005828380584716797, -0.005564689636230469, -0.005300998687744141, -0.0050373077392578125, -0.004773616790771484, -0.004509925842285156, -0.004246234893798828, -0.0039825439453125, -0.003718852996826172, -0.0034551620483398438, -0.0031914710998535156, -0.0029277801513671875, -0.0026640892028808594, -0.0024003982543945312, -0.002136707305908203, -0.001873016357421875, -0.0016093254089355469, -0.0013456344604492188, -0.0010819435119628906, -0.0008182525634765625, -0.0005545616149902344, -0.00029087066650390625, -2.7179718017578125e-05, 0.00023651123046875, 0.0005002021789550781, 0.0007638931274414062, 0.0010275840759277344, 0.0012912750244140625, 0.0015549659729003906, 0.0018186569213867188, 0.002082347869873047, 0.002346038818359375, 0.002609729766845703, 0.0028734207153320312, 0.0031371116638183594, 0.0034008026123046875, 0.0036644935607910156, 0.003928184509277344, 0.004191875457763672, 0.00445556640625, 0.004719257354736328, 0.004982948303222656, 0.005246639251708984, 0.0055103302001953125, 0.005774021148681641, 0.006037712097167969, 0.006301403045654297, 0.006565093994140625, 0.006828784942626953, 0.007092475891113281, 0.007356166839599609, 0.0076198577880859375, 0.007883548736572266, 0.008147239685058594, 0.008410930633544922, 0.00867462158203125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 14.0, 12.0, 27.0, 33.0, 31.0, 37.0, 51.0, 57.0, 83.0, 112.0, 114.0, 95.0, 53.0, 53.0, 38.0, 28.0, 27.0, 25.0, 21.0, 14.0, 9.0, 10.0, 7.0, 8.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.07726425677537918, -0.07508154213428497, -0.07289882004261017, -0.07071610540151596, -0.06853339076042175, -0.06635066866874695, -0.06416795402765274, -0.061985235661268234, -0.05980251729488373, -0.05761979892849922, -0.055437084287405014, -0.05325436592102051, -0.051071647554636, -0.048888929188251495, -0.04670621454715729, -0.04452349618077278, -0.042340781539678574, -0.04015806317329407, -0.03797534853219986, -0.03579263016581535, -0.03360991179943085, -0.03142719715833664, -0.029244478791952133, -0.027061760425567627, -0.02487904392182827, -0.022696327418088913, -0.020513609051704407, -0.01833089254796505, -0.016148176044225693, -0.013965457677841187, -0.01178274117410183, -0.009600023739039898, -0.007417306303977966, -0.005234588868916035, -0.0030518718995153904, -0.0008691549301147461, 0.0013135625049471855, 0.003496279940009117, 0.005678996443748474, 0.007861713878810406, 0.010044431313872337, 0.012227148748934269, 0.0144098661839962, 0.016592582687735558, 0.018775299191474915, 0.02095801755785942, 0.023140734061598778, 0.025323450565338135, 0.02750616893172264, 0.029688885435461998, 0.031871601939201355, 0.03405432030558586, 0.03623703867197037, 0.038419753313064575, 0.04060247167944908, 0.04278519004583359, 0.044967904686927795, 0.0471506230533123, 0.04933333769440651, 0.051516056060791016, 0.05369877442717552, 0.05588149279356003, 0.058064207434654236, 0.06024692580103874, 0.06242964416742325]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 4.0, 11.0, 9.0, 9.0, 14.0, 15.0, 20.0, 31.0, 26.0, 33.0, 32.0, 33.0, 38.0, 42.0, 32.0, 42.0, 44.0, 45.0, 49.0, 35.0, 26.0, 52.0, 30.0, 35.0, 33.0, 26.0, 29.0, 34.0, 22.0, 18.0, 29.0, 14.0, 13.0, 4.0, 12.0, 13.0, 13.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0441107414662838, -0.0426083467900753, -0.041105952113866806, -0.03960356116294861, -0.03810116648674011, -0.036598771810531616, -0.03509637713432312, -0.033593982458114624, -0.03209158778190613, -0.030589193105697632, -0.029086800292134285, -0.02758440561592579, -0.026082012802362442, -0.024579618126153946, -0.02307722344994545, -0.021574828773736954, -0.020072437822818756, -0.01857004314661026, -0.017067650333046913, -0.015565255656838417, -0.014062861911952496, -0.012560468167066574, -0.011058073490858078, -0.009555679745972157, -0.008053286001086235, -0.006550892256200314, -0.005048498045653105, -0.003546103835105896, -0.0020437100902199745, -0.000541316345334053, 0.000961078330874443, 0.0024634720757603645, 0.003965865820646286, 0.0054682595655322075, 0.006970653776079416, 0.008473047986626625, 0.009975441731512547, 0.011477835476398468, 0.012980230152606964, 0.014482623897492886, 0.015985017642378807, 0.017487412318587303, 0.01898980513215065, 0.020492199808359146, 0.021994594484567642, 0.02349698729813099, 0.024999381974339485, 0.026501774787902832, 0.028004169464111328, 0.029506564140319824, 0.03100895695388317, 0.032511353492736816, 0.034013744443655014, 0.03551613911986351, 0.037018533796072006, 0.0385209284722805, 0.0400233194231987, 0.041525714099407196, 0.04302810877561569, 0.04453050345182419, 0.046032894402742386, 0.04753528907895088, 0.04903768375515938, 0.050540078431367874, 0.05204247310757637]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 17.0, 21.0, 29.0, 39.0, 74.0, 111.0, 201.0, 362.0, 549.0, 946.0, 1685.0, 2976.0, 5392.0, 9979.0, 19442.0, 38387.0, 82333.0, 195171.0, 702662.0, 2213048.0, 598569.0, 176360.0, 75013.0, 34715.0, 16984.0, 8659.0, 4613.0, 2452.0, 1388.0, 841.0, 459.0, 286.0, 175.0, 112.0, 75.0, 57.0, 30.0, 12.0, 15.0, 8.0, 9.0, 5.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07427978515625, -0.07157421112060547, -0.06886863708496094, -0.0661630630493164, -0.06345748901367188, -0.060751914978027344, -0.05804634094238281, -0.05534076690673828, -0.05263519287109375, -0.04992961883544922, -0.04722404479980469, -0.044518470764160156, -0.041812896728515625, -0.039107322692871094, -0.03640174865722656, -0.03369617462158203, -0.0309906005859375, -0.02828502655029297, -0.025579452514648438, -0.022873878479003906, -0.020168304443359375, -0.017462730407714844, -0.014757156372070312, -0.012051582336425781, -0.00934600830078125, -0.006640434265136719, -0.0039348602294921875, -0.0012292861938476562, 0.001476287841796875, 0.004181861877441406, 0.0068874359130859375, 0.009593009948730469, 0.012298583984375, 0.015004158020019531, 0.017709732055664062, 0.020415306091308594, 0.023120880126953125, 0.025826454162597656, 0.028532028198242188, 0.03123760223388672, 0.03394317626953125, 0.03664875030517578, 0.03935432434082031, 0.042059898376464844, 0.044765472412109375, 0.047471046447753906, 0.05017662048339844, 0.05288219451904297, 0.0555877685546875, 0.05829334259033203, 0.06099891662597656, 0.0637044906616211, 0.06641006469726562, 0.06911563873291016, 0.07182121276855469, 0.07452678680419922, 0.07723236083984375, 0.07993793487548828, 0.08264350891113281, 0.08534908294677734, 0.08805465698242188, 0.0907602310180664, 0.09346580505371094, 0.09617137908935547, 0.098876953125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 12.0, 12.0, 16.0, 14.0, 17.0, 27.0, 24.0, 29.0, 32.0, 27.0, 42.0, 47.0, 42.0, 39.0, 42.0, 43.0, 40.0, 45.0, 41.0, 42.0, 47.0, 31.0, 36.0, 30.0, 27.0, 32.0, 19.0, 27.0, 17.0, 16.0, 17.0, 10.0, 9.0, 6.0, 11.0, 5.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026947021484375, -0.026000022888183594, -0.025053024291992188, -0.02410602569580078, -0.023159027099609375, -0.02221202850341797, -0.021265029907226562, -0.020318031311035156, -0.01937103271484375, -0.018424034118652344, -0.017477035522460938, -0.01653003692626953, -0.015583038330078125, -0.014636039733886719, -0.013689041137695312, -0.012742042541503906, -0.0117950439453125, -0.010848045349121094, -0.009901046752929688, -0.008954048156738281, -0.008007049560546875, -0.007060050964355469, -0.0061130523681640625, -0.005166053771972656, -0.00421905517578125, -0.0032720565795898438, -0.0023250579833984375, -0.0013780593872070312, -0.000431060791015625, 0.0005159378051757812, 0.0014629364013671875, 0.0024099349975585938, 0.00335693359375, 0.004303932189941406, 0.0052509307861328125, 0.006197929382324219, 0.007144927978515625, 0.008091926574707031, 0.009038925170898438, 0.009985923767089844, 0.01093292236328125, 0.011879920959472656, 0.012826919555664062, 0.013773918151855469, 0.014720916748046875, 0.01566791534423828, 0.016614913940429688, 0.017561912536621094, 0.0185089111328125, 0.019455909729003906, 0.020402908325195312, 0.02134990692138672, 0.022296905517578125, 0.02324390411376953, 0.024190902709960938, 0.025137901306152344, 0.02608489990234375, 0.027031898498535156, 0.027978897094726562, 0.02892589569091797, 0.029872894287109375, 0.03081989288330078, 0.03176689147949219, 0.032713890075683594, 0.033660888671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 16.0, 19.0, 36.0, 47.0, 70.0, 133.0, 161.0, 236.0, 357.0, 496.0, 743.0, 1127.0, 1768.0, 2549.0, 3846.0, 5761.0, 8882.0, 13972.0, 21848.0, 35093.0, 57969.0, 100597.0, 181565.0, 350136.0, 780443.0, 1349892.0, 611569.0, 289916.0, 152402.0, 86096.0, 51173.0, 30824.0, 19165.0, 12298.0, 7952.0, 5039.0, 3239.0, 2288.0, 1432.0, 1002.0, 681.0, 474.0, 307.0, 197.0, 138.0, 113.0, 69.0, 44.0, 26.0, 28.0, 12.0, 16.0, 5.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.043731689453125, -0.042380332946777344, -0.04102897644042969, -0.03967761993408203, -0.038326263427734375, -0.03697490692138672, -0.03562355041503906, -0.034272193908691406, -0.03292083740234375, -0.031569480895996094, -0.030218124389648438, -0.02886676788330078, -0.027515411376953125, -0.02616405487060547, -0.024812698364257812, -0.023461341857910156, -0.0221099853515625, -0.020758628845214844, -0.019407272338867188, -0.01805591583251953, -0.016704559326171875, -0.015353202819824219, -0.014001846313476562, -0.012650489807128906, -0.01129913330078125, -0.009947776794433594, -0.008596420288085938, -0.007245063781738281, -0.005893707275390625, -0.004542350769042969, -0.0031909942626953125, -0.0018396377563476562, -0.00048828125, 0.0008630752563476562, 0.0022144317626953125, 0.0035657882690429688, 0.004917144775390625, 0.006268501281738281, 0.0076198577880859375, 0.008971214294433594, 0.01032257080078125, 0.011673927307128906, 0.013025283813476562, 0.014376640319824219, 0.015727996826171875, 0.01707935333251953, 0.018430709838867188, 0.019782066345214844, 0.0211334228515625, 0.022484779357910156, 0.023836135864257812, 0.02518749237060547, 0.026538848876953125, 0.02789020538330078, 0.029241561889648438, 0.030592918395996094, 0.03194427490234375, 0.033295631408691406, 0.03464698791503906, 0.03599834442138672, 0.037349700927734375, 0.03870105743408203, 0.04005241394042969, 0.041403770446777344, 0.042755126953125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 9.0, 5.0, 9.0, 16.0, 12.0, 11.0, 22.0, 29.0, 31.0, 44.0, 60.0, 72.0, 61.0, 85.0, 88.0, 141.0, 152.0, 186.0, 204.0, 208.0, 223.0, 258.0, 287.0, 274.0, 239.0, 214.0, 178.0, 158.0, 129.0, 131.0, 83.0, 71.0, 74.0, 61.0, 44.0, 53.0, 37.0, 36.0, 16.0, 13.0, 12.0, 16.0, 5.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01509857177734375, -0.014648079872131348, -0.014197587966918945, -0.013747096061706543, -0.01329660415649414, -0.012846112251281738, -0.012395620346069336, -0.011945128440856934, -0.011494636535644531, -0.011044144630432129, -0.010593652725219727, -0.010143160820007324, -0.009692668914794922, -0.00924217700958252, -0.008791685104370117, -0.008341193199157715, -0.007890701293945312, -0.00744020938873291, -0.006989717483520508, -0.0065392255783081055, -0.006088733673095703, -0.005638241767883301, -0.0051877498626708984, -0.004737257957458496, -0.004286766052246094, -0.0038362741470336914, -0.003385782241821289, -0.0029352903366088867, -0.0024847984313964844, -0.002034306526184082, -0.0015838146209716797, -0.0011333227157592773, -0.000682830810546875, -0.00023233890533447266, 0.0002181529998779297, 0.000668644905090332, 0.0011191368103027344, 0.0015696287155151367, 0.002020120620727539, 0.0024706125259399414, 0.0029211044311523438, 0.003371596336364746, 0.0038220882415771484, 0.004272580146789551, 0.004723072052001953, 0.0051735639572143555, 0.005624055862426758, 0.00607454776763916, 0.0065250396728515625, 0.006975531578063965, 0.007426023483276367, 0.00787651538848877, 0.008327007293701172, 0.008777499198913574, 0.009227991104125977, 0.009678483009338379, 0.010128974914550781, 0.010579466819763184, 0.011029958724975586, 0.011480450630187988, 0.01193094253540039, 0.012381434440612793, 0.012831926345825195, 0.013282418251037598, 0.01373291015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 12.0, 18.0, 21.0, 23.0, 18.0, 46.0, 37.0, 60.0, 68.0, 53.0, 86.0, 81.0, 82.0, 84.0, 66.0, 40.0, 43.0, 31.0, 16.0, 18.0, 23.0, 8.0, 12.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0431818813085556, -0.041818127036094666, -0.04045437276363373, -0.03909061849117279, -0.03772686421871185, -0.036363113671541214, -0.034999359399080276, -0.03363560512661934, -0.0322718508541584, -0.030908096581697464, -0.029544342309236526, -0.028180589899420738, -0.0268168356269598, -0.025453081354498863, -0.024089328944683075, -0.022725574672222137, -0.0213618203997612, -0.019998066127300262, -0.018634311854839325, -0.017270559445023537, -0.0159068051725626, -0.014543050900101662, -0.013179297558963299, -0.011815544217824936, -0.010451789945363998, -0.009088035672903061, -0.007724282331764698, -0.006360528524965048, -0.004996774718165398, -0.0036330209113657475, -0.0022692671045660973, -0.0009055137634277344, 0.0004582405090332031, 0.0018219943158328533, 0.0031857481226325035, 0.004549501929432154, 0.005913255736231804, 0.007277009543031454, 0.008640763349831104, 0.010004516690969467, 0.011368270963430405, 0.012732025235891342, 0.014095778577029705, 0.015459531918168068, 0.016823286190629005, 0.018187040463089943, 0.01955079287290573, 0.02091454714536667, 0.022278301417827606, 0.023642055690288544, 0.02500580996274948, 0.02636956237256527, 0.027733316645026207, 0.029097070917487144, 0.030460823327302933, 0.03182457759976387, 0.03318833187222481, 0.034552086144685745, 0.03591584041714668, 0.03727959468960762, 0.03864334523677826, 0.0400070995092392, 0.041370853781700134, 0.04273460805416107, 0.04409836232662201]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 5.0, 8.0, 7.0, 10.0, 18.0, 15.0, 16.0, 23.0, 18.0, 33.0, 31.0, 36.0, 40.0, 23.0, 42.0, 40.0, 45.0, 35.0, 39.0, 40.0, 39.0, 39.0, 45.0, 45.0, 28.0, 22.0, 30.0, 25.0, 22.0, 30.0, 27.0, 23.0, 20.0, 12.0, 10.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03274519369006157, -0.031783267855644226, -0.030821340158581734, -0.02985941432416439, -0.028897486627101898, -0.027935560792684555, -0.026973634958267212, -0.02601170726120472, -0.025049779564142227, -0.024087853729724884, -0.02312592603266239, -0.02216400019824505, -0.021202072501182556, -0.020240146666765213, -0.01927822083234787, -0.018316293135285378, -0.017354367300868034, -0.01639244146645069, -0.015430513769388199, -0.014468587934970856, -0.013506660237908363, -0.01254473440349102, -0.011582807637751102, -0.010620880872011185, -0.009658954106271267, -0.00869702734053135, -0.007735100574791431, -0.006773174274712801, -0.005811247508972883, -0.0048493207432329655, -0.003887394443154335, -0.0029254676774144173, -0.0019635427743196487, -0.0010016161249950528, -3.9689475670456886e-05, 0.0009222370572388172, 0.001884163822978735, 0.0028460905887186527, 0.003808016888797283, 0.004769943654537201, 0.005731870420277119, 0.0066937971860170364, 0.007655723951756954, 0.008617650717496872, 0.009579576551914215, 0.010541504248976707, 0.01150343008339405, 0.012465356849133968, 0.013427283614873886, 0.014389210380613804, 0.015351137146353722, 0.016313062980771065, 0.017274990677833557, 0.0182369165122509, 0.019198842346668243, 0.020160770043730736, 0.021122697740793228, 0.02208462357521057, 0.023046551272273064, 0.024008477106690407, 0.0249704048037529, 0.025932330638170242, 0.026894256472587585, 0.027856184169650078, 0.02881811000406742]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 10.0, 16.0, 22.0, 36.0, 70.0, 84.0, 125.0, 193.0, 280.0, 455.0, 585.0, 866.0, 1295.0, 1885.0, 2899.0, 4187.0, 6437.0, 9815.0, 15223.0, 24261.0, 40061.0, 71628.0, 144258.0, 333571.0, 182722.0, 83715.0, 46323.0, 27643.0, 17251.0, 11023.0, 7220.0, 4725.0, 3174.0, 2064.0, 1392.0, 926.0, 673.0, 479.0, 299.0, 190.0, 128.0, 103.0, 83.0, 34.0, 46.0, 19.0, 15.0, 14.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.0281829833984375, -0.027344942092895508, -0.026506900787353516, -0.025668859481811523, -0.02483081817626953, -0.02399277687072754, -0.023154735565185547, -0.022316694259643555, -0.021478652954101562, -0.02064061164855957, -0.019802570343017578, -0.018964529037475586, -0.018126487731933594, -0.0172884464263916, -0.01645040512084961, -0.015612363815307617, -0.014774322509765625, -0.013936281204223633, -0.01309823989868164, -0.012260198593139648, -0.011422157287597656, -0.010584115982055664, -0.009746074676513672, -0.00890803337097168, -0.008069992065429688, -0.007231950759887695, -0.006393909454345703, -0.005555868148803711, -0.004717826843261719, -0.0038797855377197266, -0.0030417442321777344, -0.002203702926635742, -0.00136566162109375, -0.0005276203155517578, 0.0003104209899902344, 0.0011484622955322266, 0.0019865036010742188, 0.002824544906616211, 0.003662586212158203, 0.004500627517700195, 0.0053386688232421875, 0.00617671012878418, 0.007014751434326172, 0.007852792739868164, 0.008690834045410156, 0.009528875350952148, 0.01036691665649414, 0.011204957962036133, 0.012042999267578125, 0.012881040573120117, 0.01371908187866211, 0.014557123184204102, 0.015395164489746094, 0.016233205795288086, 0.017071247100830078, 0.01790928840637207, 0.018747329711914062, 0.019585371017456055, 0.020423412322998047, 0.02126145362854004, 0.02209949493408203, 0.022937536239624023, 0.023775577545166016, 0.024613618850708008, 0.02545166015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 12.0, 12.0, 13.0, 26.0, 22.0, 25.0, 21.0, 40.0, 38.0, 34.0, 35.0, 37.0, 45.0, 51.0, 49.0, 42.0, 42.0, 36.0, 34.0, 47.0, 32.0, 30.0, 29.0, 32.0, 27.0, 31.0, 21.0, 22.0, 18.0, 13.0, 15.0, 10.0, 8.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036651611328125, -0.03561520576477051, -0.034578800201416016, -0.03354239463806152, -0.03250598907470703, -0.03146958351135254, -0.030433177947998047, -0.029396772384643555, -0.028360366821289062, -0.02732396125793457, -0.026287555694580078, -0.025251150131225586, -0.024214744567871094, -0.0231783390045166, -0.02214193344116211, -0.021105527877807617, -0.020069122314453125, -0.019032716751098633, -0.01799631118774414, -0.01695990562438965, -0.015923500061035156, -0.014887094497680664, -0.013850688934326172, -0.01281428337097168, -0.011777877807617188, -0.010741472244262695, -0.009705066680908203, -0.008668661117553711, -0.007632255554199219, -0.0065958499908447266, -0.005559444427490234, -0.004523038864135742, -0.00348663330078125, -0.002450227737426758, -0.0014138221740722656, -0.00037741661071777344, 0.0006589889526367188, 0.001695394515991211, 0.002731800079345703, 0.0037682056427001953, 0.0048046112060546875, 0.00584101676940918, 0.006877422332763672, 0.007913827896118164, 0.008950233459472656, 0.009986639022827148, 0.01102304458618164, 0.012059450149536133, 0.013095855712890625, 0.014132261276245117, 0.01516866683959961, 0.0162050724029541, 0.017241477966308594, 0.018277883529663086, 0.019314289093017578, 0.02035069465637207, 0.021387100219726562, 0.022423505783081055, 0.023459911346435547, 0.02449631690979004, 0.02553272247314453, 0.026569128036499023, 0.027605533599853516, 0.028641939163208008, 0.0296783447265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 15.0, 16.0, 38.0, 39.0, 57.0, 73.0, 107.0, 137.0, 200.0, 319.0, 397.0, 582.0, 849.0, 1077.0, 1686.0, 2541.0, 3943.0, 6417.0, 11595.0, 23837.0, 63133.0, 622364.0, 223757.0, 42126.0, 17918.0, 9458.0, 5331.0, 3404.0, 2193.0, 1470.0, 964.0, 735.0, 522.0, 390.0, 250.0, 167.0, 117.0, 104.0, 55.0, 50.0, 34.0, 29.0, 17.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.051116943359375, -0.04945850372314453, -0.04780006408691406, -0.046141624450683594, -0.044483184814453125, -0.042824745178222656, -0.04116630554199219, -0.03950786590576172, -0.03784942626953125, -0.03619098663330078, -0.03453254699707031, -0.032874107360839844, -0.031215667724609375, -0.029557228088378906, -0.027898788452148438, -0.02624034881591797, -0.0245819091796875, -0.02292346954345703, -0.021265029907226562, -0.019606590270996094, -0.017948150634765625, -0.016289710998535156, -0.014631271362304688, -0.012972831726074219, -0.01131439208984375, -0.009655952453613281, -0.007997512817382812, -0.006339073181152344, -0.004680633544921875, -0.0030221939086914062, -0.0013637542724609375, 0.00029468536376953125, 0.001953125, 0.0036115646362304688, 0.0052700042724609375, 0.006928443908691406, 0.008586883544921875, 0.010245323181152344, 0.011903762817382812, 0.013562202453613281, 0.01522064208984375, 0.01687908172607422, 0.018537521362304688, 0.020195960998535156, 0.021854400634765625, 0.023512840270996094, 0.025171279907226562, 0.02682971954345703, 0.0284881591796875, 0.03014659881591797, 0.03180503845214844, 0.033463478088378906, 0.035121917724609375, 0.036780357360839844, 0.03843879699707031, 0.04009723663330078, 0.04175567626953125, 0.04341411590576172, 0.04507255554199219, 0.046730995178222656, 0.048389434814453125, 0.050047874450683594, 0.05170631408691406, 0.05336475372314453, 0.055023193359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 13.0, 12.0, 15.0, 14.0, 17.0, 18.0, 16.0, 12.0, 24.0, 21.0, 20.0, 20.0, 47.0, 32.0, 32.0, 45.0, 40.0, 38.0, 53.0, 28.0, 46.0, 44.0, 26.0, 35.0, 23.0, 34.0, 27.0, 35.0, 30.0, 28.0, 19.0, 18.0, 21.0, 22.0, 16.0, 11.0, 9.0, 6.0, 7.0, 4.0, 2.0, 9.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0], "bins": [-0.0212554931640625, -0.020656585693359375, -0.02005767822265625, -0.019458770751953125, -0.01885986328125, -0.018260955810546875, -0.01766204833984375, -0.017063140869140625, -0.0164642333984375, -0.015865325927734375, -0.01526641845703125, -0.014667510986328125, -0.014068603515625, -0.013469696044921875, -0.01287078857421875, -0.012271881103515625, -0.0116729736328125, -0.011074066162109375, -0.01047515869140625, -0.009876251220703125, -0.00927734375, -0.008678436279296875, -0.00807952880859375, -0.007480621337890625, -0.0068817138671875, -0.006282806396484375, -0.00568389892578125, -0.005084991455078125, -0.004486083984375, -0.003887176513671875, -0.00328826904296875, -0.002689361572265625, -0.0020904541015625, -0.001491546630859375, -0.00089263916015625, -0.000293731689453125, 0.00030517578125, 0.000904083251953125, 0.00150299072265625, 0.002101898193359375, 0.0027008056640625, 0.003299713134765625, 0.00389862060546875, 0.004497528076171875, 0.005096435546875, 0.005695343017578125, 0.00629425048828125, 0.006893157958984375, 0.0074920654296875, 0.008090972900390625, 0.00868988037109375, 0.009288787841796875, 0.0098876953125, 0.010486602783203125, 0.01108551025390625, 0.011684417724609375, 0.0122833251953125, 0.012882232666015625, 0.01348114013671875, 0.014080047607421875, 0.014678955078125, 0.015277862548828125, 0.01587677001953125, 0.016475677490234375, 0.0170745849609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 4.0, 7.0, 17.0, 21.0, 27.0, 31.0, 54.0, 57.0, 74.0, 126.0, 144.0, 230.0, 308.0, 446.0, 665.0, 899.0, 1456.0, 2245.0, 3856.0, 6728.0, 13441.0, 33737.0, 204481.0, 689828.0, 51661.0, 17306.0, 8203.0, 4491.0, 2651.0, 1713.0, 1103.0, 769.0, 511.0, 365.0, 265.0, 171.0, 122.0, 103.0, 59.0, 45.0, 35.0, 23.0, 21.0, 13.0, 12.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0059051513671875, -0.005715668201446533, -0.005526185035705566, -0.0053367018699646, -0.005147218704223633, -0.004957735538482666, -0.004768252372741699, -0.004578769207000732, -0.004389286041259766, -0.004199802875518799, -0.004010319709777832, -0.0038208365440368652, -0.0036313533782958984, -0.0034418702125549316, -0.003252387046813965, -0.003062903881072998, -0.0028734207153320312, -0.0026839375495910645, -0.0024944543838500977, -0.002304971218109131, -0.002115488052368164, -0.0019260048866271973, -0.0017365217208862305, -0.0015470385551452637, -0.0013575553894042969, -0.00116807222366333, -0.0009785890579223633, -0.0007891058921813965, -0.0005996227264404297, -0.0004101395606994629, -0.0002206563949584961, -3.11732292175293e-05, 0.0001583099365234375, 0.0003477931022644043, 0.0005372762680053711, 0.0007267594337463379, 0.0009162425994873047, 0.0011057257652282715, 0.0012952089309692383, 0.001484692096710205, 0.0016741752624511719, 0.0018636584281921387, 0.0020531415939331055, 0.0022426247596740723, 0.002432107925415039, 0.002621591091156006, 0.0028110742568969727, 0.0030005574226379395, 0.0031900405883789062, 0.003379523754119873, 0.00356900691986084, 0.0037584900856018066, 0.0039479732513427734, 0.00413745641708374, 0.004326939582824707, 0.004516422748565674, 0.004705905914306641, 0.004895389080047607, 0.005084872245788574, 0.005274355411529541, 0.005463838577270508, 0.005653321743011475, 0.005842804908752441, 0.006032288074493408, 0.006221771240234375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 13.0, 11.0, 9.0, 33.0, 18.0, 37.0, 113.0, 72.0, 70.0, 157.0, 68.0, 71.0, 143.0, 44.0, 33.0, 44.0, 13.0, 10.0, 11.0, 5.0, 8.0, 9.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.6030465960502625e-06, -2.5238841772079468e-06, -2.444721758365631e-06, -2.3655593395233154e-06, -2.2863969206809998e-06, -2.207234501838684e-06, -2.1280720829963684e-06, -2.0489096641540527e-06, -1.969747245311737e-06, -1.8905848264694214e-06, -1.8114224076271057e-06, -1.73225998878479e-06, -1.6530975699424744e-06, -1.5739351511001587e-06, -1.494772732257843e-06, -1.4156103134155273e-06, -1.3364478945732117e-06, -1.257285475730896e-06, -1.1781230568885803e-06, -1.0989606380462646e-06, -1.019798219203949e-06, -9.406358003616333e-07, -8.614733815193176e-07, -7.82310962677002e-07, -7.031485438346863e-07, -6.239861249923706e-07, -5.448237061500549e-07, -4.6566128730773926e-07, -3.864988684654236e-07, -3.073364496231079e-07, -2.2817403078079224e-07, -1.4901161193847656e-07, -6.984919309616089e-08, 9.313225746154785e-09, 8.847564458847046e-08, 1.6763806343078613e-07, 2.468004822731018e-07, 3.259629011154175e-07, 4.0512531995773315e-07, 4.842877388000488e-07, 5.634501576423645e-07, 6.426125764846802e-07, 7.217749953269958e-07, 8.009374141693115e-07, 8.800998330116272e-07, 9.592622518539429e-07, 1.0384246706962585e-06, 1.1175870895385742e-06, 1.1967495083808899e-06, 1.2759119272232056e-06, 1.3550743460655212e-06, 1.434236764907837e-06, 1.5133991837501526e-06, 1.5925616025924683e-06, 1.671724021434784e-06, 1.7508864402770996e-06, 1.8300488591194153e-06, 1.909211277961731e-06, 1.9883736968040466e-06, 2.0675361156463623e-06, 2.146698534488678e-06, 2.2258609533309937e-06, 2.3050233721733093e-06, 2.384185791015625e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 5.0, 4.0, 2.0, 7.0, 3.0, 11.0, 18.0, 21.0, 25.0, 48.0, 69.0, 115.0, 160.0, 255.0, 404.0, 617.0, 927.0, 1558.0, 2586.0, 4445.0, 7654.0, 13956.0, 27585.0, 64863.0, 261142.0, 502970.0, 85899.0, 34564.0, 16707.0, 8940.0, 5131.0, 3002.0, 1846.0, 1125.0, 660.0, 434.0, 276.0, 165.0, 103.0, 84.0, 51.0, 38.0, 28.0, 20.0, 10.0, 10.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.004726409912109375, -0.004569590091705322, -0.0044127702713012695, -0.004255950450897217, -0.004099130630493164, -0.003942310810089111, -0.0037854909896850586, -0.003628671169281006, -0.003471851348876953, -0.0033150315284729004, -0.0031582117080688477, -0.003001391887664795, -0.002844572067260742, -0.0026877522468566895, -0.0025309324264526367, -0.002374112606048584, -0.0022172927856445312, -0.0020604729652404785, -0.0019036531448364258, -0.001746833324432373, -0.0015900135040283203, -0.0014331936836242676, -0.0012763738632202148, -0.0011195540428161621, -0.0009627342224121094, -0.0008059144020080566, -0.0006490945816040039, -0.0004922747611999512, -0.00033545494079589844, -0.0001786351203918457, -2.181529998779297e-05, 0.00013500452041625977, 0.0002918243408203125, 0.00044864416122436523, 0.000605463981628418, 0.0007622838020324707, 0.0009191036224365234, 0.0010759234428405762, 0.001232743263244629, 0.0013895630836486816, 0.0015463829040527344, 0.0017032027244567871, 0.0018600225448608398, 0.0020168423652648926, 0.0021736621856689453, 0.002330482006072998, 0.0024873018264770508, 0.0026441216468811035, 0.0028009414672851562, 0.002957761287689209, 0.0031145811080932617, 0.0032714009284973145, 0.003428220748901367, 0.00358504056930542, 0.0037418603897094727, 0.0038986802101135254, 0.004055500030517578, 0.004212319850921631, 0.004369139671325684, 0.004525959491729736, 0.004682779312133789, 0.004839599132537842, 0.0049964189529418945, 0.005153238773345947, 0.00531005859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 7.0, 4.0, 6.0, 4.0, 3.0, 7.0, 7.0, 7.0, 13.0, 10.0, 24.0, 25.0, 26.0, 45.0, 55.0, 84.0, 140.0, 169.0, 97.0, 76.0, 44.0, 38.0, 21.0, 20.0, 14.0, 8.0, 9.0, 10.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.0018768310546875, -0.001826271414756775, -0.0017757117748260498, -0.0017251521348953247, -0.0016745924949645996, -0.0016240328550338745, -0.0015734732151031494, -0.0015229135751724243, -0.0014723539352416992, -0.0014217942953109741, -0.001371234655380249, -0.001320675015449524, -0.0012701153755187988, -0.0012195557355880737, -0.0011689960956573486, -0.0011184364557266235, -0.0010678768157958984, -0.0010173171758651733, -0.0009667575359344482, -0.0009161978960037231, -0.000865638256072998, -0.000815078616142273, -0.0007645189762115479, -0.0007139593362808228, -0.0006633996963500977, -0.0006128400564193726, -0.0005622804164886475, -0.0005117207765579224, -0.00046116113662719727, -0.00041060149669647217, -0.00036004185676574707, -0.00030948221683502197, -0.0002589225769042969, -0.00020836293697357178, -0.00015780329704284668, -0.00010724365711212158, -5.6684017181396484e-05, -6.124377250671387e-06, 4.443526268005371e-05, 9.499490261077881e-05, 0.0001455545425415039, 0.000196114182472229, 0.0002466738224029541, 0.0002972334623336792, 0.0003477931022644043, 0.0003983527421951294, 0.0004489123821258545, 0.0004994720220565796, 0.0005500316619873047, 0.0006005913019180298, 0.0006511509418487549, 0.00070171058177948, 0.0007522702217102051, 0.0008028298616409302, 0.0008533895015716553, 0.0009039491415023804, 0.0009545087814331055, 0.0010050684213638306, 0.0010556280612945557, 0.0011061877012252808, 0.0011567473411560059, 0.001207306981086731, 0.001257866621017456, 0.0013084262609481812, 0.0013589859008789062]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 9.0, 20.0, 28.0, 23.0, 24.0, 36.0, 40.0, 76.0, 61.0, 72.0, 95.0, 85.0, 96.0, 63.0, 59.0, 41.0, 35.0, 17.0, 23.0, 15.0, 12.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044713977724313736, -0.04331965744495392, -0.0419253371655941, -0.04053101688623428, -0.039136696606874466, -0.03774237632751465, -0.03634805232286453, -0.03495373576879501, -0.0335594117641449, -0.03216509148478508, -0.030770771205425262, -0.029376450926065445, -0.027982130646705627, -0.02658781036734581, -0.025193488225340843, -0.023799167945981026, -0.022404849529266357, -0.02101052924990654, -0.019616208970546722, -0.018221888691186905, -0.016827568411827087, -0.015433247201144695, -0.014038925990462303, -0.012644605711102486, -0.011250285431742668, -0.00985596515238285, -0.008461644873023033, -0.007067323662340641, -0.0056730033829808235, -0.004278683103621006, -0.002884361892938614, -0.0014900416135787964, -9.572133421897888e-05, 0.0012985991779714823, 0.0026929196901619434, 0.004087240435183048, 0.005481560714542866, 0.006875880993902683, 0.008270202204585075, 0.009664522483944893, 0.01105884276330471, 0.012453163042664528, 0.013847483322024345, 0.015241804532706738, 0.01663612574338913, 0.018030446022748947, 0.019424766302108765, 0.020819086581468582, 0.0222134068608284, 0.023607727140188217, 0.025002047419548035, 0.026396367698907852, 0.02779068797826767, 0.029185008257627487, 0.030579330399632454, 0.03197365254163742, 0.03336796909570694, 0.03476228937506676, 0.036156609654426575, 0.03755092993378639, 0.03894525021314621, 0.04033957049250603, 0.041733890771865845, 0.04312821477651596, 0.04452253505587578]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 6.0, 9.0, 8.0, 17.0, 14.0, 17.0, 23.0, 17.0, 31.0, 32.0, 37.0, 34.0, 32.0, 38.0, 40.0, 46.0, 36.0, 41.0, 40.0, 37.0, 35.0, 47.0, 47.0, 28.0, 23.0, 32.0, 23.0, 25.0, 34.0, 22.0, 24.0, 18.0, 14.0, 10.0, 14.0, 11.0, 7.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03296642005443573, -0.03200586512684822, -0.03104531019926071, -0.030084755271673203, -0.029124202206730843, -0.028163647279143333, -0.027203092351555824, -0.026242537423968315, -0.025281984359025955, -0.024321429431438446, -0.023360874503850937, -0.022400319576263428, -0.021439766511321068, -0.02047921158373356, -0.01951865665614605, -0.01855810172855854, -0.01759754680097103, -0.016636991873383522, -0.015676436945796013, -0.014715882949531078, -0.013755328953266144, -0.012794774025678635, -0.011834219098091125, -0.010873664170503616, -0.009913110174238682, -0.008952555246651173, -0.007992001250386238, -0.007031446322798729, -0.006070891860872507, -0.005110337398946285, -0.004149782471358776, -0.0031892280094325542, -0.002228671684861183, -0.0012681171065196395, -0.0003075625281780958, 0.0006529921665787697, 0.0016135466285049915, 0.0025741010904312134, 0.0035346560180187225, 0.004495210479944944, 0.005455764941871166, 0.006416319403797388, 0.00737687386572361, 0.008337428793311119, 0.009297983720898628, 0.010258537717163563, 0.011219092644751072, 0.012179646641016006, 0.013140201568603516, 0.014100756496191025, 0.01506131049245596, 0.016021866351366043, 0.016982419416308403, 0.017942974343895912, 0.01890352927148342, 0.01986408419907093, 0.02082463726401329, 0.0217851921916008, 0.02274574711918831, 0.023706302046775818, 0.024666855111718178, 0.025627410039305687, 0.026587964966893196, 0.027548519894480705, 0.028509074822068214]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 16.0, 21.0, 39.0, 43.0, 82.0, 98.0, 165.0, 252.0, 369.0, 604.0, 803.0, 1231.0, 1777.0, 2791.0, 4320.0, 6852.0, 10281.0, 16095.0, 25456.0, 40783.0, 68503.0, 123042.0, 237594.0, 221326.0, 114747.0, 64555.0, 38818.0, 24316.0, 15282.0, 9860.0, 6277.0, 4195.0, 2656.0, 1763.0, 1221.0, 762.0, 494.0, 339.0, 254.0, 153.0, 112.0, 56.0, 44.0, 30.0, 18.0, 17.0, 8.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.058013916015625, -0.05625295639038086, -0.05449199676513672, -0.05273103713989258, -0.05097007751464844, -0.0492091178894043, -0.047448158264160156, -0.045687198638916016, -0.043926239013671875, -0.042165279388427734, -0.040404319763183594, -0.03864336013793945, -0.03688240051269531, -0.03512144088745117, -0.03336048126220703, -0.03159952163696289, -0.02983856201171875, -0.02807760238647461, -0.02631664276123047, -0.024555683135986328, -0.022794723510742188, -0.021033763885498047, -0.019272804260253906, -0.017511844635009766, -0.015750885009765625, -0.013989925384521484, -0.012228965759277344, -0.010468006134033203, -0.008707046508789062, -0.006946086883544922, -0.005185127258300781, -0.0034241676330566406, -0.0016632080078125, 9.775161743164062e-05, 0.0018587112426757812, 0.003619670867919922, 0.0053806304931640625, 0.007141590118408203, 0.008902549743652344, 0.010663509368896484, 0.012424468994140625, 0.014185428619384766, 0.015946388244628906, 0.017707347869873047, 0.019468307495117188, 0.021229267120361328, 0.02299022674560547, 0.02475118637084961, 0.02651214599609375, 0.02827310562133789, 0.03003406524658203, 0.03179502487182617, 0.03355598449707031, 0.03531694412231445, 0.037077903747558594, 0.038838863372802734, 0.040599822998046875, 0.042360782623291016, 0.044121742248535156, 0.0458827018737793, 0.04764366149902344, 0.04940462112426758, 0.05116558074951172, 0.05292654037475586, 0.0546875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 7.0, 6.0, 9.0, 13.0, 9.0, 16.0, 22.0, 15.0, 24.0, 25.0, 23.0, 26.0, 33.0, 40.0, 37.0, 42.0, 49.0, 43.0, 44.0, 47.0, 37.0, 44.0, 35.0, 45.0, 32.0, 36.0, 24.0, 25.0, 23.0, 35.0, 29.0, 25.0, 20.0, 14.0, 11.0, 7.0, 12.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.030059814453125, -0.02916717529296875, -0.0282745361328125, -0.02738189697265625, -0.0264892578125, -0.02559661865234375, -0.0247039794921875, -0.02381134033203125, -0.022918701171875, -0.02202606201171875, -0.0211334228515625, -0.02024078369140625, -0.01934814453125, -0.01845550537109375, -0.0175628662109375, -0.01667022705078125, -0.015777587890625, -0.01488494873046875, -0.0139923095703125, -0.01309967041015625, -0.01220703125, -0.01131439208984375, -0.0104217529296875, -0.00952911376953125, -0.008636474609375, -0.00774383544921875, -0.0068511962890625, -0.00595855712890625, -0.00506591796875, -0.00417327880859375, -0.0032806396484375, -0.00238800048828125, -0.001495361328125, -0.00060272216796875, 0.0002899169921875, 0.00118255615234375, 0.0020751953125, 0.00296783447265625, 0.0038604736328125, 0.00475311279296875, 0.005645751953125, 0.00653839111328125, 0.0074310302734375, 0.00832366943359375, 0.00921630859375, 0.01010894775390625, 0.0110015869140625, 0.01189422607421875, 0.012786865234375, 0.01367950439453125, 0.0145721435546875, 0.01546478271484375, 0.016357421875, 0.01725006103515625, 0.0181427001953125, 0.01903533935546875, 0.019927978515625, 0.02082061767578125, 0.0217132568359375, 0.02260589599609375, 0.02349853515625, 0.02439117431640625, 0.0252838134765625, 0.02617645263671875, 0.027069091796875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 5.0, 9.0, 25.0, 23.0, 29.0, 49.0, 74.0, 117.0, 176.0, 235.0, 378.0, 576.0, 867.0, 1332.0, 1994.0, 3216.0, 4988.0, 7632.0, 12209.0, 19013.0, 31352.0, 51254.0, 86351.0, 158804.0, 273664.0, 165657.0, 89368.0, 52535.0, 32388.0, 19768.0, 12465.0, 7725.0, 4790.0, 3208.0, 2135.0, 1346.0, 922.0, 596.0, 409.0, 294.0, 193.0, 113.0, 88.0, 62.0, 38.0, 28.0, 17.0, 16.0, 3.0, 7.0, 5.0, 4.0, 1.0, 4.0], "bins": [-0.061676025390625, -0.059889793395996094, -0.05810356140136719, -0.05631732940673828, -0.054531097412109375, -0.05274486541748047, -0.05095863342285156, -0.049172401428222656, -0.04738616943359375, -0.045599937438964844, -0.04381370544433594, -0.04202747344970703, -0.040241241455078125, -0.03845500946044922, -0.03666877746582031, -0.034882545471191406, -0.0330963134765625, -0.031310081481933594, -0.029523849487304688, -0.02773761749267578, -0.025951385498046875, -0.02416515350341797, -0.022378921508789062, -0.020592689514160156, -0.01880645751953125, -0.017020225524902344, -0.015233993530273438, -0.013447761535644531, -0.011661529541015625, -0.009875297546386719, -0.008089065551757812, -0.006302833557128906, -0.0045166015625, -0.0027303695678710938, -0.0009441375732421875, 0.0008420944213867188, 0.002628326416015625, 0.004414558410644531, 0.0062007904052734375, 0.007987022399902344, 0.00977325439453125, 0.011559486389160156, 0.013345718383789062, 0.015131950378417969, 0.016918182373046875, 0.01870441436767578, 0.020490646362304688, 0.022276878356933594, 0.0240631103515625, 0.025849342346191406, 0.027635574340820312, 0.02942180633544922, 0.031208038330078125, 0.03299427032470703, 0.03478050231933594, 0.036566734313964844, 0.03835296630859375, 0.040139198303222656, 0.04192543029785156, 0.04371166229248047, 0.045497894287109375, 0.04728412628173828, 0.04907035827636719, 0.050856590270996094, 0.052642822265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 10.0, 11.0, 14.0, 12.0, 21.0, 12.0, 24.0, 16.0, 31.0, 29.0, 32.0, 30.0, 50.0, 45.0, 43.0, 47.0, 50.0, 40.0, 42.0, 38.0, 37.0, 49.0, 38.0, 43.0, 35.0, 18.0, 30.0, 36.0, 21.0, 21.0, 9.0, 18.0, 11.0, 8.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0163421630859375, -0.015743017196655273, -0.015143871307373047, -0.01454472541809082, -0.013945579528808594, -0.013346433639526367, -0.01274728775024414, -0.012148141860961914, -0.011548995971679688, -0.010949850082397461, -0.010350704193115234, -0.009751558303833008, -0.009152412414550781, -0.008553266525268555, -0.007954120635986328, -0.0073549747467041016, -0.006755828857421875, -0.0061566829681396484, -0.005557537078857422, -0.004958391189575195, -0.004359245300292969, -0.003760099411010742, -0.0031609535217285156, -0.002561807632446289, -0.0019626617431640625, -0.001363515853881836, -0.0007643699645996094, -0.0001652240753173828, 0.00043392181396484375, 0.0010330677032470703, 0.0016322135925292969, 0.0022313594818115234, 0.00283050537109375, 0.0034296512603759766, 0.004028797149658203, 0.00462794303894043, 0.005227088928222656, 0.005826234817504883, 0.006425380706787109, 0.007024526596069336, 0.0076236724853515625, 0.008222818374633789, 0.008821964263916016, 0.009421110153198242, 0.010020256042480469, 0.010619401931762695, 0.011218547821044922, 0.011817693710327148, 0.012416839599609375, 0.013015985488891602, 0.013615131378173828, 0.014214277267456055, 0.014813423156738281, 0.015412569046020508, 0.016011714935302734, 0.01661086082458496, 0.017210006713867188, 0.017809152603149414, 0.01840829849243164, 0.019007444381713867, 0.019606590270996094, 0.02020573616027832, 0.020804882049560547, 0.021404027938842773, 0.022003173828125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 9.0, 21.0, 20.0, 32.0, 54.0, 55.0, 93.0, 109.0, 159.0, 247.0, 316.0, 500.0, 661.0, 1012.0, 1358.0, 2130.0, 3173.0, 5390.0, 9520.0, 20768.0, 62304.0, 663593.0, 203138.0, 38485.0, 14913.0, 7545.0, 4311.0, 2801.0, 1771.0, 1190.0, 788.0, 574.0, 377.0, 314.0, 250.0, 139.0, 115.0, 83.0, 67.0, 44.0, 32.0, 13.0, 23.0, 12.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0047607421875, -0.004611074924468994, -0.004461407661437988, -0.004311740398406982, -0.0041620731353759766, -0.004012405872344971, -0.003862738609313965, -0.003713071346282959, -0.003563404083251953, -0.0034137368202209473, -0.0032640695571899414, -0.0031144022941589355, -0.0029647350311279297, -0.002815067768096924, -0.002665400505065918, -0.002515733242034912, -0.0023660659790039062, -0.0022163987159729004, -0.0020667314529418945, -0.0019170641899108887, -0.0017673969268798828, -0.001617729663848877, -0.001468062400817871, -0.0013183951377868652, -0.0011687278747558594, -0.0010190606117248535, -0.0008693933486938477, -0.0007197260856628418, -0.0005700588226318359, -0.0004203915596008301, -0.0002707242965698242, -0.00012105703353881836, 2.86102294921875e-05, 0.00017827749252319336, 0.0003279447555541992, 0.0004776120185852051, 0.0006272792816162109, 0.0007769465446472168, 0.0009266138076782227, 0.0010762810707092285, 0.0012259483337402344, 0.0013756155967712402, 0.001525282859802246, 0.001674950122833252, 0.0018246173858642578, 0.0019742846488952637, 0.0021239519119262695, 0.0022736191749572754, 0.0024232864379882812, 0.002572953701019287, 0.002722620964050293, 0.002872288227081299, 0.0030219554901123047, 0.0031716227531433105, 0.0033212900161743164, 0.0034709572792053223, 0.003620624542236328, 0.003770291805267334, 0.00391995906829834, 0.004069626331329346, 0.0042192935943603516, 0.004368960857391357, 0.004518628120422363, 0.004668295383453369, 0.004817962646484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 11.0, 12.0, 11.0, 17.0, 30.0, 0.0, 37.0, 66.0, 102.0, 118.0, 138.0, 124.0, 0.0, 113.0, 83.0, 39.0, 30.0, 20.0, 11.0, 0.0, 9.0, 4.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.319684088230133e-06, -1.2684613466262817e-06, -1.2172386050224304e-06, -1.166015863418579e-06, -1.1147931218147278e-06, -1.0635703802108765e-06, -1.0123476386070251e-06, -9.611248970031738e-07, -9.099021553993225e-07, -8.586794137954712e-07, -8.074566721916199e-07, -7.562339305877686e-07, -7.050111889839172e-07, -6.537884473800659e-07, -6.025657057762146e-07, -5.513429641723633e-07, -5.00120222568512e-07, -4.4889748096466064e-07, -3.976747393608093e-07, -3.46451997756958e-07, -2.952292561531067e-07, -2.4400651454925537e-07, -1.9278377294540405e-07, -1.4156103134155273e-07, -9.033828973770142e-08, -3.91155481338501e-08, 1.210719347000122e-08, 6.332993507385254e-08, 1.1455267667770386e-07, 1.6577541828155518e-07, 2.169981598854065e-07, 2.682209014892578e-07, 3.1944364309310913e-07, 3.7066638469696045e-07, 4.2188912630081177e-07, 4.731118679046631e-07, 5.243346095085144e-07, 5.755573511123657e-07, 6.26780092716217e-07, 6.780028343200684e-07, 7.292255759239197e-07, 7.80448317527771e-07, 8.316710591316223e-07, 8.828938007354736e-07, 9.34116542339325e-07, 9.853392839431763e-07, 1.0365620255470276e-06, 1.087784767150879e-06, 1.1390075087547302e-06, 1.1902302503585815e-06, 1.2414529919624329e-06, 1.2926757335662842e-06, 1.3438984751701355e-06, 1.3951212167739868e-06, 1.4463439583778381e-06, 1.4975666999816895e-06, 1.5487894415855408e-06, 1.600012183189392e-06, 1.6512349247932434e-06, 1.7024576663970947e-06, 1.753680408000946e-06, 1.8049031496047974e-06, 1.8561258912086487e-06, 1.9073486328125e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 2.0, 5.0, 8.0, 19.0, 14.0, 20.0, 28.0, 34.0, 49.0, 75.0, 90.0, 125.0, 168.0, 228.0, 339.0, 458.0, 724.0, 977.0, 1574.0, 2351.0, 3867.0, 6430.0, 11634.0, 22921.0, 75072.0, 735411.0, 122635.0, 29720.0, 13381.0, 7560.0, 4490.0, 2744.0, 1722.0, 1091.0, 745.0, 525.0, 365.0, 266.0, 185.0, 145.0, 98.0, 71.0, 49.0, 41.0, 22.0, 14.0, 15.0, 12.0, 12.0, 8.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00493621826171875, -0.004780173301696777, -0.004624128341674805, -0.004468083381652832, -0.004312038421630859, -0.004155993461608887, -0.003999948501586914, -0.0038439035415649414, -0.0036878585815429688, -0.003531813621520996, -0.0033757686614990234, -0.0032197237014770508, -0.003063678741455078, -0.0029076337814331055, -0.002751588821411133, -0.00259554386138916, -0.0024394989013671875, -0.002283453941345215, -0.002127408981323242, -0.0019713640213012695, -0.0018153190612792969, -0.0016592741012573242, -0.0015032291412353516, -0.001347184181213379, -0.0011911392211914062, -0.0010350942611694336, -0.0008790493011474609, -0.0007230043411254883, -0.0005669593811035156, -0.00041091442108154297, -0.0002548694610595703, -9.882450103759766e-05, 5.7220458984375e-05, 0.00021326541900634766, 0.0003693103790283203, 0.000525355339050293, 0.0006814002990722656, 0.0008374452590942383, 0.000993490219116211, 0.0011495351791381836, 0.0013055801391601562, 0.001461625099182129, 0.0016176700592041016, 0.0017737150192260742, 0.0019297599792480469, 0.0020858049392700195, 0.002241849899291992, 0.002397894859313965, 0.0025539398193359375, 0.00270998477935791, 0.002866029739379883, 0.0030220746994018555, 0.003178119659423828, 0.0033341646194458008, 0.0034902095794677734, 0.003646254539489746, 0.0038022994995117188, 0.003958344459533691, 0.004114389419555664, 0.004270434379577637, 0.004426479339599609, 0.004582524299621582, 0.004738569259643555, 0.004894614219665527, 0.0050506591796875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 2.0, 4.0, 7.0, 10.0, 17.0, 13.0, 14.0, 21.0, 59.0, 149.0, 346.0, 148.0, 76.0, 32.0, 15.0, 8.0, 14.0, 5.0, 7.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001644134521484375, -0.0015965253114700317, -0.0015489161014556885, -0.0015013068914413452, -0.001453697681427002, -0.0014060884714126587, -0.0013584792613983154, -0.0013108700513839722, -0.001263260841369629, -0.0012156516313552856, -0.0011680424213409424, -0.0011204332113265991, -0.0010728240013122559, -0.0010252147912979126, -0.0009776055812835693, -0.0009299963712692261, -0.0008823871612548828, -0.0008347779512405396, -0.0007871687412261963, -0.000739559531211853, -0.0006919503211975098, -0.0006443411111831665, -0.0005967319011688232, -0.00054912269115448, -0.0005015134811401367, -0.00045390427112579346, -0.0004062950611114502, -0.00035868585109710693, -0.00031107664108276367, -0.0002634674310684204, -0.00021585822105407715, -0.0001682490110397339, -0.00012063980102539062, -7.303059101104736e-05, -2.54213809967041e-05, 2.218782901763916e-05, 6.979703903198242e-05, 0.00011740624904632568, 0.00016501545906066895, 0.0002126246690750122, 0.00026023387908935547, 0.00030784308910369873, 0.000355452299118042, 0.00040306150913238525, 0.0004506707191467285, 0.0004982799291610718, 0.000545889139175415, 0.0005934983491897583, 0.0006411075592041016, 0.0006887167692184448, 0.0007363259792327881, 0.0007839351892471313, 0.0008315443992614746, 0.0008791536092758179, 0.0009267628192901611, 0.0009743720293045044, 0.0010219812393188477, 0.001069590449333191, 0.0011171996593475342, 0.0011648088693618774, 0.0012124180793762207, 0.001260027289390564, 0.0013076364994049072, 0.0013552457094192505, 0.0014028549194335938]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 12.0, 7.0, 15.0, 17.0, 20.0, 28.0, 23.0, 28.0, 40.0, 50.0, 51.0, 71.0, 97.0, 106.0, 71.0, 53.0, 68.0, 48.0, 37.0, 37.0, 19.0, 21.0, 15.0, 12.0, 10.0, 6.0, 7.0, 8.0, 1.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.03839346393942833, -0.03717665746808052, -0.03595985099673271, -0.034743040800094604, -0.033526234328746796, -0.03230942785739899, -0.031092621386051178, -0.02987581491470337, -0.02865900844335556, -0.02744220197200775, -0.026225393638014793, -0.025008587166666985, -0.023791780695319176, -0.022574972361326218, -0.02135816588997841, -0.0201413594186306, -0.018924551084637642, -0.017707744613289833, -0.016490936279296875, -0.015274129807949066, -0.014057323336601257, -0.012840515933930874, -0.01162370853126049, -0.010406902059912682, -0.009190094657242298, -0.007973287254571915, -0.006756480783224106, -0.005539673380553722, -0.004322866443544626, -0.00310605950653553, -0.0018892521038651466, -0.0006724456325173378, 0.0005443617701530457, 0.0017611688235774636, 0.0029779758770018816, 0.004194783046841621, 0.0054115899838507175, 0.006628396920859814, 0.007845204323530197, 0.009062010794878006, 0.01027881819754839, 0.011495625600218773, 0.012712432071566582, 0.013929239474236965, 0.015146046876907349, 0.016362853348255157, 0.017579659819602966, 0.018796466290950775, 0.020013274624943733, 0.021230081096291542, 0.0224468894302845, 0.02366369590163231, 0.024880502372980118, 0.026097308844327927, 0.027314117178320885, 0.028530923649668694, 0.02974773198366165, 0.03096453845500946, 0.03218134492635727, 0.03339815139770508, 0.034614961594343185, 0.035831768065690994, 0.0370485745370388, 0.03826538100838661, 0.03948218747973442]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 13.0, 9.0, 14.0, 15.0, 19.0, 25.0, 16.0, 33.0, 21.0, 44.0, 27.0, 29.0, 33.0, 39.0, 33.0, 41.0, 35.0, 23.0, 41.0, 31.0, 31.0, 50.0, 30.0, 42.0, 26.0, 27.0, 26.0, 28.0, 24.0, 19.0, 21.0, 19.0, 20.0, 9.0, 11.0, 11.0, 9.0, 12.0, 8.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.02709183655679226, -0.02627384476363659, -0.02545585110783577, -0.0246378593146801, -0.02381986565887928, -0.02300187386572361, -0.02218388020992279, -0.02136588841676712, -0.02054789662361145, -0.01972990483045578, -0.01891191117465496, -0.01809391938149929, -0.01727592572569847, -0.0164579339325428, -0.01563994213938713, -0.014821948483586311, -0.014003954827785492, -0.013185962103307247, -0.012367969378829002, -0.011549977585673332, -0.010731983929872513, -0.009913992136716843, -0.009095999412238598, -0.008278006687760353, -0.007460013963282108, -0.0066420212388038635, -0.005824028514325619, -0.005006036255508661, -0.0041880435310304165, -0.0033700508065521717, -0.0025520585477352142, -0.0017340658232569695, -0.0009160712361335754, -9.807862807065248e-05, 0.0007199139799922705, 0.0015379064716398716, 0.0023558991961181164, 0.003173891920596361, 0.003991884179413319, 0.004809876903891563, 0.005627869628369808, 0.006445862352848053, 0.007263855077326298, 0.008081847801804543, 0.008899839594960213, 0.009717833250761032, 0.010535825043916702, 0.011353817768394947, 0.012171810492873192, 0.012989803217351437, 0.013807795941829681, 0.014625787734985352, 0.015443781390786171, 0.01626177318394184, 0.01707976683974266, 0.01789775863289833, 0.018715750426054, 0.01953374221920967, 0.02035173587501049, 0.02116972766816616, 0.02198772132396698, 0.02280571311712265, 0.02362370491027832, 0.02444169856607914, 0.02525969222187996]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 9.0, 5.0, 24.0, 35.0, 48.0, 57.0, 104.0, 158.0, 215.0, 344.0, 493.0, 750.0, 1039.0, 1605.0, 2314.0, 3395.0, 5005.0, 7300.0, 10926.0, 16372.0, 24844.0, 39798.0, 65058.0, 112142.0, 214753.0, 595188.0, 1624470.0, 863190.0, 272641.0, 132687.0, 74932.0, 44393.0, 27702.0, 17792.0, 11599.0, 7554.0, 4988.0, 3445.0, 2173.0, 1537.0, 1023.0, 685.0, 529.0, 318.0, 222.0, 151.0, 103.0, 64.0, 40.0, 21.0, 21.0, 8.0, 8.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03167724609375, -0.030608654022216797, -0.029540061950683594, -0.02847146987915039, -0.027402877807617188, -0.026334285736083984, -0.02526569366455078, -0.024197101593017578, -0.023128509521484375, -0.022059917449951172, -0.02099132537841797, -0.019922733306884766, -0.018854141235351562, -0.01778554916381836, -0.016716957092285156, -0.015648365020751953, -0.01457977294921875, -0.013511180877685547, -0.012442588806152344, -0.01137399673461914, -0.010305404663085938, -0.009236812591552734, -0.008168220520019531, -0.007099628448486328, -0.006031036376953125, -0.004962444305419922, -0.0038938522338867188, -0.0028252601623535156, -0.0017566680908203125, -0.0006880760192871094, 0.00038051605224609375, 0.0014491081237792969, 0.0025177001953125, 0.003586292266845703, 0.004654884338378906, 0.005723476409912109, 0.0067920684814453125, 0.007860660552978516, 0.008929252624511719, 0.009997844696044922, 0.011066436767578125, 0.012135028839111328, 0.013203620910644531, 0.014272212982177734, 0.015340805053710938, 0.01640939712524414, 0.017477989196777344, 0.018546581268310547, 0.01961517333984375, 0.020683765411376953, 0.021752357482910156, 0.02282094955444336, 0.023889541625976562, 0.024958133697509766, 0.02602672576904297, 0.027095317840576172, 0.028163909912109375, 0.029232501983642578, 0.03030109405517578, 0.031369686126708984, 0.03243827819824219, 0.03350687026977539, 0.034575462341308594, 0.0356440544128418, 0.036712646484375]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 12.0, 10.0, 9.0, 13.0, 16.0, 22.0, 15.0, 23.0, 24.0, 27.0, 46.0, 25.0, 23.0, 31.0, 38.0, 41.0, 35.0, 35.0, 36.0, 38.0, 29.0, 36.0, 44.0, 36.0, 44.0, 39.0, 28.0, 23.0, 25.0, 28.0, 27.0, 18.0, 11.0, 14.0, 14.0, 14.0, 12.0, 13.0, 8.0, 1.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016845703125, -0.01634061336517334, -0.01583552360534668, -0.01533043384552002, -0.01482534408569336, -0.0143202543258667, -0.013815164566040039, -0.013310074806213379, -0.012804985046386719, -0.012299895286560059, -0.011794805526733398, -0.011289715766906738, -0.010784626007080078, -0.010279536247253418, -0.009774446487426758, -0.009269356727600098, -0.008764266967773438, -0.008259177207946777, -0.007754087448120117, -0.007248997688293457, -0.006743907928466797, -0.006238818168640137, -0.0057337284088134766, -0.005228638648986816, -0.004723548889160156, -0.004218459129333496, -0.003713369369506836, -0.0032082796096801758, -0.0027031898498535156, -0.0021981000900268555, -0.0016930103302001953, -0.0011879205703735352, -0.000682830810546875, -0.00017774105072021484, 0.0003273487091064453, 0.0008324384689331055, 0.0013375282287597656, 0.0018426179885864258, 0.002347707748413086, 0.002852797508239746, 0.0033578872680664062, 0.0038629770278930664, 0.0043680667877197266, 0.004873156547546387, 0.005378246307373047, 0.005883336067199707, 0.006388425827026367, 0.006893515586853027, 0.0073986053466796875, 0.007903695106506348, 0.008408784866333008, 0.008913874626159668, 0.009418964385986328, 0.009924054145812988, 0.010429143905639648, 0.010934233665466309, 0.011439323425292969, 0.011944413185119629, 0.012449502944946289, 0.01295459270477295, 0.01345968246459961, 0.01396477222442627, 0.01446986198425293, 0.01497495174407959, 0.01548004150390625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 9.0, 4.0, 12.0, 13.0, 20.0, 42.0, 46.0, 58.0, 126.0, 169.0, 258.0, 459.0, 714.0, 1063.0, 1689.0, 2834.0, 4593.0, 7586.0, 13209.0, 22270.0, 39554.0, 72148.0, 134894.0, 271757.0, 636813.0, 1531573.0, 788006.0, 320987.0, 154990.0, 81578.0, 44903.0, 25431.0, 14513.0, 8572.0, 5096.0, 3052.0, 1946.0, 1172.0, 743.0, 489.0, 331.0, 205.0, 136.0, 84.0, 51.0, 37.0, 26.0, 15.0, 12.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02764892578125, -0.026682376861572266, -0.02571582794189453, -0.024749279022216797, -0.023782730102539062, -0.022816181182861328, -0.021849632263183594, -0.02088308334350586, -0.019916534423828125, -0.01894998550415039, -0.017983436584472656, -0.017016887664794922, -0.016050338745117188, -0.015083789825439453, -0.014117240905761719, -0.013150691986083984, -0.01218414306640625, -0.011217594146728516, -0.010251045227050781, -0.009284496307373047, -0.008317947387695312, -0.007351398468017578, -0.006384849548339844, -0.005418300628662109, -0.004451751708984375, -0.0034852027893066406, -0.0025186538696289062, -0.0015521049499511719, -0.0005855560302734375, 0.0003809928894042969, 0.0013475418090820312, 0.0023140907287597656, 0.0032806396484375, 0.004247188568115234, 0.005213737487792969, 0.006180286407470703, 0.0071468353271484375, 0.008113384246826172, 0.009079933166503906, 0.01004648208618164, 0.011013031005859375, 0.01197957992553711, 0.012946128845214844, 0.013912677764892578, 0.014879226684570312, 0.015845775604248047, 0.01681232452392578, 0.017778873443603516, 0.01874542236328125, 0.019711971282958984, 0.02067852020263672, 0.021645069122314453, 0.022611618041992188, 0.023578166961669922, 0.024544715881347656, 0.02551126480102539, 0.026477813720703125, 0.02744436264038086, 0.028410911560058594, 0.029377460479736328, 0.030344009399414062, 0.0313105583190918, 0.03227710723876953, 0.033243656158447266, 0.034210205078125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 14.0, 17.0, 16.0, 25.0, 31.0, 34.0, 33.0, 36.0, 54.0, 62.0, 81.0, 84.0, 100.0, 98.0, 122.0, 129.0, 161.0, 209.0, 195.0, 209.0, 251.0, 266.0, 232.0, 238.0, 164.0, 156.0, 155.0, 157.0, 108.0, 100.0, 72.0, 77.0, 70.0, 56.0, 53.0, 36.0, 42.0, 29.0, 17.0, 18.0, 11.0, 10.0, 9.0, 3.0, 5.0, 7.0, 0.0, 2.0, 2.0, 4.0, 3.0], "bins": [-0.00852203369140625, -0.008272528648376465, -0.00802302360534668, -0.0077735185623168945, -0.007524013519287109, -0.007274508476257324, -0.007025003433227539, -0.006775498390197754, -0.006525993347167969, -0.006276488304138184, -0.0060269832611083984, -0.005777478218078613, -0.005527973175048828, -0.005278468132019043, -0.005028963088989258, -0.004779458045959473, -0.0045299530029296875, -0.004280447959899902, -0.004030942916870117, -0.003781437873840332, -0.003531932830810547, -0.0032824277877807617, -0.0030329227447509766, -0.0027834177017211914, -0.0025339126586914062, -0.002284407615661621, -0.002034902572631836, -0.0017853975296020508, -0.0015358924865722656, -0.0012863874435424805, -0.0010368824005126953, -0.0007873773574829102, -0.000537872314453125, -0.00028836727142333984, -3.886222839355469e-05, 0.00021064281463623047, 0.0004601478576660156, 0.0007096529006958008, 0.0009591579437255859, 0.001208662986755371, 0.0014581680297851562, 0.0017076730728149414, 0.0019571781158447266, 0.0022066831588745117, 0.002456188201904297, 0.002705693244934082, 0.002955198287963867, 0.0032047033309936523, 0.0034542083740234375, 0.0037037134170532227, 0.003953218460083008, 0.004202723503112793, 0.004452228546142578, 0.004701733589172363, 0.0049512386322021484, 0.005200743675231934, 0.005450248718261719, 0.005699753761291504, 0.005949258804321289, 0.006198763847351074, 0.006448268890380859, 0.0066977739334106445, 0.00694727897644043, 0.007196784019470215, 0.0074462890625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 6.0, 1.0, 10.0, 11.0, 17.0, 16.0, 17.0, 25.0, 37.0, 48.0, 33.0, 58.0, 65.0, 72.0, 84.0, 93.0, 72.0, 63.0, 61.0, 28.0, 50.0, 19.0, 20.0, 17.0, 13.0, 10.0, 8.0, 6.0, 3.0, 6.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022141853347420692, -0.021349061280488968, -0.020556269213557243, -0.01976347528398037, -0.018970683217048645, -0.01817789115011692, -0.017385099083185196, -0.016592305153608322, -0.015799513086676598, -0.015006721019744873, -0.014213928021490574, -0.01342113595455885, -0.01262834295630455, -0.011835550889372826, -0.011042758822441101, -0.010249965824186802, -0.009457173757255077, -0.008664381690323353, -0.007871588692069054, -0.007078796625137329, -0.00628600362688303, -0.005493211559951305, -0.0047004190273582935, -0.003907626494765282, -0.00311483396217227, -0.002322041429579258, -0.001529249013401568, -0.0007364565972238779, 5.633593536913395e-05, 0.0008491282351315022, 0.001641920767724514, 0.002434713300317526, 0.0032275058329105377, 0.00402029836550355, 0.004813090898096561, 0.005605882965028286, 0.006398675963282585, 0.00719146803021431, 0.007984260097146034, 0.008777053095400333, 0.009569846093654633, 0.010362638160586357, 0.011155431158840656, 0.01194822322577238, 0.01274101622402668, 0.013533808290958405, 0.014326600357890129, 0.015119393356144428, 0.015912186354398727, 0.016704978421330452, 0.017497770488262177, 0.01829056441783905, 0.019083356484770775, 0.0198761485517025, 0.020668940618634224, 0.02146173268556595, 0.022254524752497673, 0.023047316819429398, 0.023840108886361122, 0.024632902815937996, 0.02542569488286972, 0.026218486949801445, 0.02701127901673317, 0.027804072946310043, 0.028596865013241768]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 3.0, 7.0, 17.0, 16.0, 14.0, 19.0, 23.0, 19.0, 22.0, 33.0, 25.0, 27.0, 37.0, 29.0, 41.0, 45.0, 44.0, 37.0, 45.0, 35.0, 41.0, 47.0, 49.0, 33.0, 34.0, 29.0, 22.0, 28.0, 31.0, 17.0, 25.0, 20.0, 13.0, 15.0, 10.0, 8.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020570410415530205, -0.01997828297317028, -0.019386157393455505, -0.01879402995109558, -0.018201902508735657, -0.01760977692902088, -0.017017649486660957, -0.016425523906946182, -0.015833396464586258, -0.015241269953548908, -0.014649143442511559, -0.014057016000151634, -0.013464889489114285, -0.012872762978076935, -0.01228063553571701, -0.01168850902467966, -0.011096382513642311, -0.010504256002604961, -0.009912129491567612, -0.009320002049207687, -0.008727875538170338, -0.008135749027132988, -0.007543622050434351, -0.006951495073735714, -0.006359368562698364, -0.0057672420516610146, -0.0051751150749623775, -0.0045829880982637405, -0.003990861587226391, -0.0033987348433583975, -0.002806608099490404, -0.002214481122791767, -0.0016223546117544174, -0.001030227867886424, -0.0004381011240184307, 0.00015402561984956264, 0.000746152363717556, 0.0013382791075855494, 0.0019304058514535427, 0.0025225328281521797, 0.0031146593391895294, 0.0037067860830575228, 0.004298912826925516, 0.004891039803624153, 0.005483166314661503, 0.0060752928256988525, 0.0066674198023974895, 0.0072595467790961266, 0.007851673290133476, 0.008443799801170826, 0.009035926312208176, 0.0096280537545681, 0.01022018026560545, 0.0108123067766428, 0.011404434219002724, 0.011996560730040073, 0.012588687241077423, 0.013180813752114773, 0.013772940263152122, 0.014365067705512047, 0.014957194216549397, 0.015549320727586746, 0.01614144816994667, 0.016733575612306595, 0.01732570119202137]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 8.0, 8.0, 8.0, 11.0, 11.0, 13.0, 36.0, 42.0, 62.0, 84.0, 95.0, 159.0, 226.0, 367.0, 547.0, 773.0, 1272.0, 1894.0, 3028.0, 4852.0, 8103.0, 14042.0, 25602.0, 51585.0, 118837.0, 382632.0, 254507.0, 88499.0, 40318.0, 20731.0, 11756.0, 6936.0, 4118.0, 2612.0, 1642.0, 1014.0, 717.0, 431.0, 297.0, 210.0, 159.0, 97.0, 61.0, 44.0, 25.0, 27.0, 28.0, 20.0, 5.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0185546875, -0.017911195755004883, -0.017267704010009766, -0.01662421226501465, -0.01598072052001953, -0.015337228775024414, -0.014693737030029297, -0.01405024528503418, -0.013406753540039062, -0.012763261795043945, -0.012119770050048828, -0.011476278305053711, -0.010832786560058594, -0.010189294815063477, -0.00954580307006836, -0.008902311325073242, -0.008258819580078125, -0.007615327835083008, -0.006971836090087891, -0.0063283443450927734, -0.005684852600097656, -0.005041360855102539, -0.004397869110107422, -0.0037543773651123047, -0.0031108856201171875, -0.0024673938751220703, -0.0018239021301269531, -0.001180410385131836, -0.0005369186401367188, 0.00010657310485839844, 0.0007500648498535156, 0.0013935565948486328, 0.00203704833984375, 0.002680540084838867, 0.0033240318298339844, 0.0039675235748291016, 0.004611015319824219, 0.005254507064819336, 0.005897998809814453, 0.00654149055480957, 0.0071849822998046875, 0.007828474044799805, 0.008471965789794922, 0.009115457534790039, 0.009758949279785156, 0.010402441024780273, 0.01104593276977539, 0.011689424514770508, 0.012332916259765625, 0.012976408004760742, 0.01361989974975586, 0.014263391494750977, 0.014906883239746094, 0.015550374984741211, 0.016193866729736328, 0.016837358474731445, 0.017480850219726562, 0.01812434196472168, 0.018767833709716797, 0.019411325454711914, 0.02005481719970703, 0.02069830894470215, 0.021341800689697266, 0.021985292434692383, 0.0226287841796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 16.0, 16.0, 15.0, 23.0, 16.0, 20.0, 23.0, 33.0, 28.0, 42.0, 37.0, 35.0, 38.0, 40.0, 55.0, 48.0, 46.0, 42.0, 55.0, 39.0, 30.0, 41.0, 28.0, 33.0, 19.0, 21.0, 21.0, 31.0, 12.0, 20.0, 20.0, 8.0, 7.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0224151611328125, -0.021768569946289062, -0.021121978759765625, -0.020475387573242188, -0.01982879638671875, -0.019182205200195312, -0.018535614013671875, -0.017889022827148438, -0.017242431640625, -0.016595840454101562, -0.015949249267578125, -0.015302658081054688, -0.01465606689453125, -0.014009475708007812, -0.013362884521484375, -0.012716293334960938, -0.0120697021484375, -0.011423110961914062, -0.010776519775390625, -0.010129928588867188, -0.00948333740234375, -0.008836746215820312, -0.008190155029296875, -0.0075435638427734375, -0.00689697265625, -0.0062503814697265625, -0.005603790283203125, -0.0049571990966796875, -0.00431060791015625, -0.0036640167236328125, -0.003017425537109375, -0.0023708343505859375, -0.0017242431640625, -0.0010776519775390625, -0.000431060791015625, 0.0002155303955078125, 0.00086212158203125, 0.0015087127685546875, 0.002155303955078125, 0.0028018951416015625, 0.003448486328125, 0.0040950775146484375, 0.004741668701171875, 0.0053882598876953125, 0.00603485107421875, 0.0066814422607421875, 0.007328033447265625, 0.007974624633789062, 0.0086212158203125, 0.009267807006835938, 0.009914398193359375, 0.010560989379882812, 0.01120758056640625, 0.011854171752929688, 0.012500762939453125, 0.013147354125976562, 0.0137939453125, 0.014440536499023438, 0.015087127685546875, 0.015733718872070312, 0.01638031005859375, 0.017026901245117188, 0.017673492431640625, 0.018320083618164062, 0.0189666748046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 1.0, 7.0, 10.0, 21.0, 28.0, 27.0, 42.0, 65.0, 98.0, 160.0, 201.0, 360.0, 521.0, 812.0, 1257.0, 2017.0, 3378.0, 5870.0, 11126.0, 25227.0, 85091.0, 743035.0, 111708.0, 28857.0, 12389.0, 6483.0, 3702.0, 2199.0, 1344.0, 847.0, 527.0, 356.0, 266.0, 144.0, 113.0, 77.0, 69.0, 40.0, 18.0, 15.0, 19.0, 10.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04168701171875, -0.04044532775878906, -0.039203643798828125, -0.03796195983886719, -0.03672027587890625, -0.03547859191894531, -0.034236907958984375, -0.03299522399902344, -0.0317535400390625, -0.030511856079101562, -0.029270172119140625, -0.028028488159179688, -0.02678680419921875, -0.025545120239257812, -0.024303436279296875, -0.023061752319335938, -0.021820068359375, -0.020578384399414062, -0.019336700439453125, -0.018095016479492188, -0.01685333251953125, -0.015611648559570312, -0.014369964599609375, -0.013128280639648438, -0.0118865966796875, -0.010644912719726562, -0.009403228759765625, -0.008161544799804688, -0.00691986083984375, -0.0056781768798828125, -0.004436492919921875, -0.0031948089599609375, -0.001953125, -0.0007114410400390625, 0.000530242919921875, 0.0017719268798828125, 0.00301361083984375, 0.0042552947998046875, 0.005496978759765625, 0.0067386627197265625, 0.0079803466796875, 0.009222030639648438, 0.010463714599609375, 0.011705398559570312, 0.01294708251953125, 0.014188766479492188, 0.015430450439453125, 0.016672134399414062, 0.017913818359375, 0.019155502319335938, 0.020397186279296875, 0.021638870239257812, 0.02288055419921875, 0.024122238159179688, 0.025363922119140625, 0.026605606079101562, 0.0278472900390625, 0.029088973999023438, 0.030330657958984375, 0.03157234191894531, 0.03281402587890625, 0.03405570983886719, 0.035297393798828125, 0.03653907775878906, 0.03778076171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 10.0, 3.0, 7.0, 9.0, 10.0, 10.0, 16.0, 11.0, 17.0, 19.0, 26.0, 22.0, 27.0, 28.0, 31.0, 43.0, 32.0, 32.0, 41.0, 38.0, 38.0, 42.0, 46.0, 38.0, 38.0, 34.0, 42.0, 35.0, 25.0, 27.0, 35.0, 33.0, 24.0, 15.0, 24.0, 16.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01015472412109375, -0.009767413139343262, -0.009380102157592773, -0.008992791175842285, -0.008605480194091797, -0.008218169212341309, -0.00783085823059082, -0.007443547248840332, -0.007056236267089844, -0.0066689252853393555, -0.006281614303588867, -0.005894303321838379, -0.005506992340087891, -0.005119681358337402, -0.004732370376586914, -0.004345059394836426, -0.0039577484130859375, -0.0035704374313354492, -0.003183126449584961, -0.0027958154678344727, -0.0024085044860839844, -0.002021193504333496, -0.0016338825225830078, -0.0012465715408325195, -0.0008592605590820312, -0.00047194957733154297, -8.463859558105469e-05, 0.0003026723861694336, 0.0006899833679199219, 0.0010772943496704102, 0.0014646053314208984, 0.0018519163131713867, 0.002239227294921875, 0.0026265382766723633, 0.0030138492584228516, 0.00340116024017334, 0.003788471221923828, 0.004175782203674316, 0.004563093185424805, 0.004950404167175293, 0.005337715148925781, 0.0057250261306762695, 0.006112337112426758, 0.006499648094177246, 0.006886959075927734, 0.007274270057678223, 0.007661581039428711, 0.0080488920211792, 0.008436203002929688, 0.008823513984680176, 0.009210824966430664, 0.009598135948181152, 0.00998544692993164, 0.010372757911682129, 0.010760068893432617, 0.011147379875183105, 0.011534690856933594, 0.011922001838684082, 0.01230931282043457, 0.012696623802185059, 0.013083934783935547, 0.013471245765686035, 0.013858556747436523, 0.014245867729187012, 0.0146331787109375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 14.0, 15.0, 7.0, 14.0, 19.0, 28.0, 31.0, 46.0, 52.0, 115.0, 121.0, 158.0, 228.0, 395.0, 593.0, 1032.0, 1826.0, 3661.0, 8419.0, 26933.0, 691321.0, 275010.0, 23077.0, 7659.0, 3306.0, 1683.0, 960.0, 598.0, 362.0, 257.0, 159.0, 132.0, 79.0, 80.0, 38.0, 23.0, 16.0, 22.0, 15.0, 17.0, 9.0, 4.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.006374359130859375, -0.006168365478515625, -0.005962371826171875, -0.005756378173828125, -0.005550384521484375, -0.005344390869140625, -0.005138397216796875, -0.004932403564453125, -0.004726409912109375, -0.004520416259765625, -0.004314422607421875, -0.004108428955078125, -0.003902435302734375, -0.003696441650390625, -0.003490447998046875, -0.003284454345703125, -0.003078460693359375, -0.002872467041015625, -0.002666473388671875, -0.002460479736328125, -0.002254486083984375, -0.002048492431640625, -0.001842498779296875, -0.001636505126953125, -0.001430511474609375, -0.001224517822265625, -0.001018524169921875, -0.000812530517578125, -0.000606536865234375, -0.000400543212890625, -0.000194549560546875, 1.1444091796875e-05, 0.000217437744140625, 0.000423431396484375, 0.000629425048828125, 0.000835418701171875, 0.001041412353515625, 0.001247406005859375, 0.001453399658203125, 0.001659393310546875, 0.001865386962890625, 0.002071380615234375, 0.002277374267578125, 0.002483367919921875, 0.002689361572265625, 0.002895355224609375, 0.003101348876953125, 0.003307342529296875, 0.003513336181640625, 0.003719329833984375, 0.003925323486328125, 0.004131317138671875, 0.004337310791015625, 0.004543304443359375, 0.004749298095703125, 0.004955291748046875, 0.005161285400390625, 0.005367279052734375, 0.005573272705078125, 0.005779266357421875, 0.005985260009765625, 0.006191253662109375, 0.006397247314453125, 0.006603240966796875, 0.006809234619140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 6.0, 12.0, 16.0, 0.0, 22.0, 28.0, 37.0, 0.0, 46.0, 51.0, 70.0, 0.0, 82.0, 90.0, 94.0, 0.0, 93.0, 91.0, 68.0, 0.0, 55.0, 40.0, 30.0, 0.0, 23.0, 13.0, 11.0, 0.0, 10.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5050172805786133e-06, -1.4603137969970703e-06, -1.4156103134155273e-06, -1.3709068298339844e-06, -1.3262033462524414e-06, -1.2814998626708984e-06, -1.2367963790893555e-06, -1.1920928955078125e-06, -1.1473894119262695e-06, -1.1026859283447266e-06, -1.0579824447631836e-06, -1.0132789611816406e-06, -9.685754776000977e-07, -9.238719940185547e-07, -8.791685104370117e-07, -8.344650268554688e-07, -7.897615432739258e-07, -7.450580596923828e-07, -7.003545761108398e-07, -6.556510925292969e-07, -6.109476089477539e-07, -5.662441253662109e-07, -5.21540641784668e-07, -4.76837158203125e-07, -4.3213367462158203e-07, -3.8743019104003906e-07, -3.427267074584961e-07, -2.980232238769531e-07, -2.5331974029541016e-07, -2.086162567138672e-07, -1.6391277313232422e-07, -1.1920928955078125e-07, -7.450580596923828e-08, -2.9802322387695312e-08, 1.4901161193847656e-08, 5.960464477539063e-08, 1.043081283569336e-07, 1.4901161193847656e-07, 1.9371509552001953e-07, 2.384185791015625e-07, 2.8312206268310547e-07, 3.2782554626464844e-07, 3.725290298461914e-07, 4.172325134277344e-07, 4.6193599700927734e-07, 5.066394805908203e-07, 5.513429641723633e-07, 5.960464477539062e-07, 6.407499313354492e-07, 6.854534149169922e-07, 7.301568984985352e-07, 7.748603820800781e-07, 8.195638656616211e-07, 8.642673492431641e-07, 9.08970832824707e-07, 9.5367431640625e-07, 9.98377799987793e-07, 1.043081283569336e-06, 1.087784767150879e-06, 1.1324882507324219e-06, 1.1771917343139648e-06, 1.2218952178955078e-06, 1.2665987014770508e-06, 1.3113021850585938e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 4.0, 17.0, 19.0, 22.0, 43.0, 45.0, 69.0, 76.0, 153.0, 185.0, 289.0, 430.0, 657.0, 1146.0, 2192.0, 5023.0, 14436.0, 63438.0, 778008.0, 144514.0, 23685.0, 7321.0, 2997.0, 1424.0, 782.0, 478.0, 320.0, 243.0, 141.0, 116.0, 76.0, 55.0, 39.0, 29.0, 21.0, 22.0, 7.0, 6.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007411956787109375, -0.007185220718383789, -0.006958484649658203, -0.006731748580932617, -0.006505012512207031, -0.006278276443481445, -0.006051540374755859, -0.0058248043060302734, -0.0055980682373046875, -0.0053713321685791016, -0.005144596099853516, -0.00491786003112793, -0.004691123962402344, -0.004464387893676758, -0.004237651824951172, -0.004010915756225586, -0.0037841796875, -0.003557443618774414, -0.003330707550048828, -0.003103971481323242, -0.0028772354125976562, -0.0026504993438720703, -0.0024237632751464844, -0.0021970272064208984, -0.0019702911376953125, -0.0017435550689697266, -0.0015168190002441406, -0.0012900829315185547, -0.0010633468627929688, -0.0008366107940673828, -0.0006098747253417969, -0.00038313865661621094, -0.000156402587890625, 7.033348083496094e-05, 0.0002970695495605469, 0.0005238056182861328, 0.0007505416870117188, 0.0009772777557373047, 0.0012040138244628906, 0.0014307498931884766, 0.0016574859619140625, 0.0018842220306396484, 0.0021109580993652344, 0.0023376941680908203, 0.0025644302368164062, 0.002791166305541992, 0.003017902374267578, 0.003244638442993164, 0.00347137451171875, 0.003698110580444336, 0.003924846649169922, 0.004151582717895508, 0.004378318786621094, 0.00460505485534668, 0.004831790924072266, 0.0050585269927978516, 0.0052852630615234375, 0.0055119991302490234, 0.005738735198974609, 0.005965471267700195, 0.006192207336425781, 0.006418943405151367, 0.006645679473876953, 0.006872415542602539, 0.007099151611328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 9.0, 16.0, 22.0, 29.0, 64.0, 115.0, 316.0, 199.0, 88.0, 54.0, 22.0, 13.0, 19.0, 6.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001361846923828125, -0.001320376992225647, -0.001278907060623169, -0.001237437129020691, -0.0011959671974182129, -0.0011544972658157349, -0.0011130273342132568, -0.0010715574026107788, -0.0010300874710083008, -0.0009886175394058228, -0.0009471476078033447, -0.0009056776762008667, -0.0008642077445983887, -0.0008227378129959106, -0.0007812678813934326, -0.0007397979497909546, -0.0006983280181884766, -0.0006568580865859985, -0.0006153881549835205, -0.0005739182233810425, -0.0005324482917785645, -0.0004909783601760864, -0.0004495084285736084, -0.00040803849697113037, -0.00036656856536865234, -0.0003250986337661743, -0.0002836287021636963, -0.00024215877056121826, -0.00020068883895874023, -0.0001592189073562622, -0.00011774897575378418, -7.627904415130615e-05, -3.4809112548828125e-05, 6.660819053649902e-06, 4.813075065612793e-05, 8.960068225860596e-05, 0.00013107061386108398, 0.000172540545463562, 0.00021401047706604004, 0.00025548040866851807, 0.0002969503402709961, 0.0003384202718734741, 0.00037989020347595215, 0.0004213601350784302, 0.0004628300666809082, 0.0005042999982833862, 0.0005457699298858643, 0.0005872398614883423, 0.0006287097930908203, 0.0006701797246932983, 0.0007116496562957764, 0.0007531195878982544, 0.0007945895195007324, 0.0008360594511032104, 0.0008775293827056885, 0.0009189993143081665, 0.0009604692459106445, 0.0010019391775131226, 0.0010434091091156006, 0.0010848790407180786, 0.0011263489723205566, 0.0011678189039230347, 0.0012092888355255127, 0.0012507587671279907, 0.0012922286987304688]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 11.0, 11.0, 13.0, 18.0, 17.0, 23.0, 30.0, 38.0, 42.0, 56.0, 81.0, 58.0, 99.0, 93.0, 77.0, 67.0, 61.0, 41.0, 32.0, 23.0, 16.0, 17.0, 14.0, 12.0, 7.0, 5.0, 2.0, 1.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021865997463464737, -0.02105432003736496, -0.020242640748620033, -0.019430963322520256, -0.01861928403377533, -0.017807606607675552, -0.016995927318930626, -0.01618424989283085, -0.015372570604085922, -0.01456089224666357, -0.013749213889241219, -0.012937535531818867, -0.012125857174396515, -0.011314179748296738, -0.010502500459551811, -0.009690823033452034, -0.008879144676029682, -0.00806746631860733, -0.0072557879611849785, -0.006444109603762627, -0.005632431246340275, -0.00482075335457921, -0.0040090749971568584, -0.0031973966397345066, -0.0023857182823121548, -0.001574039924889803, -0.0007623616838827729, 4.931655712425709e-05, 0.0008609949145466089, 0.001672673039138317, 0.002484351396560669, 0.0032960297539830208, 0.004107708111405373, 0.0049193864688277245, 0.005731064826250076, 0.006542743183672428, 0.00735442154109478, 0.008166098967194557, 0.008977778255939484, 0.00978945568203926, 0.010601134970784187, 0.01141281332820654, 0.012224491685628891, 0.013036170043051243, 0.013847848400473595, 0.014659525826573372, 0.015471205115318298, 0.016282882541418076, 0.017094559967517853, 0.01790623739361763, 0.018717916682362556, 0.019529594108462334, 0.02034127339720726, 0.021152950823307037, 0.021964630112051964, 0.02277630753815174, 0.023587986826896667, 0.024399664252996445, 0.02521134354174137, 0.02602302096784115, 0.026834700256586075, 0.027646377682685852, 0.02845805697143078, 0.029269734397530556, 0.030081413686275482]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 3.0, 9.0, 16.0, 17.0, 15.0, 20.0, 21.0, 18.0, 24.0, 26.0, 31.0, 31.0, 38.0, 23.0, 51.0, 36.0, 47.0, 37.0, 44.0, 36.0, 39.0, 44.0, 54.0, 36.0, 29.0, 31.0, 21.0, 27.0, 32.0, 14.0, 28.0, 18.0, 14.0, 14.0, 10.0, 8.0, 6.0, 9.0, 5.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020207522436976433, -0.019622666761279106, -0.01903780922293663, -0.018452953547239304, -0.017868097871541977, -0.01728324219584465, -0.016698384657502174, -0.016113528981804848, -0.015528672374784946, -0.014943815767765045, -0.014358960092067719, -0.013774103485047817, -0.013189246878027916, -0.01260439120233059, -0.012019534595310688, -0.011434677988290787, -0.01084982231259346, -0.010264965705573559, -0.009680110029876232, -0.009095253422856331, -0.008510397747159004, -0.007925541140139103, -0.007340684533119202, -0.006755828391760588, -0.006170972250401974, -0.00558611610904336, -0.005001259967684746, -0.0044164033606648445, -0.0038315472193062305, -0.0032466910779476166, -0.002661834703758359, -0.0020769783295691013, -0.0014921203255653381, -0.0009072640677914023, -0.00032240781001746655, 0.00026244844775646925, 0.000847304705530405, 0.001432160846889019, 0.0020170172210782766, 0.0026018735952675343, 0.0031867297366261482, 0.003771585877984762, 0.004356442019343376, 0.0049412986263632774, 0.005526154767721891, 0.006111010909080505, 0.006695867516100407, 0.007280723657459021, 0.007865579798817635, 0.008450436405837536, 0.009035292081534863, 0.009620148688554764, 0.01020500436425209, 0.010789860971271992, 0.011374717578291893, 0.01195957325398922, 0.012544429861009121, 0.013129286468029022, 0.013714142143726349, 0.01429899875074625, 0.014883855357766151, 0.015468711033463478, 0.016053566709160805, 0.01663842424750328, 0.017223279923200607]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 13.0, 23.0, 43.0, 54.0, 82.0, 118.0, 188.0, 267.0, 348.0, 504.0, 738.0, 1079.0, 1496.0, 2219.0, 3176.0, 4705.0, 6735.0, 9973.0, 14559.0, 22243.0, 33891.0, 53773.0, 87582.0, 150481.0, 238004.0, 159927.0, 92567.0, 56654.0, 35796.0, 22933.0, 15440.0, 10201.0, 7072.0, 4761.0, 3336.0, 2260.0, 1636.0, 1193.0, 820.0, 515.0, 353.0, 263.0, 193.0, 121.0, 58.0, 45.0, 35.0, 19.0, 15.0, 13.0, 9.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.0291290283203125, -0.02817559242248535, -0.027222156524658203, -0.026268720626831055, -0.025315284729003906, -0.024361848831176758, -0.02340841293334961, -0.02245497703552246, -0.021501541137695312, -0.020548105239868164, -0.019594669342041016, -0.018641233444213867, -0.01768779754638672, -0.01673436164855957, -0.015780925750732422, -0.014827489852905273, -0.013874053955078125, -0.012920618057250977, -0.011967182159423828, -0.01101374626159668, -0.010060310363769531, -0.009106874465942383, -0.008153438568115234, -0.007200002670288086, -0.0062465667724609375, -0.005293130874633789, -0.004339694976806641, -0.003386259078979492, -0.0024328231811523438, -0.0014793872833251953, -0.0005259513854980469, 0.00042748451232910156, 0.00138092041015625, 0.0023343563079833984, 0.003287792205810547, 0.004241228103637695, 0.005194664001464844, 0.006148099899291992, 0.007101535797119141, 0.008054971694946289, 0.009008407592773438, 0.009961843490600586, 0.010915279388427734, 0.011868715286254883, 0.012822151184082031, 0.01377558708190918, 0.014729022979736328, 0.015682458877563477, 0.016635894775390625, 0.017589330673217773, 0.018542766571044922, 0.01949620246887207, 0.02044963836669922, 0.021403074264526367, 0.022356510162353516, 0.023309946060180664, 0.024263381958007812, 0.02521681785583496, 0.02617025375366211, 0.027123689651489258, 0.028077125549316406, 0.029030561447143555, 0.029983997344970703, 0.03093743324279785, 0.031890869140625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 9.0, 5.0, 9.0, 11.0, 17.0, 21.0, 11.0, 16.0, 25.0, 28.0, 26.0, 29.0, 31.0, 40.0, 34.0, 39.0, 37.0, 49.0, 35.0, 51.0, 47.0, 55.0, 42.0, 34.0, 37.0, 41.0, 28.0, 25.0, 25.0, 22.0, 20.0, 25.0, 8.0, 12.0, 9.0, 11.0, 6.0, 8.0, 9.0, 4.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0179595947265625, -0.017437219619750977, -0.016914844512939453, -0.01639246940612793, -0.015870094299316406, -0.015347719192504883, -0.01482534408569336, -0.014302968978881836, -0.013780593872070312, -0.013258218765258789, -0.012735843658447266, -0.012213468551635742, -0.011691093444824219, -0.011168718338012695, -0.010646343231201172, -0.010123968124389648, -0.009601593017578125, -0.009079217910766602, -0.008556842803955078, -0.008034467697143555, -0.007512092590332031, -0.006989717483520508, -0.006467342376708984, -0.005944967269897461, -0.0054225921630859375, -0.004900217056274414, -0.004377841949462891, -0.003855466842651367, -0.0033330917358398438, -0.0028107166290283203, -0.002288341522216797, -0.0017659664154052734, -0.00124359130859375, -0.0007212162017822266, -0.00019884109497070312, 0.0003235340118408203, 0.0008459091186523438, 0.0013682842254638672, 0.0018906593322753906, 0.002413034439086914, 0.0029354095458984375, 0.003457784652709961, 0.003980159759521484, 0.004502534866333008, 0.005024909973144531, 0.005547285079956055, 0.006069660186767578, 0.0065920352935791016, 0.007114410400390625, 0.0076367855072021484, 0.008159160614013672, 0.008681535720825195, 0.009203910827636719, 0.009726285934448242, 0.010248661041259766, 0.010771036148071289, 0.011293411254882812, 0.011815786361694336, 0.01233816146850586, 0.012860536575317383, 0.013382911682128906, 0.01390528678894043, 0.014427661895751953, 0.014950037002563477, 0.015472412109375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 7.0, 6.0, 10.0, 6.0, 25.0, 26.0, 47.0, 53.0, 84.0, 124.0, 194.0, 290.0, 399.0, 590.0, 931.0, 1271.0, 2127.0, 3150.0, 4905.0, 7694.0, 12217.0, 19848.0, 32565.0, 55039.0, 93205.0, 171914.0, 271082.0, 154048.0, 85780.0, 50650.0, 29966.0, 18526.0, 11306.0, 7313.0, 4621.0, 2868.0, 1908.0, 1245.0, 842.0, 528.0, 353.0, 254.0, 183.0, 117.0, 74.0, 52.0, 29.0, 25.0, 24.0, 8.0, 18.0, 4.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.035369873046875, -0.03427886962890625, -0.0331878662109375, -0.03209686279296875, -0.031005859375, -0.02991485595703125, -0.0288238525390625, -0.02773284912109375, -0.026641845703125, -0.02555084228515625, -0.0244598388671875, -0.02336883544921875, -0.02227783203125, -0.02118682861328125, -0.0200958251953125, -0.01900482177734375, -0.017913818359375, -0.01682281494140625, -0.0157318115234375, -0.01464080810546875, -0.0135498046875, -0.01245880126953125, -0.0113677978515625, -0.01027679443359375, -0.009185791015625, -0.00809478759765625, -0.0070037841796875, -0.00591278076171875, -0.00482177734375, -0.00373077392578125, -0.0026397705078125, -0.00154876708984375, -0.000457763671875, 0.00063323974609375, 0.0017242431640625, 0.00281524658203125, 0.00390625, 0.00499725341796875, 0.0060882568359375, 0.00717926025390625, 0.008270263671875, 0.00936126708984375, 0.0104522705078125, 0.01154327392578125, 0.01263427734375, 0.01372528076171875, 0.0148162841796875, 0.01590728759765625, 0.016998291015625, 0.01808929443359375, 0.0191802978515625, 0.02027130126953125, 0.0213623046875, 0.02245330810546875, 0.0235443115234375, 0.02463531494140625, 0.025726318359375, 0.02681732177734375, 0.0279083251953125, 0.02899932861328125, 0.03009033203125, 0.03118133544921875, 0.0322723388671875, 0.03336334228515625, 0.034454345703125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 0.0, 0.0, 6.0, 5.0, 6.0, 5.0, 11.0, 11.0, 15.0, 11.0, 20.0, 20.0, 21.0, 17.0, 28.0, 21.0, 32.0, 46.0, 31.0, 34.0, 35.0, 42.0, 45.0, 38.0, 33.0, 34.0, 44.0, 26.0, 31.0, 37.0, 44.0, 36.0, 18.0, 23.0, 28.0, 21.0, 22.0, 15.0, 10.0, 13.0, 14.0, 6.0, 10.0, 7.0, 13.0, 5.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.01025390625, -0.009952306747436523, -0.009650707244873047, -0.00934910774230957, -0.009047508239746094, -0.008745908737182617, -0.00844430923461914, -0.008142709732055664, -0.007841110229492188, -0.007539510726928711, -0.007237911224365234, -0.006936311721801758, -0.006634712219238281, -0.006333112716674805, -0.006031513214111328, -0.0057299137115478516, -0.005428314208984375, -0.0051267147064208984, -0.004825115203857422, -0.004523515701293945, -0.004221916198730469, -0.003920316696166992, -0.0036187171936035156, -0.003317117691040039, -0.0030155181884765625, -0.002713918685913086, -0.0024123191833496094, -0.002110719680786133, -0.0018091201782226562, -0.0015075206756591797, -0.0012059211730957031, -0.0009043216705322266, -0.00060272216796875, -0.00030112266540527344, 4.76837158203125e-07, 0.0003020763397216797, 0.0006036758422851562, 0.0009052753448486328, 0.0012068748474121094, 0.001508474349975586, 0.0018100738525390625, 0.002111673355102539, 0.0024132728576660156, 0.002714872360229492, 0.0030164718627929688, 0.0033180713653564453, 0.003619670867919922, 0.0039212703704833984, 0.004222869873046875, 0.0045244693756103516, 0.004826068878173828, 0.005127668380737305, 0.005429267883300781, 0.005730867385864258, 0.006032466888427734, 0.006334066390991211, 0.0066356658935546875, 0.006937265396118164, 0.007238864898681641, 0.007540464401245117, 0.007842063903808594, 0.00814366340637207, 0.008445262908935547, 0.008746862411499023, 0.0090484619140625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 5.0, 17.0, 21.0, 12.0, 25.0, 47.0, 86.0, 104.0, 136.0, 170.0, 295.0, 385.0, 502.0, 710.0, 1052.0, 1524.0, 2326.0, 3524.0, 5437.0, 8889.0, 16142.0, 31441.0, 94911.0, 646754.0, 147859.0, 38726.0, 18671.0, 10512.0, 6264.0, 3878.0, 2552.0, 1669.0, 1243.0, 736.0, 513.0, 397.0, 288.0, 198.0, 136.0, 114.0, 87.0, 77.0, 40.0, 22.0, 19.0, 16.0, 13.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0016117095947265625, -0.0015607476234436035, -0.0015097856521606445, -0.0014588236808776855, -0.0014078617095947266, -0.0013568997383117676, -0.0013059377670288086, -0.0012549757957458496, -0.0012040138244628906, -0.0011530518531799316, -0.0011020898818969727, -0.0010511279106140137, -0.0010001659393310547, -0.0009492039680480957, -0.0008982419967651367, -0.0008472800254821777, -0.0007963180541992188, -0.0007453560829162598, -0.0006943941116333008, -0.0006434321403503418, -0.0005924701690673828, -0.0005415081977844238, -0.0004905462265014648, -0.00043958425521850586, -0.0003886222839355469, -0.0003376603126525879, -0.0002866983413696289, -0.00023573637008666992, -0.00018477439880371094, -0.00013381242752075195, -8.285045623779297e-05, -3.1888484954833984e-05, 1.9073486328125e-05, 7.003545761108398e-05, 0.00012099742889404297, 0.00017195940017700195, 0.00022292137145996094, 0.0002738833427429199, 0.0003248453140258789, 0.0003758072853088379, 0.0004267692565917969, 0.00047773122787475586, 0.0005286931991577148, 0.0005796551704406738, 0.0006306171417236328, 0.0006815791130065918, 0.0007325410842895508, 0.0007835030555725098, 0.0008344650268554688, 0.0008854269981384277, 0.0009363889694213867, 0.0009873509407043457, 0.0010383129119873047, 0.0010892748832702637, 0.0011402368545532227, 0.0011911988258361816, 0.0012421607971191406, 0.0012931227684020996, 0.0013440847396850586, 0.0013950467109680176, 0.0014460086822509766, 0.0014969706535339355, 0.0015479326248168945, 0.0015988945960998535, 0.0016498565673828125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 4.0, 7.0, 8.0, 9.0, 0.0, 16.0, 19.0, 44.0, 44.0, 81.0, 0.0, 87.0, 113.0, 101.0, 109.0, 82.0, 86.0, 0.0, 53.0, 47.0, 29.0, 26.0, 9.0, 0.0, 8.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6782432794570923e-06, -1.6279518604278564e-06, -1.5776604413986206e-06, -1.5273690223693848e-06, -1.477077603340149e-06, -1.426786184310913e-06, -1.3764947652816772e-06, -1.3262033462524414e-06, -1.2759119272232056e-06, -1.2256205081939697e-06, -1.1753290891647339e-06, -1.125037670135498e-06, -1.0747462511062622e-06, -1.0244548320770264e-06, -9.741634130477905e-07, -9.238719940185547e-07, -8.735805749893188e-07, -8.23289155960083e-07, -7.729977369308472e-07, -7.227063179016113e-07, -6.724148988723755e-07, -6.221234798431396e-07, -5.718320608139038e-07, -5.21540641784668e-07, -4.7124922275543213e-07, -4.209578037261963e-07, -3.7066638469696045e-07, -3.203749656677246e-07, -2.7008354663848877e-07, -2.1979212760925293e-07, -1.695007085800171e-07, -1.1920928955078125e-07, -6.891787052154541e-08, -1.862645149230957e-08, 3.166496753692627e-08, 8.195638656616211e-08, 1.3224780559539795e-07, 1.825392246246338e-07, 2.3283064365386963e-07, 2.8312206268310547e-07, 3.334134817123413e-07, 3.8370490074157715e-07, 4.33996319770813e-07, 4.842877388000488e-07, 5.345791578292847e-07, 5.848705768585205e-07, 6.351619958877563e-07, 6.854534149169922e-07, 7.35744833946228e-07, 7.860362529754639e-07, 8.363276720046997e-07, 8.866190910339355e-07, 9.369105100631714e-07, 9.872019290924072e-07, 1.037493348121643e-06, 1.087784767150879e-06, 1.1380761861801147e-06, 1.1883676052093506e-06, 1.2386590242385864e-06, 1.2889504432678223e-06, 1.339241862297058e-06, 1.389533281326294e-06, 1.4398247003555298e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 5.0, 8.0, 19.0, 20.0, 28.0, 36.0, 49.0, 61.0, 65.0, 126.0, 176.0, 256.0, 427.0, 815.0, 1523.0, 3033.0, 6672.0, 15951.0, 47077.0, 560020.0, 343535.0, 41588.0, 14705.0, 6197.0, 2785.0, 1397.0, 721.0, 397.0, 249.0, 154.0, 136.0, 63.0, 67.0, 48.0, 32.0, 25.0, 23.0, 21.0, 6.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0024852752685546875, -0.0024074912071228027, -0.002329707145690918, -0.002251923084259033, -0.0021741390228271484, -0.0020963549613952637, -0.002018570899963379, -0.0019407868385314941, -0.0018630027770996094, -0.0017852187156677246, -0.0017074346542358398, -0.001629650592803955, -0.0015518665313720703, -0.0014740824699401855, -0.0013962984085083008, -0.001318514347076416, -0.0012407302856445312, -0.0011629462242126465, -0.0010851621627807617, -0.001007378101348877, -0.0009295940399169922, -0.0008518099784851074, -0.0007740259170532227, -0.0006962418556213379, -0.0006184577941894531, -0.0005406737327575684, -0.0004628896713256836, -0.00038510560989379883, -0.00030732154846191406, -0.0002295374870300293, -0.00015175342559814453, -7.396936416625977e-05, 3.814697265625e-06, 8.159875869750977e-05, 0.00015938282012939453, 0.0002371668815612793, 0.00031495094299316406, 0.00039273500442504883, 0.0004705190658569336, 0.0005483031272888184, 0.0006260871887207031, 0.0007038712501525879, 0.0007816553115844727, 0.0008594393730163574, 0.0009372234344482422, 0.001015007495880127, 0.0010927915573120117, 0.0011705756187438965, 0.0012483596801757812, 0.001326143741607666, 0.0014039278030395508, 0.0014817118644714355, 0.0015594959259033203, 0.001637279987335205, 0.0017150640487670898, 0.0017928481101989746, 0.0018706321716308594, 0.0019484162330627441, 0.002026200294494629, 0.0021039843559265137, 0.0021817684173583984, 0.002259552478790283, 0.002337336540222168, 0.0024151206016540527, 0.0024929046630859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 7.0, 6.0, 9.0, 16.0, 10.0, 28.0, 38.0, 39.0, 92.0, 210.0, 312.0, 99.0, 39.0, 23.0, 23.0, 17.0, 13.0, 6.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00070953369140625, -0.000687427818775177, -0.000665321946144104, -0.000643216073513031, -0.000621110200881958, -0.000599004328250885, -0.000576898455619812, -0.000554792582988739, -0.000532686710357666, -0.000510580837726593, -0.00048847496509552, -0.000466369092464447, -0.000444263219833374, -0.000422157347202301, -0.00040005147457122803, -0.00037794560194015503, -0.00035583972930908203, -0.00033373385667800903, -0.00031162798404693604, -0.00028952211141586304, -0.00026741623878479004, -0.00024531036615371704, -0.00022320449352264404, -0.00020109862089157104, -0.00017899274826049805, -0.00015688687562942505, -0.00013478100299835205, -0.00011267513036727905, -9.056925773620605e-05, -6.846338510513306e-05, -4.635751247406006e-05, -2.425163984298706e-05, -2.1457672119140625e-06, 1.9960105419158936e-05, 4.2065978050231934e-05, 6.417185068130493e-05, 8.627772331237793e-05, 0.00010838359594345093, 0.00013048946857452393, 0.00015259534120559692, 0.00017470121383666992, 0.00019680708646774292, 0.00021891295909881592, 0.00024101883172988892, 0.0002631247043609619, 0.0002852305769920349, 0.0003073364496231079, 0.0003294423222541809, 0.0003515481948852539, 0.0003736540675163269, 0.0003957599401473999, 0.0004178658127784729, 0.0004399716854095459, 0.0004620775580406189, 0.0004841834306716919, 0.0005062893033027649, 0.0005283951759338379, 0.0005505010485649109, 0.0005726069211959839, 0.0005947127938270569, 0.0006168186664581299, 0.0006389245390892029, 0.0006610304117202759, 0.0006831362843513489, 0.0007052421569824219]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 7.0, 8.0, 8.0, 17.0, 14.0, 30.0, 19.0, 35.0, 40.0, 53.0, 64.0, 56.0, 93.0, 107.0, 84.0, 77.0, 59.0, 54.0, 35.0, 31.0, 16.0, 18.0, 9.0, 6.0, 10.0, 8.0, 5.0, 5.0, 6.0, 0.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.01990484818816185, -0.019156500697135925, -0.01840815506875515, -0.017659807577729225, -0.01691146194934845, -0.016163114458322525, -0.01541476882994175, -0.014666421338915825, -0.01391807571053505, -0.0131697291508317, -0.01242138259112835, -0.011673036031425, -0.01092468947172165, -0.010176342912018299, -0.009427996352314949, -0.008679648861289024, -0.007931302301585674, -0.007182955741882324, -0.006434609182178974, -0.005686262622475624, -0.004937916062772274, -0.004189569503068924, -0.0034412224777042866, -0.0026928759180009365, -0.0019445293582975864, -0.0011961827985942364, -0.0004478361224755645, 0.0003005105536431074, 0.0010488571133464575, 0.0017972036730498075, 0.0025455504655838013, 0.0032938970252871513, 0.004042243584990501, 0.0047905901446938515, 0.0055389367043972015, 0.006287283264100552, 0.007035629823803902, 0.007783976383507252, 0.008532322943210602, 0.009280670434236526, 0.010029016062617302, 0.010777362622320652, 0.011525709182024002, 0.012274055741727352, 0.013022402301430702, 0.013770748861134052, 0.014519095420837402, 0.015267442911863327, 0.01601579040288925, 0.016764137893915176, 0.017512483522295952, 0.018260831013321877, 0.019009176641702652, 0.019757524132728577, 0.020505869761109352, 0.021254217252135277, 0.022002562880516052, 0.022750910371541977, 0.023499255999922752, 0.024247603490948677, 0.024995949119329453, 0.025744296610355377, 0.026492642238736153, 0.027240989729762077, 0.027989335358142853]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 5.0, 9.0, 16.0, 9.0, 9.0, 16.0, 13.0, 20.0, 22.0, 23.0, 25.0, 21.0, 32.0, 36.0, 32.0, 35.0, 37.0, 44.0, 50.0, 45.0, 41.0, 45.0, 46.0, 39.0, 30.0, 34.0, 29.0, 32.0, 18.0, 20.0, 31.0, 21.0, 20.0, 17.0, 16.0, 8.0, 10.0, 7.0, 11.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01770825870335102, -0.01717531494796276, -0.01664237305521965, -0.01610942929983139, -0.01557648554444313, -0.015043542720377445, -0.01451059989631176, -0.0139776561409235, -0.013444713316857815, -0.01291177049279213, -0.01237882673740387, -0.011845883913338184, -0.011312941089272499, -0.01077999733388424, -0.010247054509818554, -0.009714111685752869, -0.009181167930364609, -0.008648225106298923, -0.008115281350910664, -0.007582338526844978, -0.007049395237118006, -0.006516451947391033, -0.005983509123325348, -0.005450565833598375, -0.004917622543871403, -0.00438467925414443, -0.0038517361972481012, -0.0033187931403517723, -0.0027858498506247997, -0.002252906560897827, -0.0017199635040014982, -0.0011870204471051693, -0.000654079020023346, -0.0001211358467116952, 0.00041180732659995556, 0.0009447504999116063, 0.001477693673223257, 0.0020106369629502296, 0.0025435800198465586, 0.0030765230767428875, 0.00360946636646986, 0.004142409656196833, 0.004675352945923805, 0.0052082957699894905, 0.005741239059716463, 0.006274182349443436, 0.006807125173509121, 0.0073400684632360935, 0.007873011752963066, 0.008405954577028751, 0.008938898332417011, 0.009471841156482697, 0.010004784911870956, 0.010537727735936642, 0.011070670560002327, 0.011603614315390587, 0.012136557139456272, 0.012669499963521957, 0.013202443718910217, 0.013735386542975903, 0.014268329367041588, 0.014801273122429848, 0.015334215946495533, 0.015867158770561218, 0.016400102525949478]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 13.0, 7.0, 17.0, 41.0, 54.0, 80.0, 127.0, 155.0, 237.0, 339.0, 532.0, 808.0, 1094.0, 1585.0, 2230.0, 3312.0, 4899.0, 6978.0, 10625.0, 16311.0, 25687.0, 41479.0, 70077.0, 127631.0, 268566.0, 859368.0, 1671560.0, 597862.0, 214078.0, 108291.0, 61075.0, 36440.0, 22393.0, 13990.0, 8919.0, 5773.0, 3846.0, 2512.0, 1661.0, 1103.0, 791.0, 518.0, 372.0, 235.0, 206.0, 124.0, 78.0, 72.0, 44.0, 31.0, 23.0, 18.0, 8.0, 7.0, 4.0, 4.0, 2.0], "bins": [-0.0218658447265625, -0.021210432052612305, -0.02055501937866211, -0.019899606704711914, -0.01924419403076172, -0.018588781356811523, -0.017933368682861328, -0.017277956008911133, -0.016622543334960938, -0.015967130661010742, -0.015311717987060547, -0.014656305313110352, -0.014000892639160156, -0.013345479965209961, -0.012690067291259766, -0.01203465461730957, -0.011379241943359375, -0.01072382926940918, -0.010068416595458984, -0.009413003921508789, -0.008757591247558594, -0.008102178573608398, -0.007446765899658203, -0.006791353225708008, -0.0061359405517578125, -0.005480527877807617, -0.004825115203857422, -0.0041697025299072266, -0.0035142898559570312, -0.002858877182006836, -0.0022034645080566406, -0.0015480518341064453, -0.00089263916015625, -0.0002372264862060547, 0.0004181861877441406, 0.001073598861694336, 0.0017290115356445312, 0.0023844242095947266, 0.003039836883544922, 0.003695249557495117, 0.0043506622314453125, 0.005006074905395508, 0.005661487579345703, 0.0063169002532958984, 0.006972312927246094, 0.007627725601196289, 0.008283138275146484, 0.00893855094909668, 0.009593963623046875, 0.01024937629699707, 0.010904788970947266, 0.011560201644897461, 0.012215614318847656, 0.012871026992797852, 0.013526439666748047, 0.014181852340698242, 0.014837265014648438, 0.015492677688598633, 0.016148090362548828, 0.016803503036499023, 0.01745891571044922, 0.018114328384399414, 0.01876974105834961, 0.019425153732299805, 0.02008056640625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 4.0, 10.0, 9.0, 24.0, 15.0, 19.0, 25.0, 24.0, 27.0, 28.0, 31.0, 35.0, 23.0, 48.0, 46.0, 56.0, 43.0, 47.0, 45.0, 46.0, 44.0, 35.0, 29.0, 37.0, 32.0, 29.0, 22.0, 32.0, 18.0, 15.0, 15.0, 14.0, 12.0, 14.0, 10.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01117706298828125, -0.01085364818572998, -0.010530233383178711, -0.010206818580627441, -0.009883403778076172, -0.009559988975524902, -0.009236574172973633, -0.008913159370422363, -0.008589744567871094, -0.008266329765319824, -0.007942914962768555, -0.007619500160217285, -0.007296085357666016, -0.006972670555114746, -0.0066492557525634766, -0.006325840950012207, -0.0060024261474609375, -0.005679011344909668, -0.0053555965423583984, -0.005032181739807129, -0.004708766937255859, -0.00438535213470459, -0.00406193733215332, -0.0037385225296020508, -0.0034151077270507812, -0.0030916929244995117, -0.002768278121948242, -0.0024448633193969727, -0.002121448516845703, -0.0017980337142944336, -0.001474618911743164, -0.0011512041091918945, -0.000827789306640625, -0.0005043745040893555, -0.00018095970153808594, 0.0001424551010131836, 0.0004658699035644531, 0.0007892847061157227, 0.0011126995086669922, 0.0014361143112182617, 0.0017595291137695312, 0.0020829439163208008, 0.0024063587188720703, 0.00272977352142334, 0.0030531883239746094, 0.003376603126525879, 0.0037000179290771484, 0.004023432731628418, 0.0043468475341796875, 0.004670262336730957, 0.0049936771392822266, 0.005317091941833496, 0.005640506744384766, 0.005963921546936035, 0.006287336349487305, 0.006610751152038574, 0.006934165954589844, 0.007257580757141113, 0.007580995559692383, 0.007904410362243652, 0.008227825164794922, 0.008551239967346191, 0.008874654769897461, 0.00919806957244873, 0.009521484375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 12.0, 14.0, 38.0, 41.0, 88.0, 97.0, 172.0, 283.0, 434.0, 677.0, 1118.0, 1755.0, 2672.0, 4523.0, 7521.0, 12302.0, 21185.0, 37481.0, 68298.0, 132644.0, 274632.0, 657691.0, 1602754.0, 749693.0, 302980.0, 144227.0, 74246.0, 40376.0, 22698.0, 12954.0, 7941.0, 4764.0, 2989.0, 1825.0, 1129.0, 729.0, 471.0, 296.0, 208.0, 102.0, 76.0, 56.0, 25.0, 19.0, 16.0, 12.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0173492431640625, -0.01678156852722168, -0.01621389389038086, -0.01564621925354004, -0.015078544616699219, -0.014510869979858398, -0.013943195343017578, -0.013375520706176758, -0.012807846069335938, -0.012240171432495117, -0.011672496795654297, -0.011104822158813477, -0.010537147521972656, -0.009969472885131836, -0.009401798248291016, -0.008834123611450195, -0.008266448974609375, -0.007698774337768555, -0.007131099700927734, -0.006563425064086914, -0.005995750427246094, -0.0054280757904052734, -0.004860401153564453, -0.004292726516723633, -0.0037250518798828125, -0.003157377243041992, -0.002589702606201172, -0.0020220279693603516, -0.0014543533325195312, -0.0008866786956787109, -0.0003190040588378906, 0.0002486705780029297, 0.00081634521484375, 0.0013840198516845703, 0.0019516944885253906, 0.002519369125366211, 0.0030870437622070312, 0.0036547183990478516, 0.004222393035888672, 0.004790067672729492, 0.0053577423095703125, 0.005925416946411133, 0.006493091583251953, 0.0070607662200927734, 0.007628440856933594, 0.008196115493774414, 0.008763790130615234, 0.009331464767456055, 0.009899139404296875, 0.010466814041137695, 0.011034488677978516, 0.011602163314819336, 0.012169837951660156, 0.012737512588500977, 0.013305187225341797, 0.013872861862182617, 0.014440536499023438, 0.015008211135864258, 0.015575885772705078, 0.0161435604095459, 0.01671123504638672, 0.01727890968322754, 0.01784658432006836, 0.01841425895690918, 0.01898193359375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 5.0, 6.0, 13.0, 12.0, 17.0, 17.0, 22.0, 21.0, 34.0, 40.0, 47.0, 54.0, 79.0, 92.0, 95.0, 135.0, 149.0, 181.0, 212.0, 221.0, 273.0, 304.0, 319.0, 276.0, 218.0, 189.0, 177.0, 152.0, 131.0, 119.0, 79.0, 65.0, 61.0, 47.0, 44.0, 39.0, 31.0, 23.0, 11.0, 19.0, 12.0, 9.0, 4.0, 8.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00568389892578125, -0.005521237850189209, -0.005358576774597168, -0.005195915699005127, -0.005033254623413086, -0.004870593547821045, -0.004707932472229004, -0.004545271396636963, -0.004382610321044922, -0.004219949245452881, -0.00405728816986084, -0.003894627094268799, -0.003731966018676758, -0.003569304943084717, -0.0034066438674926758, -0.0032439827919006348, -0.0030813217163085938, -0.0029186606407165527, -0.0027559995651245117, -0.0025933384895324707, -0.0024306774139404297, -0.0022680163383483887, -0.0021053552627563477, -0.0019426941871643066, -0.0017800331115722656, -0.0016173720359802246, -0.0014547109603881836, -0.0012920498847961426, -0.0011293888092041016, -0.0009667277336120605, -0.0008040666580200195, -0.0006414055824279785, -0.0004787445068359375, -0.0003160834312438965, -0.00015342235565185547, 9.238719940185547e-06, 0.00017189979553222656, 0.0003345608711242676, 0.0004972219467163086, 0.0006598830223083496, 0.0008225440979003906, 0.0009852051734924316, 0.0011478662490844727, 0.0013105273246765137, 0.0014731884002685547, 0.0016358494758605957, 0.0017985105514526367, 0.0019611716270446777, 0.0021238327026367188, 0.0022864937782287598, 0.0024491548538208008, 0.002611815929412842, 0.002774477005004883, 0.002937138080596924, 0.003099799156188965, 0.003262460231781006, 0.003425121307373047, 0.003587782382965088, 0.003750443458557129, 0.00391310453414917, 0.004075765609741211, 0.004238426685333252, 0.004401087760925293, 0.004563748836517334, 0.004726409912109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 7.0, 4.0, 7.0, 19.0, 19.0, 26.0, 30.0, 36.0, 39.0, 53.0, 67.0, 71.0, 93.0, 81.0, 98.0, 58.0, 66.0, 36.0, 43.0, 19.0, 25.0, 23.0, 10.0, 10.0, 11.0, 9.0, 7.0, 7.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.011549476534128189, -0.011093901470303535, -0.010638326406478882, -0.010182751342654228, -0.009727176278829575, -0.009271601215004921, -0.008816026151180267, -0.008360451087355614, -0.00790487602353096, -0.0074493009597063065, -0.006993725895881653, -0.006538150832056999, -0.006082575768232346, -0.005627000704407692, -0.005171425640583038, -0.004715850576758385, -0.004260275512933731, -0.0038047004491090775, -0.003349125385284424, -0.00289355032145977, -0.0024379752576351166, -0.001982400193810463, -0.0015268251299858093, -0.0010712500661611557, -0.0006156750023365021, -0.00016009993851184845, 0.0002954751253128052, 0.0007510501891374588, 0.0012066252529621124, 0.001662200316786766, 0.0021177753806114197, 0.0025733504444360733, 0.003028925508260727, 0.0034845005720853806, 0.003940075635910034, 0.004395650699734688, 0.004851225763559341, 0.005306800827383995, 0.005762375891208649, 0.006217950955033302, 0.006673526018857956, 0.0071291010826826096, 0.007584676146507263, 0.008040251210331917, 0.00849582627415657, 0.008951401337981224, 0.009406976401805878, 0.009862551465630531, 0.010318126529455185, 0.010773701593279839, 0.011229276657104492, 0.011684851720929146, 0.0121404267847538, 0.012596001848578453, 0.013051576912403107, 0.01350715197622776, 0.013962727040052414, 0.014418302103877068, 0.014873877167701721, 0.015329452231526375, 0.01578502729535103, 0.016240602359175682, 0.016696177423000336, 0.01715175248682499, 0.017607327550649643]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 9.0, 9.0, 14.0, 14.0, 20.0, 21.0, 29.0, 36.0, 20.0, 29.0, 30.0, 41.0, 43.0, 40.0, 39.0, 40.0, 40.0, 41.0, 42.0, 42.0, 47.0, 44.0, 37.0, 34.0, 31.0, 24.0, 26.0, 26.0, 18.0, 14.0, 9.0, 17.0, 7.0, 7.0, 4.0, 5.0, 11.0, 5.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.011295566335320473, -0.010952138341963291, -0.01060871034860611, -0.010265281423926353, -0.009921853430569172, -0.00957842543721199, -0.009234997443854809, -0.008891569450497627, -0.008548140525817871, -0.00820471253246069, -0.007861284539103508, -0.007517856080085039, -0.00717442762106657, -0.006830999627709389, -0.006487571634352207, -0.006144143640995026, -0.005800715647637844, -0.0054572876542806625, -0.005113859195262194, -0.004770431201905012, -0.004427002742886543, -0.004083574749529362, -0.00374014675617218, -0.003396718529984355, -0.0030532903037965298, -0.0027098620776087046, -0.0023664338514208794, -0.002023005858063698, -0.0016795776318758726, -0.0013361494056880474, -0.0009927214123308659, -0.0006492931861430407, -0.00030586402863264084, 3.756413934752345e-05, 0.00038099230732768774, 0.0007244204171001911, 0.0010678486432880163, 0.0014112768694758415, 0.001754704862833023, 0.0020981330890208483, 0.0024415613152086735, 0.0027849895413964987, 0.003128417767584324, 0.0034718457609415054, 0.0038152739871293306, 0.004158702213317156, 0.004502130206674337, 0.004845558665692806, 0.005188986659049988, 0.005532414652407169, 0.005875843111425638, 0.00621927110478282, 0.006562699563801289, 0.00690612755715847, 0.007249555550515652, 0.007592983543872833, 0.00793641246855259, 0.008279840461909771, 0.008623268455266953, 0.008966697379946709, 0.00931012537330389, 0.009653553366661072, 0.009996981360018253, 0.010340409353375435, 0.010683837346732616]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 9.0, 12.0, 21.0, 39.0, 30.0, 55.0, 91.0, 157.0, 203.0, 328.0, 506.0, 850.0, 1223.0, 2197.0, 3529.0, 6041.0, 10532.0, 19522.0, 36925.0, 75365.0, 190286.0, 426244.0, 142630.0, 61724.0, 30884.0, 16574.0, 9119.0, 5373.0, 3080.0, 1873.0, 1100.0, 729.0, 437.0, 287.0, 192.0, 132.0, 75.0, 52.0, 29.0, 29.0, 15.0, 10.0, 17.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01313018798828125, -0.012697815895080566, -0.012265443801879883, -0.0118330717086792, -0.011400699615478516, -0.010968327522277832, -0.010535955429077148, -0.010103583335876465, -0.009671211242675781, -0.009238839149475098, -0.008806467056274414, -0.00837409496307373, -0.007941722869873047, -0.007509350776672363, -0.00707697868347168, -0.006644606590270996, -0.0062122344970703125, -0.005779862403869629, -0.005347490310668945, -0.004915118217468262, -0.004482746124267578, -0.0040503740310668945, -0.003618001937866211, -0.0031856298446655273, -0.0027532577514648438, -0.00232088565826416, -0.0018885135650634766, -0.001456141471862793, -0.0010237693786621094, -0.0005913972854614258, -0.0001590251922607422, 0.0002733469009399414, 0.000705718994140625, 0.0011380910873413086, 0.0015704631805419922, 0.0020028352737426758, 0.0024352073669433594, 0.002867579460144043, 0.0032999515533447266, 0.00373232364654541, 0.004164695739746094, 0.004597067832946777, 0.005029439926147461, 0.0054618120193481445, 0.005894184112548828, 0.006326556205749512, 0.006758928298950195, 0.007191300392150879, 0.0076236724853515625, 0.008056044578552246, 0.00848841667175293, 0.008920788764953613, 0.009353160858154297, 0.00978553295135498, 0.010217905044555664, 0.010650277137756348, 0.011082649230957031, 0.011515021324157715, 0.011947393417358398, 0.012379765510559082, 0.012812137603759766, 0.01324450969696045, 0.013676881790161133, 0.014109253883361816, 0.0145416259765625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 7.0, 7.0, 6.0, 12.0, 14.0, 12.0, 16.0, 19.0, 32.0, 29.0, 28.0, 23.0, 33.0, 47.0, 38.0, 41.0, 49.0, 35.0, 33.0, 45.0, 60.0, 42.0, 51.0, 48.0, 30.0, 29.0, 35.0, 33.0, 26.0, 13.0, 17.0, 20.0, 18.0, 6.0, 3.0, 9.0, 9.0, 3.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01242828369140625, -0.012061476707458496, -0.011694669723510742, -0.011327862739562988, -0.010961055755615234, -0.01059424877166748, -0.010227441787719727, -0.009860634803771973, -0.009493827819824219, -0.009127020835876465, -0.008760213851928711, -0.008393406867980957, -0.008026599884033203, -0.007659792900085449, -0.007292985916137695, -0.006926178932189941, -0.0065593719482421875, -0.006192564964294434, -0.00582575798034668, -0.005458950996398926, -0.005092144012451172, -0.004725337028503418, -0.004358530044555664, -0.00399172306060791, -0.0036249160766601562, -0.0032581090927124023, -0.0028913021087646484, -0.0025244951248168945, -0.0021576881408691406, -0.0017908811569213867, -0.0014240741729736328, -0.001057267189025879, -0.000690460205078125, -0.0003236532211303711, 4.315376281738281e-05, 0.0004099607467651367, 0.0007767677307128906, 0.0011435747146606445, 0.0015103816986083984, 0.0018771886825561523, 0.0022439956665039062, 0.00261080265045166, 0.002977609634399414, 0.003344416618347168, 0.003711223602294922, 0.004078030586242676, 0.00444483757019043, 0.004811644554138184, 0.0051784515380859375, 0.005545258522033691, 0.005912065505981445, 0.006278872489929199, 0.006645679473876953, 0.007012486457824707, 0.007379293441772461, 0.007746100425720215, 0.008112907409667969, 0.008479714393615723, 0.008846521377563477, 0.00921332836151123, 0.009580135345458984, 0.009946942329406738, 0.010313749313354492, 0.010680556297302246, 0.01104736328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 20.0, 24.0, 22.0, 41.0, 52.0, 82.0, 119.0, 165.0, 220.0, 336.0, 499.0, 693.0, 875.0, 1292.0, 1834.0, 2600.0, 3986.0, 6360.0, 10547.0, 19907.0, 44047.0, 198491.0, 617155.0, 74113.0, 27684.0, 14096.0, 7996.0, 4960.0, 3126.0, 2121.0, 1469.0, 1032.0, 770.0, 518.0, 372.0, 257.0, 212.0, 134.0, 98.0, 53.0, 61.0, 43.0, 23.0, 16.0, 4.0, 8.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0189666748046875, -0.01839590072631836, -0.01782512664794922, -0.017254352569580078, -0.016683578491210938, -0.016112804412841797, -0.015542030334472656, -0.014971256256103516, -0.014400482177734375, -0.013829708099365234, -0.013258934020996094, -0.012688159942626953, -0.012117385864257812, -0.011546611785888672, -0.010975837707519531, -0.01040506362915039, -0.00983428955078125, -0.00926351547241211, -0.008692741394042969, -0.008121967315673828, -0.0075511932373046875, -0.006980419158935547, -0.006409645080566406, -0.005838871002197266, -0.005268096923828125, -0.004697322845458984, -0.004126548767089844, -0.003555774688720703, -0.0029850006103515625, -0.002414226531982422, -0.0018434524536132812, -0.0012726783752441406, -0.000701904296875, -0.00013113021850585938, 0.00043964385986328125, 0.0010104179382324219, 0.0015811920166015625, 0.002151966094970703, 0.0027227401733398438, 0.0032935142517089844, 0.003864288330078125, 0.004435062408447266, 0.005005836486816406, 0.005576610565185547, 0.0061473846435546875, 0.006718158721923828, 0.007288932800292969, 0.00785970687866211, 0.00843048095703125, 0.00900125503540039, 0.009572029113769531, 0.010142803192138672, 0.010713577270507812, 0.011284351348876953, 0.011855125427246094, 0.012425899505615234, 0.012996673583984375, 0.013567447662353516, 0.014138221740722656, 0.014708995819091797, 0.015279769897460938, 0.015850543975830078, 0.01642131805419922, 0.01699209213256836, 0.0175628662109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 3.0, 7.0, 12.0, 11.0, 10.0, 22.0, 20.0, 18.0, 24.0, 31.0, 28.0, 35.0, 29.0, 33.0, 30.0, 49.0, 49.0, 54.0, 46.0, 37.0, 44.0, 46.0, 42.0, 45.0, 32.0, 45.0, 35.0, 24.0, 27.0, 21.0, 20.0, 13.0, 7.0, 11.0, 7.0, 10.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00865936279296875, -0.008424758911132812, -0.008190155029296875, -0.007955551147460938, -0.007720947265625, -0.0074863433837890625, -0.007251739501953125, -0.0070171356201171875, -0.00678253173828125, -0.0065479278564453125, -0.006313323974609375, -0.0060787200927734375, -0.0058441162109375, -0.0056095123291015625, -0.005374908447265625, -0.0051403045654296875, -0.00490570068359375, -0.0046710968017578125, -0.004436492919921875, -0.0042018890380859375, -0.00396728515625, -0.0037326812744140625, -0.003498077392578125, -0.0032634735107421875, -0.00302886962890625, -0.0027942657470703125, -0.002559661865234375, -0.0023250579833984375, -0.0020904541015625, -0.0018558502197265625, -0.001621246337890625, -0.0013866424560546875, -0.00115203857421875, -0.0009174346923828125, -0.000682830810546875, -0.0004482269287109375, -0.000213623046875, 2.09808349609375e-05, 0.000255584716796875, 0.0004901885986328125, 0.00072479248046875, 0.0009593963623046875, 0.001194000244140625, 0.0014286041259765625, 0.0016632080078125, 0.0018978118896484375, 0.002132415771484375, 0.0023670196533203125, 0.00260162353515625, 0.0028362274169921875, 0.003070831298828125, 0.0033054351806640625, 0.0035400390625, 0.0037746429443359375, 0.004009246826171875, 0.0042438507080078125, 0.00447845458984375, 0.0047130584716796875, 0.004947662353515625, 0.0051822662353515625, 0.0054168701171875, 0.0056514739990234375, 0.005886077880859375, 0.0061206817626953125, 0.00635528564453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 13.0, 21.0, 25.0, 26.0, 40.0, 51.0, 66.0, 116.0, 180.0, 202.0, 325.0, 432.0, 704.0, 947.0, 1538.0, 2317.0, 3660.0, 6328.0, 11555.0, 24607.0, 73559.0, 709557.0, 142382.0, 34571.0, 15142.0, 7754.0, 4383.0, 2717.0, 1733.0, 1112.0, 809.0, 476.0, 357.0, 258.0, 180.0, 132.0, 79.0, 48.0, 50.0, 26.0, 17.0, 16.0, 16.0, 11.0, 2.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0021533966064453125, -0.00208321213722229, -0.0020130276679992676, -0.0019428431987762451, -0.0018726587295532227, -0.0018024742603302002, -0.0017322897911071777, -0.0016621053218841553, -0.0015919208526611328, -0.0015217363834381104, -0.0014515519142150879, -0.0013813674449920654, -0.001311182975769043, -0.0012409985065460205, -0.001170814037322998, -0.0011006295680999756, -0.0010304450988769531, -0.0009602606296539307, -0.0008900761604309082, -0.0008198916912078857, -0.0007497072219848633, -0.0006795227527618408, -0.0006093382835388184, -0.0005391538143157959, -0.00046896934509277344, -0.000398784875869751, -0.0003286004066467285, -0.00025841593742370605, -0.0001882314682006836, -0.00011804699897766113, -4.786252975463867e-05, 2.232193946838379e-05, 9.250640869140625e-05, 0.0001626908779144287, 0.00023287534713745117, 0.00030305981636047363, 0.0003732442855834961, 0.00044342875480651855, 0.000513613224029541, 0.0005837976932525635, 0.0006539821624755859, 0.0007241666316986084, 0.0007943511009216309, 0.0008645355701446533, 0.0009347200393676758, 0.0010049045085906982, 0.0010750889778137207, 0.0011452734470367432, 0.0012154579162597656, 0.001285642385482788, 0.0013558268547058105, 0.001426011323928833, 0.0014961957931518555, 0.001566380262374878, 0.0016365647315979004, 0.0017067492008209229, 0.0017769336700439453, 0.0018471181392669678, 0.0019173026084899902, 0.0019874870777130127, 0.002057671546936035, 0.0021278560161590576, 0.00219804048538208, 0.0022682249546051025, 0.002338409423828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 8.0, 6.0, 6.0, 18.0, 14.0, 14.0, 30.0, 26.0, 38.0, 58.0, 0.0, 60.0, 81.0, 74.0, 80.0, 74.0, 70.0, 72.0, 51.0, 47.0, 44.0, 23.0, 24.0, 15.0, 8.0, 13.0, 0.0, 8.0, 8.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.911073923110962e-06, -1.8551945686340332e-06, -1.7993152141571045e-06, -1.7434358596801758e-06, -1.687556505203247e-06, -1.6316771507263184e-06, -1.5757977962493896e-06, -1.519918441772461e-06, -1.4640390872955322e-06, -1.4081597328186035e-06, -1.3522803783416748e-06, -1.296401023864746e-06, -1.2405216693878174e-06, -1.1846423149108887e-06, -1.12876296043396e-06, -1.0728836059570312e-06, -1.0170042514801025e-06, -9.611248970031738e-07, -9.052455425262451e-07, -8.493661880493164e-07, -7.934868335723877e-07, -7.37607479095459e-07, -6.817281246185303e-07, -6.258487701416016e-07, -5.699694156646729e-07, -5.140900611877441e-07, -4.5821070671081543e-07, -4.023313522338867e-07, -3.46451997756958e-07, -2.905726432800293e-07, -2.3469328880310059e-07, -1.7881393432617188e-07, -1.2293457984924316e-07, -6.705522537231445e-08, -1.1175870895385742e-08, 4.470348358154297e-08, 1.0058283805847168e-07, 1.564621925354004e-07, 2.123415470123291e-07, 2.682209014892578e-07, 3.241002559661865e-07, 3.7997961044311523e-07, 4.3585896492004395e-07, 4.917383193969727e-07, 5.476176738739014e-07, 6.034970283508301e-07, 6.593763828277588e-07, 7.152557373046875e-07, 7.711350917816162e-07, 8.270144462585449e-07, 8.828938007354736e-07, 9.387731552124023e-07, 9.94652509689331e-07, 1.0505318641662598e-06, 1.1064112186431885e-06, 1.1622905731201172e-06, 1.218169927597046e-06, 1.2740492820739746e-06, 1.3299286365509033e-06, 1.385807991027832e-06, 1.4416873455047607e-06, 1.4975666999816895e-06, 1.5534460544586182e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 13.0, 11.0, 15.0, 31.0, 60.0, 76.0, 114.0, 184.0, 266.0, 463.0, 766.0, 1361.0, 2384.0, 4498.0, 9019.0, 19659.0, 45809.0, 123637.0, 523632.0, 199403.0, 65425.0, 26528.0, 12188.0, 5869.0, 3044.0, 1750.0, 920.0, 526.0, 322.0, 208.0, 125.0, 61.0, 59.0, 38.0, 24.0, 24.0, 11.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00283050537109375, -0.0027512013912200928, -0.0026718974113464355, -0.0025925934314727783, -0.002513289451599121, -0.002433985471725464, -0.0023546814918518066, -0.0022753775119781494, -0.002196073532104492, -0.002116769552230835, -0.0020374655723571777, -0.0019581615924835205, -0.0018788576126098633, -0.001799553632736206, -0.0017202496528625488, -0.0016409456729888916, -0.0015616416931152344, -0.0014823377132415771, -0.00140303373336792, -0.0013237297534942627, -0.0012444257736206055, -0.0011651217937469482, -0.001085817813873291, -0.0010065138339996338, -0.0009272098541259766, -0.0008479058742523193, -0.0007686018943786621, -0.0006892979145050049, -0.0006099939346313477, -0.0005306899547576904, -0.0004513859748840332, -0.000372081995010376, -0.00029277801513671875, -0.00021347403526306152, -0.0001341700553894043, -5.486607551574707e-05, 2.4437904357910156e-05, 0.00010374188423156738, 0.0001830458641052246, 0.00026234984397888184, 0.00034165382385253906, 0.0004209578037261963, 0.0005002617835998535, 0.0005795657634735107, 0.000658869743347168, 0.0007381737232208252, 0.0008174777030944824, 0.0008967816829681396, 0.0009760856628417969, 0.001055389642715454, 0.0011346936225891113, 0.0012139976024627686, 0.0012933015823364258, 0.001372605562210083, 0.0014519095420837402, 0.0015312135219573975, 0.0016105175018310547, 0.001689821481704712, 0.0017691254615783691, 0.0018484294414520264, 0.0019277334213256836, 0.002007037401199341, 0.002086341381072998, 0.0021656453609466553, 0.0022449493408203125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 7.0, 4.0, 8.0, 7.0, 18.0, 23.0, 18.0, 33.0, 27.0, 38.0, 42.0, 47.0, 69.0, 107.0, 111.0, 68.0, 75.0, 57.0, 32.0, 30.0, 26.0, 36.0, 17.0, 15.0, 16.0, 7.0, 8.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.00069427490234375, -0.0006765797734260559, -0.0006588846445083618, -0.0006411895155906677, -0.0006234943866729736, -0.0006057992577552795, -0.0005881041288375854, -0.0005704089999198914, -0.0005527138710021973, -0.0005350187420845032, -0.0005173236131668091, -0.000499628484249115, -0.0004819333553314209, -0.0004642382264137268, -0.0004465430974960327, -0.0004288479685783386, -0.00041115283966064453, -0.00039345771074295044, -0.00037576258182525635, -0.00035806745290756226, -0.00034037232398986816, -0.00032267719507217407, -0.00030498206615448, -0.0002872869372367859, -0.0002695918083190918, -0.0002518966794013977, -0.0002342015504837036, -0.00021650642156600952, -0.00019881129264831543, -0.00018111616373062134, -0.00016342103481292725, -0.00014572590589523315, -0.00012803077697753906, -0.00011033564805984497, -9.264051914215088e-05, -7.494539022445679e-05, -5.7250261306762695e-05, -3.9555132389068604e-05, -2.1860003471374512e-05, -4.16487455368042e-06, 1.3530254364013672e-05, 3.1225383281707764e-05, 4.8920512199401855e-05, 6.661564111709595e-05, 8.431077003479004e-05, 0.00010200589895248413, 0.00011970102787017822, 0.00013739615678787231, 0.0001550912857055664, 0.0001727864146232605, 0.0001904815435409546, 0.00020817667245864868, 0.00022587180137634277, 0.00024356693029403687, 0.00026126205921173096, 0.00027895718812942505, 0.00029665231704711914, 0.00031434744596481323, 0.0003320425748825073, 0.0003497377038002014, 0.0003674328327178955, 0.0003851279616355896, 0.0004028230905532837, 0.0004205182194709778, 0.0004382133483886719]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 1.0, 0.0, 4.0, 6.0, 6.0, 8.0, 9.0, 19.0, 30.0, 24.0, 36.0, 39.0, 59.0, 77.0, 91.0, 107.0, 109.0, 70.0, 69.0, 55.0, 42.0, 32.0, 22.0, 16.0, 13.0, 13.0, 18.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014816348440945148, -0.01430505234748125, -0.013793757185339928, -0.01328246109187603, -0.012771164998412132, -0.012259868904948235, -0.011748573742806911, -0.011237277649343014, -0.01072598248720169, -0.010214686393737793, -0.00970339123159647, -0.009192095138132572, -0.008680799044668674, -0.008169503882527351, -0.007658207789063454, -0.007146911695599556, -0.006635615602135658, -0.006124319974333048, -0.00561302388086915, -0.00510172825306654, -0.004590432159602642, -0.004079136531800032, -0.0035678409039974213, -0.003056545043364167, -0.002545249182730913, -0.002033953322097659, -0.0015226575778797269, -0.0010113618336617947, -0.0005000659730285406, 1.122988760471344e-05, 0.0005225255154073238, 0.0010338213760405779, 0.0015451163053512573, 0.0020564121659845114, 0.0025677080266177654, 0.003079003654420376, 0.00359029951505363, 0.004101595375686884, 0.004612891003489494, 0.005124187096953392, 0.005635482724756002, 0.006146778352558613, 0.0066580744460225105, 0.007169370073825121, 0.007680665701627731, 0.008191961795091629, 0.008703257888555527, 0.00921455305069685, 0.009725849144160748, 0.010237145237624645, 0.010748440399765968, 0.011259736493229866, 0.011771032586693764, 0.012282328680157661, 0.012793623842298985, 0.013304919935762882, 0.013816215097904205, 0.014327511191368103, 0.014838806353509426, 0.015350102446973324, 0.015861397609114647, 0.016372693702578545, 0.016883989796042442, 0.01739528588950634, 0.017906581982970238]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 12.0, 7.0, 8.0, 12.0, 15.0, 14.0, 19.0, 23.0, 38.0, 30.0, 23.0, 30.0, 34.0, 46.0, 32.0, 46.0, 43.0, 36.0, 44.0, 37.0, 46.0, 48.0, 39.0, 42.0, 38.0, 33.0, 26.0, 26.0, 28.0, 23.0, 13.0, 14.0, 11.0, 11.0, 8.0, 6.0, 2.0, 12.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01140633039176464, -0.011064806953072548, -0.01072328444570303, -0.010381761007010937, -0.010040238499641418, -0.009698715060949326, -0.009357191622257233, -0.009015669114887714, -0.008674146607518196, -0.008332623168826103, -0.007991100661456585, -0.007649577222764492, -0.007308054715394974, -0.006966531276702881, -0.006625008303672075, -0.00628348533064127, -0.005941961891949177, -0.005600438918918371, -0.005258915945887566, -0.004917392507195473, -0.0045758699998259544, -0.0042343465611338615, -0.003892823588103056, -0.0035513006150722504, -0.0032097776420414448, -0.002868254669010639, -0.0025267316959798336, -0.0021852084901183844, -0.0018436855170875788, -0.0015021625440567732, -0.001160639338195324, -0.0008191163651645184, -0.0004775943234562874, -0.00013607129221782088, 0.00020545173902064562, 0.000546974828466773, 0.0008884978014975786, 0.0012300207745283842, 0.0015715439803898335, 0.001913066953420639, 0.0022545899264514446, 0.00259611289948225, 0.002937635872513056, 0.003279159078374505, 0.0036206820514053106, 0.0039622047916054726, 0.0043037282302975655, 0.004645251203328371, 0.004986774176359177, 0.005328297149389982, 0.005669820122420788, 0.006011343561112881, 0.006352866068482399, 0.006694389507174492, 0.0070359124802052975, 0.007377435453236103, 0.007718958426266909, 0.008060481399297714, 0.008402004837989807, 0.008743527345359325, 0.009085050784051418, 0.009426573291420937, 0.00976809673011303, 0.010109620168805122, 0.01045114267617464]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 15.0, 15.0, 19.0, 22.0, 40.0, 68.0, 105.0, 138.0, 195.0, 285.0, 418.0, 577.0, 893.0, 1250.0, 1858.0, 2684.0, 4006.0, 6106.0, 9063.0, 14045.0, 21549.0, 34937.0, 56694.0, 98869.0, 198730.0, 263755.0, 136389.0, 73275.0, 44126.0, 27226.0, 17480.0, 11192.0, 7426.0, 4945.0, 3210.0, 2214.0, 1492.0, 1002.0, 685.0, 474.0, 334.0, 236.0, 156.0, 105.0, 90.0, 44.0, 47.0, 22.0, 19.0, 16.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01922607421875, -0.018610715866088867, -0.017995357513427734, -0.0173799991607666, -0.01676464080810547, -0.016149282455444336, -0.015533924102783203, -0.01491856575012207, -0.014303207397460938, -0.013687849044799805, -0.013072490692138672, -0.012457132339477539, -0.011841773986816406, -0.011226415634155273, -0.01061105728149414, -0.009995698928833008, -0.009380340576171875, -0.008764982223510742, -0.00814962387084961, -0.0075342655181884766, -0.006918907165527344, -0.006303548812866211, -0.005688190460205078, -0.005072832107543945, -0.0044574737548828125, -0.0038421154022216797, -0.003226757049560547, -0.002611398696899414, -0.0019960403442382812, -0.0013806819915771484, -0.0007653236389160156, -0.0001499652862548828, 0.00046539306640625, 0.0010807514190673828, 0.0016961097717285156, 0.0023114681243896484, 0.0029268264770507812, 0.003542184829711914, 0.004157543182373047, 0.00477290153503418, 0.0053882598876953125, 0.006003618240356445, 0.006618976593017578, 0.007234334945678711, 0.007849693298339844, 0.008465051651000977, 0.00908041000366211, 0.009695768356323242, 0.010311126708984375, 0.010926485061645508, 0.01154184341430664, 0.012157201766967773, 0.012772560119628906, 0.013387918472290039, 0.014003276824951172, 0.014618635177612305, 0.015233993530273438, 0.01584935188293457, 0.016464710235595703, 0.017080068588256836, 0.01769542694091797, 0.0183107852935791, 0.018926143646240234, 0.019541501998901367, 0.0201568603515625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 11.0, 21.0, 19.0, 25.0, 23.0, 28.0, 22.0, 30.0, 32.0, 42.0, 44.0, 30.0, 44.0, 47.0, 40.0, 39.0, 64.0, 37.0, 41.0, 46.0, 34.0, 40.0, 30.0, 25.0, 23.0, 22.0, 20.0, 13.0, 12.0, 10.0, 7.0, 12.0, 5.0, 3.0, 10.0, 1.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0102691650390625, -0.009965658187866211, -0.009662151336669922, -0.009358644485473633, -0.009055137634277344, -0.008751630783081055, -0.008448123931884766, -0.008144617080688477, -0.007841110229492188, -0.0075376033782958984, -0.007234096527099609, -0.00693058967590332, -0.006627082824707031, -0.006323575973510742, -0.006020069122314453, -0.005716562271118164, -0.005413055419921875, -0.005109548568725586, -0.004806041717529297, -0.004502534866333008, -0.004199028015136719, -0.0038955211639404297, -0.0035920143127441406, -0.0032885074615478516, -0.0029850006103515625, -0.0026814937591552734, -0.0023779869079589844, -0.0020744800567626953, -0.0017709732055664062, -0.0014674663543701172, -0.0011639595031738281, -0.0008604526519775391, -0.00055694580078125, -0.00025343894958496094, 5.0067901611328125e-05, 0.0003535747528076172, 0.0006570816040039062, 0.0009605884552001953, 0.0012640953063964844, 0.0015676021575927734, 0.0018711090087890625, 0.0021746158599853516, 0.0024781227111816406, 0.0027816295623779297, 0.0030851364135742188, 0.003388643264770508, 0.003692150115966797, 0.003995656967163086, 0.004299163818359375, 0.004602670669555664, 0.004906177520751953, 0.005209684371948242, 0.005513191223144531, 0.00581669807434082, 0.006120204925537109, 0.0064237117767333984, 0.0067272186279296875, 0.0070307254791259766, 0.007334232330322266, 0.007637739181518555, 0.007941246032714844, 0.008244752883911133, 0.008548259735107422, 0.008851766586303711, 0.0091552734375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 7.0, 6.0, 18.0, 30.0, 37.0, 77.0, 121.0, 167.0, 280.0, 470.0, 792.0, 1335.0, 2176.0, 3761.0, 6645.0, 11426.0, 20612.0, 37906.0, 71979.0, 151648.0, 324427.0, 210492.0, 96084.0, 47872.0, 26094.0, 14398.0, 8322.0, 4645.0, 2741.0, 1614.0, 921.0, 558.0, 330.0, 223.0, 128.0, 86.0, 38.0, 31.0, 20.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023895263671875, -0.0231168270111084, -0.022338390350341797, -0.021559953689575195, -0.020781517028808594, -0.020003080368041992, -0.01922464370727539, -0.01844620704650879, -0.017667770385742188, -0.016889333724975586, -0.016110897064208984, -0.015332460403442383, -0.014554023742675781, -0.01377558708190918, -0.012997150421142578, -0.012218713760375977, -0.011440277099609375, -0.010661840438842773, -0.009883403778076172, -0.00910496711730957, -0.008326530456542969, -0.007548093795776367, -0.006769657135009766, -0.005991220474243164, -0.0052127838134765625, -0.004434347152709961, -0.0036559104919433594, -0.002877473831176758, -0.0020990371704101562, -0.0013206005096435547, -0.0005421638488769531, 0.00023627281188964844, 0.00101470947265625, 0.0017931461334228516, 0.002571582794189453, 0.0033500194549560547, 0.004128456115722656, 0.004906892776489258, 0.005685329437255859, 0.006463766098022461, 0.0072422027587890625, 0.008020639419555664, 0.008799076080322266, 0.009577512741088867, 0.010355949401855469, 0.01113438606262207, 0.011912822723388672, 0.012691259384155273, 0.013469696044921875, 0.014248132705688477, 0.015026569366455078, 0.01580500602722168, 0.01658344268798828, 0.017361879348754883, 0.018140316009521484, 0.018918752670288086, 0.019697189331054688, 0.02047562599182129, 0.02125406265258789, 0.022032499313354492, 0.022810935974121094, 0.023589372634887695, 0.024367809295654297, 0.0251462459564209, 0.0259246826171875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 7.0, 13.0, 12.0, 14.0, 19.0, 19.0, 22.0, 25.0, 32.0, 34.0, 42.0, 42.0, 43.0, 41.0, 36.0, 39.0, 36.0, 43.0, 38.0, 37.0, 43.0, 46.0, 43.0, 37.0, 22.0, 23.0, 22.0, 28.0, 23.0, 19.0, 18.0, 10.0, 12.0, 13.0, 7.0, 5.0, 8.0, 1.0, 7.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004962921142578125, -0.004770994186401367, -0.004579067230224609, -0.0043871402740478516, -0.004195213317871094, -0.004003286361694336, -0.003811359405517578, -0.0036194324493408203, -0.0034275054931640625, -0.0032355785369873047, -0.003043651580810547, -0.002851724624633789, -0.0026597976684570312, -0.0024678707122802734, -0.0022759437561035156, -0.002084016799926758, -0.00189208984375, -0.0017001628875732422, -0.0015082359313964844, -0.0013163089752197266, -0.0011243820190429688, -0.0009324550628662109, -0.0007405281066894531, -0.0005486011505126953, -0.0003566741943359375, -0.0001647472381591797, 2.7179718017578125e-05, 0.00021910667419433594, 0.00041103363037109375, 0.0006029605865478516, 0.0007948875427246094, 0.0009868144989013672, 0.001178741455078125, 0.0013706684112548828, 0.0015625953674316406, 0.0017545223236083984, 0.0019464492797851562, 0.002138376235961914, 0.002330303192138672, 0.0025222301483154297, 0.0027141571044921875, 0.0029060840606689453, 0.003098011016845703, 0.003289937973022461, 0.0034818649291992188, 0.0036737918853759766, 0.0038657188415527344, 0.004057645797729492, 0.00424957275390625, 0.004441499710083008, 0.004633426666259766, 0.0048253536224365234, 0.005017280578613281, 0.005209207534790039, 0.005401134490966797, 0.005593061447143555, 0.0057849884033203125, 0.00597691535949707, 0.006168842315673828, 0.006360769271850586, 0.006552696228027344, 0.0067446231842041016, 0.006936550140380859, 0.007128477096557617, 0.007320404052734375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 5.0, 17.0, 17.0, 26.0, 38.0, 68.0, 70.0, 114.0, 208.0, 240.0, 387.0, 595.0, 833.0, 1225.0, 1743.0, 2481.0, 3645.0, 5190.0, 8388.0, 14625.0, 38063.0, 673711.0, 230577.0, 30084.0, 12939.0, 7653.0, 4678.0, 3347.0, 2338.0, 1590.0, 1123.0, 788.0, 576.0, 337.0, 278.0, 177.0, 125.0, 87.0, 51.0, 43.0, 19.0, 13.0, 16.0, 10.0, 4.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.0020465850830078125, -0.001987949013710022, -0.0019293129444122314, -0.001870676875114441, -0.0018120408058166504, -0.0017534047365188599, -0.0016947686672210693, -0.0016361325979232788, -0.0015774965286254883, -0.0015188604593276978, -0.0014602243900299072, -0.0014015883207321167, -0.0013429522514343262, -0.0012843161821365356, -0.0012256801128387451, -0.0011670440435409546, -0.001108407974243164, -0.0010497719049453735, -0.000991135835647583, -0.0009324997663497925, -0.000873863697052002, -0.0008152276277542114, -0.0007565915584564209, -0.0006979554891586304, -0.0006393194198608398, -0.0005806833505630493, -0.0005220472812652588, -0.00046341121196746826, -0.00040477514266967773, -0.0003461390733718872, -0.0002875030040740967, -0.00022886693477630615, -0.00017023086547851562, -0.0001115947961807251, -5.295872688293457e-05, 5.677342414855957e-06, 6.431341171264648e-05, 0.000122949481010437, 0.00018158555030822754, 0.00024022161960601807, 0.0002988576889038086, 0.0003574937582015991, 0.00041612982749938965, 0.0004747658967971802, 0.0005334019660949707, 0.0005920380353927612, 0.0006506741046905518, 0.0007093101739883423, 0.0007679462432861328, 0.0008265823125839233, 0.0008852183818817139, 0.0009438544511795044, 0.001002490520477295, 0.0010611265897750854, 0.001119762659072876, 0.0011783987283706665, 0.001237034797668457, 0.0012956708669662476, 0.001354306936264038, 0.0014129430055618286, 0.0014715790748596191, 0.0015302151441574097, 0.0015888512134552002, 0.0016474872827529907, 0.0017061233520507812]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 0.0, 1.0, 8.0, 7.0, 0.0, 21.0, 23.0, 0.0, 35.0, 60.0, 0.0, 89.0, 125.0, 222.0, 0.0, 138.0, 67.0, 0.0, 49.0, 53.0, 27.0, 0.0, 25.0, 18.0, 0.0, 9.0, 5.0, 0.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2097880244255066e-06, -1.16787850856781e-06, -1.1259689927101135e-06, -1.084059476852417e-06, -1.0421499609947205e-06, -1.000240445137024e-06, -9.583309292793274e-07, -9.164214134216309e-07, -8.745118975639343e-07, -8.326023817062378e-07, -7.906928658485413e-07, -7.487833499908447e-07, -7.068738341331482e-07, -6.649643182754517e-07, -6.230548024177551e-07, -5.811452865600586e-07, -5.392357707023621e-07, -4.973262548446655e-07, -4.55416738986969e-07, -4.1350722312927246e-07, -3.7159770727157593e-07, -3.296881914138794e-07, -2.8777867555618286e-07, -2.4586915969848633e-07, -2.039596438407898e-07, -1.6205012798309326e-07, -1.2014061212539673e-07, -7.82310962677002e-08, -3.632158041000366e-08, 5.587935447692871e-09, 4.7497451305389404e-08, 8.940696716308594e-08, 1.3131648302078247e-07, 1.73225998878479e-07, 2.1513551473617554e-07, 2.5704503059387207e-07, 2.989545464515686e-07, 3.4086406230926514e-07, 3.8277357816696167e-07, 4.246830940246582e-07, 4.6659260988235474e-07, 5.085021257400513e-07, 5.504116415977478e-07, 5.923211574554443e-07, 6.342306733131409e-07, 6.761401891708374e-07, 7.180497050285339e-07, 7.599592208862305e-07, 8.01868736743927e-07, 8.437782526016235e-07, 8.856877684593201e-07, 9.275972843170166e-07, 9.695068001747131e-07, 1.0114163160324097e-06, 1.0533258318901062e-06, 1.0952353477478027e-06, 1.1371448636054993e-06, 1.1790543794631958e-06, 1.2209638953208923e-06, 1.2628734111785889e-06, 1.3047829270362854e-06, 1.346692442893982e-06, 1.3886019587516785e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 7.0, 9.0, 8.0, 18.0, 23.0, 33.0, 54.0, 69.0, 95.0, 154.0, 253.0, 290.0, 476.0, 755.0, 1085.0, 1550.0, 2516.0, 3836.0, 6283.0, 10567.0, 20367.0, 69699.0, 810939.0, 70697.0, 20573.0, 10630.0, 6236.0, 3922.0, 2497.0, 1622.0, 1107.0, 697.0, 425.0, 311.0, 249.0, 165.0, 92.0, 70.0, 50.0, 45.0, 26.0, 20.0, 9.0, 7.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0024433135986328125, -0.002370387315750122, -0.0022974610328674316, -0.002224534749984741, -0.0021516084671020508, -0.0020786821842193604, -0.00200575590133667, -0.0019328296184539795, -0.001859903335571289, -0.0017869770526885986, -0.0017140507698059082, -0.0016411244869232178, -0.0015681982040405273, -0.001495271921157837, -0.0014223456382751465, -0.001349419355392456, -0.0012764930725097656, -0.0012035667896270752, -0.0011306405067443848, -0.0010577142238616943, -0.000984787940979004, -0.0009118616580963135, -0.000838935375213623, -0.0007660090923309326, -0.0006930828094482422, -0.0006201565265655518, -0.0005472302436828613, -0.0004743039608001709, -0.00040137767791748047, -0.00032845139503479004, -0.0002555251121520996, -0.00018259882926940918, -0.00010967254638671875, -3.674626350402832e-05, 3.618001937866211e-05, 0.00010910630226135254, 0.00018203258514404297, 0.0002549588680267334, 0.00032788515090942383, 0.00040081143379211426, 0.0004737377166748047, 0.0005466639995574951, 0.0006195902824401855, 0.000692516565322876, 0.0007654428482055664, 0.0008383691310882568, 0.0009112954139709473, 0.0009842216968536377, 0.0010571479797363281, 0.0011300742626190186, 0.001203000545501709, 0.0012759268283843994, 0.0013488531112670898, 0.0014217793941497803, 0.0014947056770324707, 0.0015676319599151611, 0.0016405582427978516, 0.001713484525680542, 0.0017864108085632324, 0.0018593370914459229, 0.0019322633743286133, 0.0020051896572113037, 0.002078115940093994, 0.0021510422229766846, 0.002223968505859375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 8.0, 8.0, 8.0, 9.0, 18.0, 37.0, 93.0, 257.0, 306.0, 90.0, 30.0, 21.0, 16.0, 9.0, 11.0, 2.0, 4.0, 8.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006771087646484375, -0.0006572306156158447, -0.000637352466583252, -0.0006174743175506592, -0.0005975961685180664, -0.0005777180194854736, -0.0005578398704528809, -0.0005379617214202881, -0.0005180835723876953, -0.0004982054233551025, -0.00047832727432250977, -0.000458449125289917, -0.0004385709762573242, -0.00041869282722473145, -0.00039881467819213867, -0.0003789365291595459, -0.0003590583801269531, -0.00033918023109436035, -0.0003193020820617676, -0.0002994239330291748, -0.00027954578399658203, -0.00025966763496398926, -0.00023978948593139648, -0.0002199113368988037, -0.00020003318786621094, -0.00018015503883361816, -0.0001602768898010254, -0.00014039874076843262, -0.00012052059173583984, -0.00010064244270324707, -8.07642936706543e-05, -6.0886144638061523e-05, -4.100799560546875e-05, -2.1129846572875977e-05, -1.2516975402832031e-06, 1.862645149230957e-05, 3.8504600524902344e-05, 5.838274955749512e-05, 7.826089859008789e-05, 9.813904762268066e-05, 0.00011801719665527344, 0.0001378953456878662, 0.00015777349472045898, 0.00017765164375305176, 0.00019752979278564453, 0.0002174079418182373, 0.00023728609085083008, 0.00025716423988342285, 0.0002770423889160156, 0.0002969205379486084, 0.00031679868698120117, 0.00033667683601379395, 0.0003565549850463867, 0.0003764331340789795, 0.00039631128311157227, 0.00041618943214416504, 0.0004360675811767578, 0.0004559457302093506, 0.00047582387924194336, 0.0004957020282745361, 0.0005155801773071289, 0.0005354583263397217, 0.0005553364753723145, 0.0005752146244049072, 0.0005950927734375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 8.0, 3.0, 5.0, 1.0, 8.0, 16.0, 17.0, 13.0, 29.0, 36.0, 36.0, 46.0, 52.0, 57.0, 86.0, 100.0, 83.0, 81.0, 61.0, 61.0, 36.0, 29.0, 26.0, 15.0, 24.0, 12.0, 13.0, 14.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01078855898231268, -0.010390453971922398, -0.00999234989285469, -0.009594244882464409, -0.009196140803396702, -0.00879803579300642, -0.008399931713938713, -0.008001826703548431, -0.007603722158819437, -0.007205617614090443, -0.006807513069361448, -0.006409408524632454, -0.006011303514242172, -0.005613199435174465, -0.0052150944247841835, -0.004816989880055189, -0.004418885335326195, -0.0040207807905972, -0.003622676245868206, -0.003224571468308568, -0.0028264669235795736, -0.0024283623788505793, -0.0020302576012909412, -0.0016321530565619469, -0.0012340485118329525, -0.0008359439088962972, -0.00043783930595964193, -3.973464481532574e-05, 0.00035836989991366863, 0.000756474444642663, 0.001154579222202301, 0.0015526837669312954, 0.0019507883116602898, 0.002348892856389284, 0.0027469974011182785, 0.0031451021786779165, 0.003543206723406911, 0.003941311500966549, 0.004339416045695543, 0.004737520590424538, 0.005135625135153532, 0.005533729679882526, 0.005931834224611521, 0.006329938769340515, 0.006728043779730797, 0.007126147858798504, 0.0075242528691887856, 0.007922356948256493, 0.008320461958646774, 0.008718566969037056, 0.009116671048104763, 0.009514776058495045, 0.009912880137562752, 0.010310985147953033, 0.010709090158343315, 0.011107194237411022, 0.01150529831647873, 0.011903403326869011, 0.012301507405936718, 0.012699612416327, 0.013097716495394707, 0.013495821505784988, 0.01389392651617527, 0.014292030595242977, 0.014690135605633259]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 6.0, 11.0, 15.0, 17.0, 14.0, 17.0, 18.0, 14.0, 30.0, 32.0, 32.0, 27.0, 25.0, 45.0, 27.0, 35.0, 37.0, 34.0, 42.0, 32.0, 36.0, 44.0, 30.0, 33.0, 45.0, 34.0, 28.0, 36.0, 18.0, 20.0, 26.0, 14.0, 16.0, 16.0, 11.0, 6.0, 12.0, 4.0, 6.0, 6.0, 6.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00871752854436636, -0.008444925770163536, -0.008172322064638138, -0.00789971835911274, -0.007627115584909916, -0.007354512345045805, -0.007081909105181694, -0.006809305865317583, -0.006536702625453472, -0.006264099385589361, -0.00599149614572525, -0.005718892905861139, -0.005446289665997028, -0.005173686426132917, -0.0049010831862688065, -0.0046284799464046955, -0.0043558767065405846, -0.004083273466676474, -0.0038106702268123627, -0.0035380669869482517, -0.0032654637470841408, -0.00299286050722003, -0.002720257267355919, -0.002447654027491808, -0.002175050787627697, -0.001902447547763586, -0.001629844307899475, -0.0013572410680353642, -0.0010846378281712532, -0.0008120345883071423, -0.0005394313484430313, -0.00026682810857892036, 5.775131285190582e-06, 0.00027837837114930153, 0.0005509816110134125, 0.0008235848508775234, 0.0010961880907416344, 0.0013687913306057453, 0.0016413945704698563, 0.0019139978103339672, 0.002186601050198078, 0.002459204290062189, 0.0027318075299263, 0.003004410769790411, 0.003277014009654522, 0.003549617249518633, 0.003822220489382744, 0.004094823729246855, 0.004367426969110966, 0.004640030208975077, 0.004912633448839188, 0.005185236688703299, 0.0054578399285674095, 0.0057304431684315205, 0.006003046408295631, 0.006275649648159742, 0.006548252888023853, 0.006820856127887964, 0.007093459367752075, 0.007366062607616186, 0.007638665847480297, 0.00791126862168312, 0.008183872327208519, 0.008456476032733917, 0.008729078806936741]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 1.0, 6.0, 10.0, 9.0, 18.0, 35.0, 27.0, 44.0, 81.0, 125.0, 198.0, 266.0, 370.0, 517.0, 747.0, 1168.0, 1666.0, 2617.0, 3941.0, 5973.0, 9267.0, 14705.0, 23683.0, 38881.0, 66130.0, 120734.0, 254220.0, 785081.0, 1744858.0, 630325.0, 221102.0, 109650.0, 60845.0, 35824.0, 21632.0, 13605.0, 8835.0, 5767.0, 3750.0, 2461.0, 1641.0, 1150.0, 731.0, 529.0, 362.0, 248.0, 144.0, 114.0, 72.0, 50.0, 34.0, 18.0, 11.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01318359375, -0.01280057430267334, -0.01241755485534668, -0.01203453540802002, -0.01165151596069336, -0.0112684965133667, -0.010885477066040039, -0.010502457618713379, -0.010119438171386719, -0.009736418724060059, -0.009353399276733398, -0.008970379829406738, -0.008587360382080078, -0.008204340934753418, -0.007821321487426758, -0.007438302040100098, -0.0070552825927734375, -0.006672263145446777, -0.006289243698120117, -0.005906224250793457, -0.005523204803466797, -0.005140185356140137, -0.0047571659088134766, -0.004374146461486816, -0.003991127014160156, -0.003608107566833496, -0.003225088119506836, -0.0028420686721801758, -0.0024590492248535156, -0.0020760297775268555, -0.0016930103302001953, -0.0013099908828735352, -0.000926971435546875, -0.0005439519882202148, -0.0001609325408935547, 0.00022208690643310547, 0.0006051063537597656, 0.0009881258010864258, 0.001371145248413086, 0.001754164695739746, 0.0021371841430664062, 0.0025202035903930664, 0.0029032230377197266, 0.0032862424850463867, 0.003669261932373047, 0.004052281379699707, 0.004435300827026367, 0.004818320274353027, 0.0052013397216796875, 0.005584359169006348, 0.005967378616333008, 0.006350398063659668, 0.006733417510986328, 0.007116436958312988, 0.0074994564056396484, 0.007882475852966309, 0.008265495300292969, 0.008648514747619629, 0.009031534194946289, 0.00941455364227295, 0.00979757308959961, 0.01018059253692627, 0.01056361198425293, 0.01094663143157959, 0.01132965087890625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 8.0, 9.0, 9.0, 17.0, 10.0, 15.0, 16.0, 22.0, 24.0, 24.0, 17.0, 27.0, 29.0, 35.0, 33.0, 39.0, 34.0, 38.0, 43.0, 34.0, 44.0, 37.0, 33.0, 48.0, 45.0, 36.0, 34.0, 26.0, 25.0, 23.0, 20.0, 17.0, 23.0, 15.0, 17.0, 10.0, 6.0, 10.0, 5.0, 6.0, 6.0, 6.0, 4.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.005268096923828125, -0.005112767219543457, -0.004957437515258789, -0.004802107810974121, -0.004646778106689453, -0.004491448402404785, -0.004336118698120117, -0.004180788993835449, -0.004025459289550781, -0.0038701295852661133, -0.0037147998809814453, -0.0035594701766967773, -0.0034041404724121094, -0.0032488107681274414, -0.0030934810638427734, -0.0029381513595581055, -0.0027828216552734375, -0.0026274919509887695, -0.0024721622467041016, -0.0023168325424194336, -0.0021615028381347656, -0.0020061731338500977, -0.0018508434295654297, -0.0016955137252807617, -0.0015401840209960938, -0.0013848543167114258, -0.0012295246124267578, -0.0010741949081420898, -0.0009188652038574219, -0.0007635354995727539, -0.0006082057952880859, -0.00045287609100341797, -0.00029754638671875, -0.00014221668243408203, 1.3113021850585938e-05, 0.0001684427261352539, 0.0003237724304199219, 0.00047910213470458984, 0.0006344318389892578, 0.0007897615432739258, 0.0009450912475585938, 0.0011004209518432617, 0.0012557506561279297, 0.0014110803604125977, 0.0015664100646972656, 0.0017217397689819336, 0.0018770694732666016, 0.0020323991775512695, 0.0021877288818359375, 0.0023430585861206055, 0.0024983882904052734, 0.0026537179946899414, 0.0028090476989746094, 0.0029643774032592773, 0.0031197071075439453, 0.0032750368118286133, 0.0034303665161132812, 0.0035856962203979492, 0.003741025924682617, 0.003896355628967285, 0.004051685333251953, 0.004207015037536621, 0.004362344741821289, 0.004517674446105957, 0.004673004150390625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 14.0, 10.0, 18.0, 28.0, 42.0, 54.0, 81.0, 146.0, 222.0, 393.0, 570.0, 820.0, 1437.0, 2353.0, 3786.0, 6063.0, 9959.0, 16423.0, 27837.0, 49017.0, 87622.0, 165948.0, 337297.0, 820615.0, 1457866.0, 619645.0, 273110.0, 137711.0, 73529.0, 41313.0, 23945.0, 13905.0, 8590.0, 5211.0, 3264.0, 2086.0, 1272.0, 813.0, 499.0, 263.0, 188.0, 106.0, 84.0, 39.0, 39.0, 21.0, 16.0, 5.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00928497314453125, -0.00898885726928711, -0.008692741394042969, -0.008396625518798828, -0.008100509643554688, -0.007804393768310547, -0.007508277893066406, -0.007212162017822266, -0.006916046142578125, -0.006619930267333984, -0.006323814392089844, -0.006027698516845703, -0.0057315826416015625, -0.005435466766357422, -0.005139350891113281, -0.004843235015869141, -0.004547119140625, -0.004251003265380859, -0.003954887390136719, -0.003658771514892578, -0.0033626556396484375, -0.003066539764404297, -0.0027704238891601562, -0.0024743080139160156, -0.002178192138671875, -0.0018820762634277344, -0.0015859603881835938, -0.0012898445129394531, -0.0009937286376953125, -0.0006976127624511719, -0.00040149688720703125, -0.00010538101196289062, 0.00019073486328125, 0.0004868507385253906, 0.0007829666137695312, 0.0010790824890136719, 0.0013751983642578125, 0.0016713142395019531, 0.0019674301147460938, 0.0022635459899902344, 0.002559661865234375, 0.0028557777404785156, 0.0031518936157226562, 0.003448009490966797, 0.0037441253662109375, 0.004040241241455078, 0.004336357116699219, 0.004632472991943359, 0.0049285888671875, 0.005224704742431641, 0.005520820617675781, 0.005816936492919922, 0.0061130523681640625, 0.006409168243408203, 0.006705284118652344, 0.007001399993896484, 0.007297515869140625, 0.007593631744384766, 0.007889747619628906, 0.008185863494873047, 0.008481979370117188, 0.008778095245361328, 0.009074211120605469, 0.00937032699584961, 0.00966644287109375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 7.0, 11.0, 14.0, 20.0, 27.0, 31.0, 29.0, 35.0, 37.0, 49.0, 69.0, 82.0, 89.0, 118.0, 131.0, 160.0, 162.0, 157.0, 199.0, 238.0, 287.0, 311.0, 258.0, 234.0, 198.0, 188.0, 139.0, 128.0, 117.0, 112.0, 87.0, 73.0, 48.0, 42.0, 46.0, 31.0, 25.0, 19.0, 11.0, 18.0, 13.0, 5.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028018951416015625, -0.0027147531509399414, -0.0026276111602783203, -0.0025404691696166992, -0.002453327178955078, -0.002366185188293457, -0.002279043197631836, -0.002191901206970215, -0.0021047592163085938, -0.0020176172256469727, -0.0019304752349853516, -0.0018433332443237305, -0.0017561912536621094, -0.0016690492630004883, -0.0015819072723388672, -0.001494765281677246, -0.001407623291015625, -0.001320481300354004, -0.0012333393096923828, -0.0011461973190307617, -0.0010590553283691406, -0.0009719133377075195, -0.0008847713470458984, -0.0007976293563842773, -0.0007104873657226562, -0.0006233453750610352, -0.0005362033843994141, -0.00044906139373779297, -0.0003619194030761719, -0.0002747774124145508, -0.0001876354217529297, -0.0001004934310913086, -1.33514404296875e-05, 7.37905502319336e-05, 0.0001609325408935547, 0.0002480745315551758, 0.0003352165222167969, 0.00042235851287841797, 0.0005095005035400391, 0.0005966424942016602, 0.0006837844848632812, 0.0007709264755249023, 0.0008580684661865234, 0.0009452104568481445, 0.0010323524475097656, 0.0011194944381713867, 0.0012066364288330078, 0.001293778419494629, 0.00138092041015625, 0.001468062400817871, 0.0015552043914794922, 0.0016423463821411133, 0.0017294883728027344, 0.0018166303634643555, 0.0019037723541259766, 0.0019909143447875977, 0.0020780563354492188, 0.00216519832611084, 0.002252340316772461, 0.002339482307434082, 0.002426624298095703, 0.0025137662887573242, 0.0026009082794189453, 0.0026880502700805664, 0.0027751922607421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 5.0, 13.0, 24.0, 25.0, 24.0, 49.0, 44.0, 59.0, 83.0, 82.0, 88.0, 104.0, 85.0, 68.0, 46.0, 34.0, 23.0, 33.0, 22.0, 14.0, 16.0, 7.0, 9.0, 8.0, 5.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007800758816301823, -0.007521199062466621, -0.00724163930863142, -0.006962079554796219, -0.006682519800961018, -0.006402960047125816, -0.006123400758951902, -0.005843841005116701, -0.0055642812512815, -0.005284721497446299, -0.005005161743611097, -0.004725601989775896, -0.004446042701601982, -0.004166482947766781, -0.0038869231939315796, -0.0036073634400963783, -0.003327803686261177, -0.003048243932425976, -0.0027686841785907745, -0.002489124657586217, -0.0022095649037510157, -0.0019300051499158144, -0.001650445512495935, -0.0013708858750760555, -0.0010913261212408543, -0.0008117664256133139, -0.0005322067299857736, -0.0002526470343582332, 2.6912661269307137e-05, 0.0003064724151045084, 0.0005860320525243878, 0.0008655916899442673, 0.0011451514437794685, 0.0014247111976146698, 0.0017042708350345492, 0.0019838304724544287, 0.00226339022628963, 0.002542949980124831, 0.002822509501129389, 0.00310206925496459, 0.0033816290087997913, 0.0036611887626349926, 0.003940748516470194, 0.004220308270305395, 0.004499867558479309, 0.00477942731231451, 0.005058987066149712, 0.005338546819984913, 0.005618106573820114, 0.005897666327655315, 0.006177226081490517, 0.006456785835325718, 0.006736345589160919, 0.0070159053429961205, 0.007295464631170034, 0.007575024385005236, 0.007854584604501724, 0.008134144358336926, 0.008413704112172127, 0.008693263866007328, 0.00897282361984253, 0.00925238337367773, 0.009531943127512932, 0.009811501950025558, 0.01009106170386076]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 2.0, 13.0, 20.0, 17.0, 15.0, 22.0, 24.0, 19.0, 32.0, 34.0, 39.0, 39.0, 58.0, 48.0, 39.0, 44.0, 39.0, 46.0, 47.0, 46.0, 34.0, 38.0, 37.0, 39.0, 37.0, 17.0, 22.0, 18.0, 22.0, 21.0, 10.0, 8.0, 6.0, 10.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.006916028913110495, -0.006715869065374136, -0.00651570875197649, -0.006315548904240131, -0.006115389056503773, -0.005915229208767414, -0.005715068895369768, -0.0055149090476334095, -0.0053147487342357635, -0.005114588886499405, -0.004914428573101759, -0.0047142687253654, -0.004514108877629042, -0.004313948564231396, -0.004113788716495037, -0.0039136288687586784, -0.00371346902102232, -0.0035133089404553175, -0.003313149092718959, -0.0031129890121519566, -0.002912829164415598, -0.0027126690838485956, -0.0025125090032815933, -0.0023123491555452347, -0.0021121890749782324, -0.001912029110826552, -0.0017118691466748714, -0.0015117090661078691, -0.0013115491019561887, -0.0011113891378045082, -0.0009112290572375059, -0.0007110690930858254, -0.0005109095945954323, -0.00031074960133992136, -0.00011058960808441043, 8.957041427493095e-05, 0.0002897303784266114, 0.0004898903425782919, 0.0006900504231452942, 0.0008902103872969747, 0.0010903703514486551, 0.0012905303156003356, 0.001490690279752016, 0.0016908503603190184, 0.0018910103244706988, 0.0020911702886223793, 0.0022913303691893816, 0.002491490449756384, 0.0026916502974927425, 0.002891810378059745, 0.0030919702257961035, 0.0032921303063631058, 0.0034922901540994644, 0.0036924502346664667, 0.003892610315233469, 0.004092770162969828, 0.004292930476367474, 0.004493090324103832, 0.004693250637501478, 0.004893410485237837, 0.0050935703329741955, 0.005293730646371841, 0.0054938904941082, 0.005694050341844559, 0.005894210189580917]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 12.0, 11.0, 20.0, 18.0, 35.0, 43.0, 78.0, 92.0, 145.0, 241.0, 353.0, 507.0, 762.0, 1092.0, 1781.0, 2733.0, 4290.0, 7012.0, 11877.0, 20090.0, 36440.0, 71485.0, 160057.0, 369713.0, 183969.0, 80021.0, 40366.0, 22126.0, 12467.0, 7501.0, 4698.0, 3012.0, 1838.0, 1207.0, 796.0, 566.0, 370.0, 232.0, 165.0, 100.0, 78.0, 42.0, 34.0, 20.0, 24.0, 14.0, 9.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.0064239501953125, -0.006232619285583496, -0.006041288375854492, -0.005849957466125488, -0.005658626556396484, -0.0054672956466674805, -0.0052759647369384766, -0.005084633827209473, -0.004893302917480469, -0.004701972007751465, -0.004510641098022461, -0.004319310188293457, -0.004127979278564453, -0.003936648368835449, -0.0037453174591064453, -0.0035539865493774414, -0.0033626556396484375, -0.0031713247299194336, -0.0029799938201904297, -0.0027886629104614258, -0.002597332000732422, -0.002406001091003418, -0.002214670181274414, -0.00202333927154541, -0.0018320083618164062, -0.0016406774520874023, -0.0014493465423583984, -0.0012580156326293945, -0.0010666847229003906, -0.0008753538131713867, -0.0006840229034423828, -0.0004926919937133789, -0.000301361083984375, -0.0001100301742553711, 8.130073547363281e-05, 0.0002726316452026367, 0.0004639625549316406, 0.0006552934646606445, 0.0008466243743896484, 0.0010379552841186523, 0.0012292861938476562, 0.0014206171035766602, 0.001611948013305664, 0.001803278923034668, 0.001994609832763672, 0.0021859407424926758, 0.0023772716522216797, 0.0025686025619506836, 0.0027599334716796875, 0.0029512643814086914, 0.0031425952911376953, 0.0033339262008666992, 0.003525257110595703, 0.003716588020324707, 0.003907918930053711, 0.004099249839782715, 0.004290580749511719, 0.004481911659240723, 0.0046732425689697266, 0.0048645734786987305, 0.005055904388427734, 0.005247235298156738, 0.005438566207885742, 0.005629897117614746, 0.00582122802734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 4.0, 6.0, 5.0, 11.0, 18.0, 18.0, 17.0, 20.0, 23.0, 32.0, 30.0, 45.0, 51.0, 49.0, 39.0, 44.0, 42.0, 39.0, 50.0, 49.0, 42.0, 44.0, 40.0, 41.0, 44.0, 24.0, 24.0, 21.0, 23.0, 19.0, 20.0, 16.0, 10.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00696563720703125, -0.006754755973815918, -0.006543874740600586, -0.006332993507385254, -0.006122112274169922, -0.00591123104095459, -0.005700349807739258, -0.005489468574523926, -0.005278587341308594, -0.005067706108093262, -0.00485682487487793, -0.004645943641662598, -0.004435062408447266, -0.004224181175231934, -0.0040132999420166016, -0.0038024187088012695, -0.0035915374755859375, -0.0033806562423706055, -0.0031697750091552734, -0.0029588937759399414, -0.0027480125427246094, -0.0025371313095092773, -0.0023262500762939453, -0.0021153688430786133, -0.0019044876098632812, -0.0016936063766479492, -0.0014827251434326172, -0.0012718439102172852, -0.0010609626770019531, -0.0008500814437866211, -0.0006392002105712891, -0.00042831897735595703, -0.000217437744140625, -6.556510925292969e-06, 0.00020432472229003906, 0.0004152059555053711, 0.0006260871887207031, 0.0008369684219360352, 0.0010478496551513672, 0.0012587308883666992, 0.0014696121215820312, 0.0016804933547973633, 0.0018913745880126953, 0.0021022558212280273, 0.0023131370544433594, 0.0025240182876586914, 0.0027348995208740234, 0.0029457807540893555, 0.0031566619873046875, 0.0033675432205200195, 0.0035784244537353516, 0.0037893056869506836, 0.004000186920166016, 0.004211068153381348, 0.00442194938659668, 0.004632830619812012, 0.004843711853027344, 0.005054593086242676, 0.005265474319458008, 0.00547635555267334, 0.005687236785888672, 0.005898118019104004, 0.006108999252319336, 0.006319880485534668, 0.00653076171875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 9.0, 9.0, 24.0, 33.0, 39.0, 49.0, 79.0, 112.0, 158.0, 185.0, 339.0, 466.0, 634.0, 981.0, 1414.0, 2120.0, 3319.0, 5549.0, 9746.0, 19692.0, 51643.0, 467072.0, 392183.0, 48703.0, 19472.0, 9648.0, 5369.0, 3131.0, 1987.0, 1348.0, 935.0, 621.0, 445.0, 299.0, 210.0, 158.0, 114.0, 79.0, 46.0, 38.0, 26.0, 13.0, 19.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.01119232177734375, -0.010852932929992676, -0.010513544082641602, -0.010174155235290527, -0.009834766387939453, -0.009495377540588379, -0.009155988693237305, -0.00881659984588623, -0.008477210998535156, -0.008137822151184082, -0.007798433303833008, -0.007459044456481934, -0.007119655609130859, -0.006780266761779785, -0.006440877914428711, -0.006101489067077637, -0.0057621002197265625, -0.005422711372375488, -0.005083322525024414, -0.00474393367767334, -0.004404544830322266, -0.004065155982971191, -0.003725767135620117, -0.003386378288269043, -0.0030469894409179688, -0.0027076005935668945, -0.0023682117462158203, -0.002028822898864746, -0.0016894340515136719, -0.0013500452041625977, -0.0010106563568115234, -0.0006712675094604492, -0.000331878662109375, 7.510185241699219e-06, 0.00034689903259277344, 0.0006862878799438477, 0.0010256767272949219, 0.001365065574645996, 0.0017044544219970703, 0.0020438432693481445, 0.0023832321166992188, 0.002722620964050293, 0.003062009811401367, 0.0034013986587524414, 0.0037407875061035156, 0.00408017635345459, 0.004419565200805664, 0.004758954048156738, 0.0050983428955078125, 0.005437731742858887, 0.005777120590209961, 0.006116509437561035, 0.006455898284912109, 0.006795287132263184, 0.007134675979614258, 0.007474064826965332, 0.007813453674316406, 0.00815284252166748, 0.008492231369018555, 0.008831620216369629, 0.009171009063720703, 0.009510397911071777, 0.009849786758422852, 0.010189175605773926, 0.010528564453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 2.0, 13.0, 10.0, 12.0, 12.0, 8.0, 11.0, 15.0, 30.0, 22.0, 30.0, 31.0, 28.0, 39.0, 33.0, 33.0, 40.0, 34.0, 42.0, 40.0, 37.0, 34.0, 40.0, 39.0, 29.0, 35.0, 35.0, 34.0, 32.0, 23.0, 28.0, 22.0, 18.0, 13.0, 18.0, 13.0, 12.0, 8.0, 9.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.003879547119140625, -0.0037613511085510254, -0.0036431550979614258, -0.003524959087371826, -0.0034067630767822266, -0.003288567066192627, -0.0031703710556030273, -0.0030521750450134277, -0.002933979034423828, -0.0028157830238342285, -0.002697587013244629, -0.0025793910026550293, -0.0024611949920654297, -0.00234299898147583, -0.0022248029708862305, -0.002106606960296631, -0.0019884109497070312, -0.0018702149391174316, -0.001752018928527832, -0.0016338229179382324, -0.0015156269073486328, -0.0013974308967590332, -0.0012792348861694336, -0.001161038875579834, -0.0010428428649902344, -0.0009246468544006348, -0.0008064508438110352, -0.0006882548332214355, -0.0005700588226318359, -0.00045186281204223633, -0.0003336668014526367, -0.0002154707908630371, -9.72747802734375e-05, 2.092123031616211e-05, 0.00013911724090576172, 0.00025731325149536133, 0.00037550926208496094, 0.0004937052726745605, 0.0006119012832641602, 0.0007300972938537598, 0.0008482933044433594, 0.000966489315032959, 0.0010846853256225586, 0.0012028813362121582, 0.0013210773468017578, 0.0014392733573913574, 0.001557469367980957, 0.0016756653785705566, 0.0017938613891601562, 0.0019120573997497559, 0.0020302534103393555, 0.002148449420928955, 0.0022666454315185547, 0.0023848414421081543, 0.002503037452697754, 0.0026212334632873535, 0.002739429473876953, 0.0028576254844665527, 0.0029758214950561523, 0.003094017505645752, 0.0032122135162353516, 0.003330409526824951, 0.0034486055374145508, 0.0035668015480041504, 0.00368499755859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 9.0, 12.0, 12.0, 21.0, 19.0, 25.0, 32.0, 47.0, 75.0, 95.0, 79.0, 162.0, 251.0, 264.0, 441.0, 659.0, 1042.0, 1688.0, 3027.0, 5825.0, 13849.0, 51580.0, 792293.0, 136107.0, 22622.0, 8167.0, 4078.0, 2211.0, 1296.0, 816.0, 475.0, 335.0, 247.0, 152.0, 134.0, 98.0, 70.0, 57.0, 43.0, 46.0, 29.0, 13.0, 11.0, 14.0, 9.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0012445449829101562, -0.0012040287256240845, -0.0011635124683380127, -0.001122996211051941, -0.0010824799537658691, -0.0010419636964797974, -0.0010014474391937256, -0.0009609311819076538, -0.000920414924621582, -0.0008798986673355103, -0.0008393824100494385, -0.0007988661527633667, -0.0007583498954772949, -0.0007178336381912231, -0.0006773173809051514, -0.0006368011236190796, -0.0005962848663330078, -0.000555768609046936, -0.0005152523517608643, -0.0004747360944747925, -0.0004342198371887207, -0.0003937035799026489, -0.00035318732261657715, -0.00031267106533050537, -0.0002721548080444336, -0.00023163855075836182, -0.00019112229347229004, -0.00015060603618621826, -0.00011008977890014648, -6.957352161407471e-05, -2.905726432800293e-05, 1.1458992958068848e-05, 5.1975250244140625e-05, 9.24915075302124e-05, 0.00013300776481628418, 0.00017352402210235596, 0.00021404027938842773, 0.0002545565366744995, 0.0002950727939605713, 0.00033558905124664307, 0.00037610530853271484, 0.0004166215658187866, 0.0004571378231048584, 0.0004976540803909302, 0.000538170337677002, 0.0005786865949630737, 0.0006192028522491455, 0.0006597191095352173, 0.0007002353668212891, 0.0007407516241073608, 0.0007812678813934326, 0.0008217841386795044, 0.0008623003959655762, 0.000902816653251648, 0.0009433329105377197, 0.0009838491678237915, 0.0010243654251098633, 0.001064881682395935, 0.0011053979396820068, 0.0011459141969680786, 0.0011864304542541504, 0.0012269467115402222, 0.001267462968826294, 0.0013079792261123657, 0.0013484954833984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 4.0, 16.0, 7.0, 14.0, 11.0, 19.0, 25.0, 19.0, 36.0, 33.0, 76.0, 59.0, 46.0, 53.0, 60.0, 58.0, 46.0, 71.0, 52.0, 44.0, 37.0, 32.0, 30.0, 17.0, 26.0, 20.0, 18.0, 14.0, 7.0, 10.0, 8.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6065314412117004e-06, -1.5441328287124634e-06, -1.4817342162132263e-06, -1.4193356037139893e-06, -1.3569369912147522e-06, -1.2945383787155151e-06, -1.232139766216278e-06, -1.169741153717041e-06, -1.107342541217804e-06, -1.044943928718567e-06, -9.825453162193298e-07, -9.201467037200928e-07, -8.577480912208557e-07, -7.953494787216187e-07, -7.329508662223816e-07, -6.705522537231445e-07, -6.081536412239075e-07, -5.457550287246704e-07, -4.833564162254333e-07, -4.209578037261963e-07, -3.5855919122695923e-07, -2.9616057872772217e-07, -2.337619662284851e-07, -1.7136335372924805e-07, -1.0896474123001099e-07, -4.6566128730773926e-08, 1.5832483768463135e-08, 7.82310962677002e-08, 1.4062970876693726e-07, 2.0302832126617432e-07, 2.654269337654114e-07, 3.2782554626464844e-07, 3.902241587638855e-07, 4.5262277126312256e-07, 5.150213837623596e-07, 5.774199962615967e-07, 6.398186087608337e-07, 7.022172212600708e-07, 7.646158337593079e-07, 8.270144462585449e-07, 8.89413058757782e-07, 9.51811671257019e-07, 1.014210283756256e-06, 1.0766088962554932e-06, 1.1390075087547302e-06, 1.2014061212539673e-06, 1.2638047337532043e-06, 1.3262033462524414e-06, 1.3886019587516785e-06, 1.4510005712509155e-06, 1.5133991837501526e-06, 1.5757977962493896e-06, 1.6381964087486267e-06, 1.7005950212478638e-06, 1.7629936337471008e-06, 1.8253922462463379e-06, 1.887790858745575e-06, 1.950189471244812e-06, 2.012588083744049e-06, 2.074986696243286e-06, 2.137385308742523e-06, 2.1997839212417603e-06, 2.2621825337409973e-06, 2.3245811462402344e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 11.0, 13.0, 11.0, 12.0, 26.0, 27.0, 34.0, 59.0, 83.0, 101.0, 122.0, 175.0, 284.0, 348.0, 443.0, 654.0, 915.0, 1245.0, 1828.0, 2619.0, 3898.0, 6246.0, 9838.0, 16631.0, 31439.0, 72071.0, 266181.0, 448170.0, 94198.0, 38785.0, 19503.0, 11112.0, 6951.0, 4433.0, 2968.0, 2010.0, 1415.0, 969.0, 738.0, 496.0, 412.0, 292.0, 215.0, 175.0, 109.0, 85.0, 57.0, 46.0, 31.0, 32.0, 17.0, 10.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0009622573852539062, -0.0009313523769378662, -0.0009004473686218262, -0.0008695423603057861, -0.0008386373519897461, -0.0008077323436737061, -0.000776827335357666, -0.000745922327041626, -0.0007150173187255859, -0.0006841123104095459, -0.0006532073020935059, -0.0006223022937774658, -0.0005913972854614258, -0.0005604922771453857, -0.0005295872688293457, -0.0004986822605133057, -0.0004677772521972656, -0.0004368722438812256, -0.00040596723556518555, -0.0003750622272491455, -0.00034415721893310547, -0.00031325221061706543, -0.0002823472023010254, -0.00025144219398498535, -0.0002205371856689453, -0.00018963217735290527, -0.00015872716903686523, -0.0001278221607208252, -9.691715240478516e-05, -6.601214408874512e-05, -3.510713577270508e-05, -4.202127456665039e-06, 2.6702880859375e-05, 5.760788917541504e-05, 8.851289749145508e-05, 0.00011941790580749512, 0.00015032291412353516, 0.0001812279224395752, 0.00021213293075561523, 0.00024303793907165527, 0.0002739429473876953, 0.00030484795570373535, 0.0003357529640197754, 0.00036665797233581543, 0.00039756298065185547, 0.0004284679889678955, 0.00045937299728393555, 0.0004902780055999756, 0.0005211830139160156, 0.0005520880222320557, 0.0005829930305480957, 0.0006138980388641357, 0.0006448030471801758, 0.0006757080554962158, 0.0007066130638122559, 0.0007375180721282959, 0.0007684230804443359, 0.000799328088760376, 0.000830233097076416, 0.0008611381053924561, 0.0008920431137084961, 0.0009229481220245361, 0.0009538531303405762, 0.0009847581386566162, 0.0010156631469726562]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 11.0, 17.0, 22.0, 17.0, 36.0, 40.0, 55.0, 71.0, 212.0, 188.0, 74.0, 64.0, 40.0, 35.0, 20.0, 16.0, 16.0, 11.0, 13.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0005512237548828125, -0.0005344897508621216, -0.0005177557468414307, -0.0005010217428207397, -0.00048428773880004883, -0.0004675537347793579, -0.000450819730758667, -0.0004340857267379761, -0.00041735172271728516, -0.00040061771869659424, -0.0003838837146759033, -0.0003671497106552124, -0.0003504157066345215, -0.00033368170261383057, -0.00031694769859313965, -0.00030021369457244873, -0.0002834796905517578, -0.0002667456865310669, -0.000250011682510376, -0.00023327767848968506, -0.00021654367446899414, -0.00019980967044830322, -0.0001830756664276123, -0.0001663416624069214, -0.00014960765838623047, -0.00013287365436553955, -0.00011613965034484863, -9.940564632415771e-05, -8.26716423034668e-05, -6.593763828277588e-05, -4.920363426208496e-05, -3.246963024139404e-05, -1.5735626220703125e-05, 9.98377799987793e-07, 1.773238182067871e-05, 3.446638584136963e-05, 5.120038986206055e-05, 6.793439388275146e-05, 8.466839790344238e-05, 0.0001014024019241333, 0.00011813640594482422, 0.00013487040996551514, 0.00015160441398620605, 0.00016833841800689697, 0.0001850724220275879, 0.0002018064260482788, 0.00021854043006896973, 0.00023527443408966064, 0.00025200843811035156, 0.0002687424421310425, 0.0002854764461517334, 0.0003022104501724243, 0.00031894445419311523, 0.00033567845821380615, 0.00035241246223449707, 0.000369146466255188, 0.0003858804702758789, 0.0004026144742965698, 0.00041934847831726074, 0.00043608248233795166, 0.0004528164863586426, 0.0004695504903793335, 0.0004862844944000244, 0.0005030184984207153, 0.0005197525024414062]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 9.0, 16.0, 21.0, 18.0, 42.0, 39.0, 53.0, 51.0, 70.0, 88.0, 115.0, 92.0, 96.0, 49.0, 43.0, 47.0, 36.0, 16.0, 24.0, 17.0, 10.0, 5.0, 9.0, 3.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008176167495548725, -0.00789280142635107, -0.00760943628847599, -0.007326070219278336, -0.007042704615741968, -0.006759339012205601, -0.006475972943007946, -0.006192607339471579, -0.005909241735935211, -0.005625876132398844, -0.005342510528862476, -0.005059144459664822, -0.004775778856128454, -0.004492413252592087, -0.004209047183394432, -0.003925681579858065, -0.0036423159763216972, -0.00335895037278533, -0.0030755845364183187, -0.0027922187000513077, -0.0025088530965149403, -0.002225487492978573, -0.0019421216566115618, -0.0016587558202445507, -0.0013753902167081833, -0.001092024496756494, -0.0008086587768048048, -0.0005252930568531156, -0.00024192733690142632, 4.143838305026293e-05, 0.00032480410300195217, 0.0006081699393689632, 0.0008915364742279053, 0.0011749021941795945, 0.0014582679141312838, 0.001741633634082973, 0.0020249993540346622, 0.0023083649575710297, 0.0025917307939380407, 0.002875096630305052, 0.0031584622338414192, 0.0034418278373777866, 0.0037251936737447977, 0.004008559510111809, 0.004291925113648176, 0.004575290717184544, 0.004858656786382198, 0.005142022389918566, 0.005425387993454933, 0.005708753596991301, 0.005992119200527668, 0.006275485269725323, 0.00655885087326169, 0.0068422164767980576, 0.007125582545995712, 0.00740894814953208, 0.007692313753068447, 0.007975679822266102, 0.008259044960141182, 0.008542411029338837, 0.008825777098536491, 0.009109142236411572, 0.009392508305609226, 0.009675873443484306, 0.009959239512681961]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 3.0, 3.0, 16.0, 21.0, 14.0, 15.0, 22.0, 29.0, 18.0, 29.0, 34.0, 42.0, 36.0, 54.0, 50.0, 34.0, 47.0, 39.0, 46.0, 46.0, 49.0, 32.0, 35.0, 39.0, 37.0, 34.0, 22.0, 22.0, 17.0, 21.0, 17.0, 15.0, 8.0, 8.0, 10.0, 2.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0067710233852267265, -0.0065748724155128, -0.006378721445798874, -0.00618257001042366, -0.005986419040709734, -0.005790268070995808, -0.005594117101281881, -0.005397966131567955, -0.005201814696192741, -0.005005663726478815, -0.004809512756764889, -0.004613361321389675, -0.004417210351675749, -0.0042210593819618225, -0.004024908412247896, -0.00382875744253397, -0.0036326064728200436, -0.0034364555031061172, -0.0032403043005615473, -0.003044153330847621, -0.002848002128303051, -0.0026518511585891247, -0.0024557001888751984, -0.002259549219161272, -0.002063398016616702, -0.001867246930487454, -0.0016710958443582058, -0.0014749448746442795, -0.0012787937885150313, -0.0010826427023857832, -0.0008864917326718569, -0.0006903406465426087, -0.0004941900260746479, -0.0002980389690492302, -0.00010188791202381253, 9.42631158977747e-05, 0.00029041420202702284, 0.000486565288156271, 0.0006827162578701973, 0.0008788673439994454, 0.0010750184301286936, 0.0012711695162579417, 0.0014673206023871899, 0.0016634715721011162, 0.0018596226582303643, 0.0020557737443596125, 0.0022519247140735388, 0.0024480759166181087, 0.002644226886332035, 0.0028403778560459614, 0.0030365290585905313, 0.0032326800283044577, 0.0034288312308490276, 0.003624982200562954, 0.0038211331702768803, 0.004017284139990807, 0.00421343557536602, 0.0044095865450799465, 0.004605737514793873, 0.0048018889501690865, 0.004998039919883013, 0.005194190889596939, 0.005390341859310865, 0.005586492829024792, 0.005782643798738718]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 17.0, 29.0, 30.0, 63.0, 83.0, 110.0, 181.0, 230.0, 317.0, 484.0, 686.0, 1009.0, 1512.0, 2203.0, 3277.0, 4904.0, 7056.0, 10848.0, 16508.0, 25501.0, 41302.0, 68425.0, 121142.0, 225003.0, 219367.0, 117272.0, 67054.0, 40197.0, 25202.0, 16090.0, 10632.0, 7084.0, 4698.0, 3172.0, 2188.0, 1462.0, 988.0, 711.0, 488.0, 329.0, 214.0, 145.0, 103.0, 66.0, 53.0, 39.0, 23.0, 19.0, 11.0, 11.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0101470947265625, -0.00982975959777832, -0.00951242446899414, -0.009195089340209961, -0.008877754211425781, -0.008560419082641602, -0.008243083953857422, -0.007925748825073242, -0.0076084136962890625, -0.007291078567504883, -0.006973743438720703, -0.0066564083099365234, -0.006339073181152344, -0.006021738052368164, -0.005704402923583984, -0.005387067794799805, -0.005069732666015625, -0.004752397537231445, -0.004435062408447266, -0.004117727279663086, -0.0038003921508789062, -0.0034830570220947266, -0.003165721893310547, -0.002848386764526367, -0.0025310516357421875, -0.002213716506958008, -0.0018963813781738281, -0.0015790462493896484, -0.0012617111206054688, -0.0009443759918212891, -0.0006270408630371094, -0.0003097057342529297, 7.62939453125e-06, 0.0003249645233154297, 0.0006422996520996094, 0.0009596347808837891, 0.0012769699096679688, 0.0015943050384521484, 0.0019116401672363281, 0.002228975296020508, 0.0025463104248046875, 0.002863645553588867, 0.003180980682373047, 0.0034983158111572266, 0.0038156509399414062, 0.004132986068725586, 0.004450321197509766, 0.004767656326293945, 0.005084991455078125, 0.005402326583862305, 0.005719661712646484, 0.006036996841430664, 0.006354331970214844, 0.0066716670989990234, 0.006989002227783203, 0.007306337356567383, 0.0076236724853515625, 0.007941007614135742, 0.008258342742919922, 0.008575677871704102, 0.008893013000488281, 0.009210348129272461, 0.00952768325805664, 0.00984501838684082, 0.010162353515625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 4.0, 11.0, 17.0, 11.0, 13.0, 23.0, 19.0, 30.0, 28.0, 30.0, 28.0, 32.0, 44.0, 44.0, 39.0, 46.0, 43.0, 42.0, 32.0, 52.0, 42.0, 37.0, 33.0, 35.0, 32.0, 32.0, 26.0, 26.0, 17.0, 19.0, 26.0, 11.0, 12.0, 10.0, 12.0, 3.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004833221435546875, -0.004675149917602539, -0.004517078399658203, -0.004359006881713867, -0.004200935363769531, -0.004042863845825195, -0.0038847923278808594, -0.0037267208099365234, -0.0035686492919921875, -0.0034105777740478516, -0.0032525062561035156, -0.0030944347381591797, -0.0029363632202148438, -0.002778291702270508, -0.002620220184326172, -0.002462148666381836, -0.0023040771484375, -0.002146005630493164, -0.001987934112548828, -0.0018298625946044922, -0.0016717910766601562, -0.0015137195587158203, -0.0013556480407714844, -0.0011975765228271484, -0.0010395050048828125, -0.0008814334869384766, -0.0007233619689941406, -0.0005652904510498047, -0.00040721893310546875, -0.0002491474151611328, -9.107589721679688e-05, 6.699562072753906e-05, 0.000225067138671875, 0.00038313865661621094, 0.0005412101745605469, 0.0006992816925048828, 0.0008573532104492188, 0.0010154247283935547, 0.0011734962463378906, 0.0013315677642822266, 0.0014896392822265625, 0.0016477108001708984, 0.0018057823181152344, 0.0019638538360595703, 0.0021219253540039062, 0.002279996871948242, 0.002438068389892578, 0.002596139907836914, 0.00275421142578125, 0.002912282943725586, 0.003070354461669922, 0.003228425979614258, 0.0033864974975585938, 0.0035445690155029297, 0.0037026405334472656, 0.0038607120513916016, 0.0040187835693359375, 0.0041768550872802734, 0.004334926605224609, 0.004492998123168945, 0.004651069641113281, 0.004809141159057617, 0.004967212677001953, 0.005125284194946289, 0.005283355712890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 16.0, 18.0, 25.0, 41.0, 57.0, 84.0, 129.0, 148.0, 260.0, 368.0, 532.0, 768.0, 1093.0, 1653.0, 2407.0, 3531.0, 5091.0, 7847.0, 11900.0, 18042.0, 28503.0, 44586.0, 73320.0, 125196.0, 222056.0, 202869.0, 113317.0, 67101.0, 41307.0, 26287.0, 16689.0, 10979.0, 7136.0, 4786.0, 3237.0, 2300.0, 1517.0, 1040.0, 751.0, 474.0, 354.0, 242.0, 166.0, 118.0, 69.0, 60.0, 27.0, 14.0, 17.0, 8.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0095672607421875, -0.009267449378967285, -0.00896763801574707, -0.008667826652526855, -0.00836801528930664, -0.008068203926086426, -0.007768392562866211, -0.007468581199645996, -0.007168769836425781, -0.006868958473205566, -0.0065691471099853516, -0.006269335746765137, -0.005969524383544922, -0.005669713020324707, -0.005369901657104492, -0.005070090293884277, -0.0047702789306640625, -0.004470467567443848, -0.004170656204223633, -0.003870844841003418, -0.003571033477783203, -0.0032712221145629883, -0.0029714107513427734, -0.0026715993881225586, -0.0023717880249023438, -0.002071976661682129, -0.001772165298461914, -0.0014723539352416992, -0.0011725425720214844, -0.0008727312088012695, -0.0005729198455810547, -0.00027310848236083984, 2.6702880859375e-05, 0.00032651424407958984, 0.0006263256072998047, 0.0009261369705200195, 0.0012259483337402344, 0.0015257596969604492, 0.001825571060180664, 0.002125382423400879, 0.0024251937866210938, 0.0027250051498413086, 0.0030248165130615234, 0.0033246278762817383, 0.003624439239501953, 0.003924250602722168, 0.004224061965942383, 0.004523873329162598, 0.0048236846923828125, 0.005123496055603027, 0.005423307418823242, 0.005723118782043457, 0.006022930145263672, 0.006322741508483887, 0.0066225528717041016, 0.006922364234924316, 0.007222175598144531, 0.007521986961364746, 0.007821798324584961, 0.008121609687805176, 0.00842142105102539, 0.008721232414245605, 0.00902104377746582, 0.009320855140686035, 0.00962066650390625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 12.0, 14.0, 15.0, 23.0, 16.0, 30.0, 28.0, 28.0, 32.0, 36.0, 31.0, 37.0, 45.0, 38.0, 43.0, 40.0, 44.0, 52.0, 34.0, 37.0, 36.0, 40.0, 26.0, 22.0, 28.0, 21.0, 26.0, 17.0, 21.0, 16.0, 14.0, 11.0, 10.0, 14.0, 8.0, 6.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034656524658203125, -0.0033653974533081055, -0.0032651424407958984, -0.0031648874282836914, -0.0030646324157714844, -0.0029643774032592773, -0.0028641223907470703, -0.0027638673782348633, -0.0026636123657226562, -0.0025633573532104492, -0.002463102340698242, -0.002362847328186035, -0.002262592315673828, -0.002162337303161621, -0.002062082290649414, -0.001961827278137207, -0.001861572265625, -0.001761317253112793, -0.001661062240600586, -0.001560807228088379, -0.0014605522155761719, -0.0013602972030639648, -0.0012600421905517578, -0.0011597871780395508, -0.0010595321655273438, -0.0009592771530151367, -0.0008590221405029297, -0.0007587671279907227, -0.0006585121154785156, -0.0005582571029663086, -0.00045800209045410156, -0.00035774707794189453, -0.0002574920654296875, -0.00015723705291748047, -5.698204040527344e-05, 4.3272972106933594e-05, 0.00014352798461914062, 0.00024378299713134766, 0.0003440380096435547, 0.0004442930221557617, 0.0005445480346679688, 0.0006448030471801758, 0.0007450580596923828, 0.0008453130722045898, 0.0009455680847167969, 0.001045823097229004, 0.001146078109741211, 0.001246333122253418, 0.001346588134765625, 0.001446843147277832, 0.001547098159790039, 0.001647353172302246, 0.0017476081848144531, 0.0018478631973266602, 0.0019481182098388672, 0.0020483732223510742, 0.0021486282348632812, 0.0022488832473754883, 0.0023491382598876953, 0.0024493932723999023, 0.0025496482849121094, 0.0026499032974243164, 0.0027501583099365234, 0.0028504133224487305, 0.0029506683349609375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 13.0, 9.0, 10.0, 19.0, 22.0, 36.0, 27.0, 53.0, 54.0, 77.0, 120.0, 130.0, 181.0, 196.0, 320.0, 456.0, 594.0, 872.0, 1407.0, 2409.0, 5161.0, 13980.0, 64290.0, 834016.0, 93817.0, 16841.0, 5833.0, 2744.0, 1466.0, 961.0, 620.0, 483.0, 360.0, 208.0, 173.0, 152.0, 115.0, 79.0, 48.0, 46.0, 46.0, 39.0, 17.0, 15.0, 10.0, 8.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0015897750854492188, -0.0015409737825393677, -0.0014921724796295166, -0.0014433711767196655, -0.0013945698738098145, -0.0013457685708999634, -0.0012969672679901123, -0.0012481659650802612, -0.0011993646621704102, -0.001150563359260559, -0.001101762056350708, -0.001052960753440857, -0.0010041594505310059, -0.0009553581476211548, -0.0009065568447113037, -0.0008577555418014526, -0.0008089542388916016, -0.0007601529359817505, -0.0007113516330718994, -0.0006625503301620483, -0.0006137490272521973, -0.0005649477243423462, -0.0005161464214324951, -0.00046734511852264404, -0.00041854381561279297, -0.0003697425127029419, -0.0003209412097930908, -0.00027213990688323975, -0.00022333860397338867, -0.0001745373010635376, -0.00012573599815368652, -7.693469524383545e-05, -2.8133392333984375e-05, 2.06679105758667e-05, 6.946921348571777e-05, 0.00011827051639556885, 0.00016707181930541992, 0.000215873122215271, 0.00026467442512512207, 0.00031347572803497314, 0.0003622770309448242, 0.0004110783338546753, 0.00045987963676452637, 0.0005086809396743774, 0.0005574822425842285, 0.0006062835454940796, 0.0006550848484039307, 0.0007038861513137817, 0.0007526874542236328, 0.0008014887571334839, 0.000850290060043335, 0.000899091362953186, 0.0009478926658630371, 0.0009966939687728882, 0.0010454952716827393, 0.0010942965745925903, 0.0011430978775024414, 0.0011918991804122925, 0.0012407004833221436, 0.0012895017862319946, 0.0013383030891418457, 0.0013871043920516968, 0.0014359056949615479, 0.001484706997871399, 0.00153350830078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 2.0, 6.0, 8.0, 7.0, 7.0, 11.0, 10.0, 23.0, 27.0, 37.0, 50.0, 92.0, 120.0, 177.0, 116.0, 85.0, 55.0, 36.0, 23.0, 14.0, 20.0, 13.0, 11.0, 5.0, 9.0, 8.0, 7.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5506520867347717e-06, -1.4919787645339966e-06, -1.4333054423332214e-06, -1.3746321201324463e-06, -1.3159587979316711e-06, -1.257285475730896e-06, -1.1986121535301208e-06, -1.1399388313293457e-06, -1.0812655091285706e-06, -1.0225921869277954e-06, -9.639188647270203e-07, -9.052455425262451e-07, -8.4657222032547e-07, -7.878988981246948e-07, -7.292255759239197e-07, -6.705522537231445e-07, -6.118789315223694e-07, -5.532056093215942e-07, -4.945322871208191e-07, -4.3585896492004395e-07, -3.771856427192688e-07, -3.1851232051849365e-07, -2.598389983177185e-07, -2.0116567611694336e-07, -1.424923539161682e-07, -8.381903171539307e-08, -2.514570951461792e-08, 3.3527612686157227e-08, 9.220093488693237e-08, 1.5087425708770752e-07, 2.0954757928848267e-07, 2.682209014892578e-07, 3.2689422369003296e-07, 3.855675458908081e-07, 4.4424086809158325e-07, 5.029141902923584e-07, 5.615875124931335e-07, 6.202608346939087e-07, 6.789341568946838e-07, 7.37607479095459e-07, 7.962808012962341e-07, 8.549541234970093e-07, 9.136274456977844e-07, 9.723007678985596e-07, 1.0309740900993347e-06, 1.0896474123001099e-06, 1.148320734500885e-06, 1.2069940567016602e-06, 1.2656673789024353e-06, 1.3243407011032104e-06, 1.3830140233039856e-06, 1.4416873455047607e-06, 1.5003606677055359e-06, 1.559033989906311e-06, 1.6177073121070862e-06, 1.6763806343078613e-06, 1.7350539565086365e-06, 1.7937272787094116e-06, 1.8524006009101868e-06, 1.911073923110962e-06, 1.969747245311737e-06, 2.028420567512512e-06, 2.0870938897132874e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 4.0, 8.0, 10.0, 11.0, 14.0, 20.0, 26.0, 34.0, 53.0, 70.0, 68.0, 112.0, 141.0, 231.0, 308.0, 384.0, 558.0, 776.0, 1183.0, 1755.0, 2825.0, 4395.0, 8174.0, 17251.0, 50416.0, 677859.0, 216669.0, 33953.0, 13158.0, 6687.0, 3800.0, 2397.0, 1556.0, 1100.0, 733.0, 471.0, 356.0, 277.0, 183.0, 128.0, 92.0, 82.0, 64.0, 56.0, 25.0, 23.0, 21.0, 14.0, 11.0, 5.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014543533325195312, -0.0014113783836364746, -0.001368403434753418, -0.0013254284858703613, -0.0012824535369873047, -0.001239478588104248, -0.0011965036392211914, -0.0011535286903381348, -0.0011105537414550781, -0.0010675787925720215, -0.0010246038436889648, -0.0009816288948059082, -0.0009386539459228516, -0.0008956789970397949, -0.0008527040481567383, -0.0008097290992736816, -0.000766754150390625, -0.0007237792015075684, -0.0006808042526245117, -0.0006378293037414551, -0.0005948543548583984, -0.0005518794059753418, -0.0005089044570922852, -0.0004659295082092285, -0.0004229545593261719, -0.00037997961044311523, -0.0003370046615600586, -0.00029402971267700195, -0.0002510547637939453, -0.00020807981491088867, -0.00016510486602783203, -0.0001221299171447754, -7.915496826171875e-05, -3.618001937866211e-05, 6.794929504394531e-06, 4.976987838745117e-05, 9.274482727050781e-05, 0.00013571977615356445, 0.0001786947250366211, 0.00022166967391967773, 0.0002646446228027344, 0.000307619571685791, 0.00035059452056884766, 0.0003935694694519043, 0.00043654441833496094, 0.0004795193672180176, 0.0005224943161010742, 0.0005654692649841309, 0.0006084442138671875, 0.0006514191627502441, 0.0006943941116333008, 0.0007373690605163574, 0.0007803440093994141, 0.0008233189582824707, 0.0008662939071655273, 0.000909268856048584, 0.0009522438049316406, 0.0009952187538146973, 0.001038193702697754, 0.0010811686515808105, 0.0011241436004638672, 0.0011671185493469238, 0.0012100934982299805, 0.0012530684471130371, 0.0012960433959960938]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 5.0, 2.0, 9.0, 3.0, 11.0, 16.0, 26.0, 29.0, 51.0, 145.0, 330.0, 158.0, 65.0, 40.0, 30.0, 15.0, 9.0, 14.0, 8.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004658699035644531, -0.0004534870386123657, -0.0004411041736602783, -0.0004287213087081909, -0.0004163384437561035, -0.0004039555788040161, -0.0003915727138519287, -0.0003791898488998413, -0.0003668069839477539, -0.0003544241189956665, -0.0003420412540435791, -0.0003296583890914917, -0.0003172755241394043, -0.0003048926591873169, -0.0002925097942352295, -0.0002801269292831421, -0.0002677440643310547, -0.0002553611993789673, -0.00024297833442687988, -0.00023059546947479248, -0.00021821260452270508, -0.00020582973957061768, -0.00019344687461853027, -0.00018106400966644287, -0.00016868114471435547, -0.00015629827976226807, -0.00014391541481018066, -0.00013153254985809326, -0.00011914968490600586, -0.00010676681995391846, -9.438395500183105e-05, -8.200109004974365e-05, -6.961822509765625e-05, -5.723536014556885e-05, -4.4852495193481445e-05, -3.246963024139404e-05, -2.008676528930664e-05, -7.703900337219238e-06, 4.678964614868164e-06, 1.7061829566955566e-05, 2.944469451904297e-05, 4.182755947113037e-05, 5.4210424423217773e-05, 6.659328937530518e-05, 7.897615432739258e-05, 9.135901927947998e-05, 0.00010374188423156738, 0.00011612474918365479, 0.0001285076141357422, 0.0001408904790878296, 0.000153273344039917, 0.0001656562089920044, 0.0001780390739440918, 0.0001904219388961792, 0.0002028048038482666, 0.000215187668800354, 0.0002275705337524414, 0.0002399533987045288, 0.0002523362636566162, 0.0002647191286087036, 0.000277101993560791, 0.0002894848585128784, 0.0003018677234649658, 0.0003142505884170532, 0.0003266334533691406]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 16.0, 17.0, 21.0, 27.0, 35.0, 57.0, 66.0, 83.0, 118.0, 108.0, 104.0, 77.0, 81.0, 46.0, 37.0, 28.0, 21.0, 11.0, 9.0, 4.0, 10.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007812042720615864, -0.0075183832086622715, -0.0072247241623699665, -0.006931064650416374, -0.006637405604124069, -0.006343746092170477, -0.006050086580216885, -0.00575642753392458, -0.005462768021970987, -0.005169108510017395, -0.00487544946372509, -0.004581789951771498, -0.004288130439817905, -0.0039944713935256, -0.003700811881572008, -0.0034071526024490595, -0.003113493323326111, -0.002819834044203162, -0.0025261747650802135, -0.0022325152531266212, -0.0019388559740036726, -0.001645196694880724, -0.0013515372993424535, -0.001057877903804183, -0.0007642186246812344, -0.0004705592873506248, -0.00017689995002001524, 0.00011675938731059432, 0.0004104187246412039, 0.0007040780037641525, 0.000997737399302423, 0.0012913967948406935, 0.0015850551426410675, 0.0018787144217640162, 0.002172373700886965, 0.002466033212840557, 0.0027596924919635057, 0.0030533517710864544, 0.0033470112830400467, 0.0036406705621629953, 0.003934329841285944, 0.004227989353239536, 0.004521648399531841, 0.004815307911485434, 0.005108967423439026, 0.005402626469731331, 0.005696285981684923, 0.0059899454936385155, 0.0062836045399308205, 0.006577264051884413, 0.006870923098176718, 0.00716458261013031, 0.007458241656422615, 0.007751901168376207, 0.0080455606803298, 0.008339219726622105, 0.008632879704236984, 0.00892653875052929, 0.009220198728144169, 0.009513857774436474, 0.009807516820728779, 0.010101176798343658, 0.010394835844635963, 0.010688494890928268, 0.010982153937220573]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 8.0, 14.0, 16.0, 15.0, 18.0, 26.0, 26.0, 21.0, 31.0, 34.0, 33.0, 48.0, 46.0, 46.0, 48.0, 43.0, 36.0, 49.0, 43.0, 34.0, 37.0, 41.0, 39.0, 27.0, 25.0, 31.0, 26.0, 17.0, 9.0, 18.0, 11.0, 11.0, 13.0, 6.0, 2.0, 8.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00555018987506628, -0.0053834738209843636, -0.005216758232563734, -0.005050042178481817, -0.004883326590061188, -0.004716610535979271, -0.004549894481897354, -0.004383178427815437, -0.004216462839394808, -0.004049746785312891, -0.0038830311968922615, -0.0037163151428103447, -0.0035495993215590715, -0.0033828835003077984, -0.0032161674462258816, -0.0030494516249746084, -0.0028827358037233353, -0.002716019982472062, -0.002549304161220789, -0.002382588107138872, -0.002215872285887599, -0.002049156464636326, -0.0018824405269697309, -0.0017157245893031359, -0.0015490087680518627, -0.0013822929468005896, -0.0012155770091339946, -0.0010488610714673996, -0.0008821452502161264, -0.0007154293707571924, -0.0005487134912982583, -0.0003819975536316633, -0.00021528219804167747, -4.8566318582743406e-05, 0.00011814956087619066, 0.00028486544033512473, 0.0004515813197940588, 0.0006182971992529929, 0.0007850130787119269, 0.0009517290163785219, 0.001118444837629795, 0.0012851606588810682, 0.0014518765965476632, 0.0016185925342142582, 0.0017853083554655313, 0.0019520241767168045, 0.0021187402307987213, 0.0022854560520499945, 0.0024521718733012676, 0.0026188876945525408, 0.002785603515803814, 0.0029523195698857307, 0.003119035391137004, 0.003285751212388277, 0.003452467266470194, 0.003619183087721467, 0.00378589890897274, 0.003952614963054657, 0.0041193305514752865, 0.004286046605557203, 0.004452762193977833, 0.00461947824805975, 0.004786194302141666, 0.004952910356223583, 0.005119625944644213]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 11.0, 19.0, 30.0, 43.0, 63.0, 94.0, 145.0, 182.0, 255.0, 362.0, 481.0, 694.0, 1013.0, 1483.0, 2120.0, 3261.0, 4783.0, 7446.0, 12005.0, 19582.0, 32803.0, 56856.0, 106084.0, 224396.0, 678569.0, 1700998.0, 814604.0, 251211.0, 115040.0, 61908.0, 36351.0, 21671.0, 13681.0, 8521.0, 5743.0, 3681.0, 2509.0, 1631.0, 1146.0, 840.0, 604.0, 410.0, 289.0, 187.0, 126.0, 116.0, 57.0, 50.0, 32.0, 26.0, 23.0, 23.0, 3.0, 11.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.00630950927734375, -0.0060961246490478516, -0.005882740020751953, -0.005669355392456055, -0.005455970764160156, -0.005242586135864258, -0.005029201507568359, -0.004815816879272461, -0.0046024322509765625, -0.004389047622680664, -0.004175662994384766, -0.003962278366088867, -0.0037488937377929688, -0.0035355091094970703, -0.003322124481201172, -0.0031087398529052734, -0.002895355224609375, -0.0026819705963134766, -0.002468585968017578, -0.0022552013397216797, -0.0020418167114257812, -0.0018284320831298828, -0.0016150474548339844, -0.001401662826538086, -0.0011882781982421875, -0.0009748935699462891, -0.0007615089416503906, -0.0005481243133544922, -0.00033473968505859375, -0.00012135505676269531, 9.202957153320312e-05, 0.00030541419982910156, 0.000518798828125, 0.0007321834564208984, 0.0009455680847167969, 0.0011589527130126953, 0.0013723373413085938, 0.0015857219696044922, 0.0017991065979003906, 0.002012491226196289, 0.0022258758544921875, 0.002439260482788086, 0.0026526451110839844, 0.002866029739379883, 0.0030794143676757812, 0.0032927989959716797, 0.003506183624267578, 0.0037195682525634766, 0.003932952880859375, 0.0041463375091552734, 0.004359722137451172, 0.00457310676574707, 0.004786491394042969, 0.004999876022338867, 0.005213260650634766, 0.005426645278930664, 0.0056400299072265625, 0.005853414535522461, 0.006066799163818359, 0.006280183792114258, 0.006493568420410156, 0.006706953048706055, 0.006920337677001953, 0.0071337223052978516, 0.00734710693359375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 8.0, 5.0, 6.0, 11.0, 18.0, 19.0, 17.0, 22.0, 29.0, 28.0, 26.0, 28.0, 41.0, 41.0, 57.0, 55.0, 47.0, 45.0, 46.0, 31.0, 28.0, 48.0, 50.0, 34.0, 52.0, 35.0, 27.0, 21.0, 17.0, 18.0, 18.0, 14.0, 12.0, 9.0, 8.0, 8.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00362396240234375, -0.0035137832164764404, -0.003403604030609131, -0.0032934248447418213, -0.0031832456588745117, -0.003073066473007202, -0.0029628872871398926, -0.002852708101272583, -0.0027425289154052734, -0.002632349729537964, -0.0025221705436706543, -0.0024119913578033447, -0.002301812171936035, -0.0021916329860687256, -0.002081453800201416, -0.0019712746143341064, -0.0018610954284667969, -0.0017509162425994873, -0.0016407370567321777, -0.0015305578708648682, -0.0014203786849975586, -0.001310199499130249, -0.0012000203132629395, -0.0010898411273956299, -0.0009796619415283203, -0.0008694827556610107, -0.0007593035697937012, -0.0006491243839263916, -0.000538945198059082, -0.00042876601219177246, -0.0003185868263244629, -0.00020840764045715332, -9.822845458984375e-05, 1.195073127746582e-05, 0.0001221299171447754, 0.00023230910301208496, 0.00034248828887939453, 0.0004526674747467041, 0.0005628466606140137, 0.0006730258464813232, 0.0007832050323486328, 0.0008933842182159424, 0.001003563404083252, 0.0011137425899505615, 0.001223921775817871, 0.0013341009616851807, 0.0014442801475524902, 0.0015544593334197998, 0.0016646385192871094, 0.001774817705154419, 0.0018849968910217285, 0.001995176076889038, 0.0021053552627563477, 0.0022155344486236572, 0.002325713634490967, 0.0024358928203582764, 0.002546072006225586, 0.0026562511920928955, 0.002766430377960205, 0.0028766095638275146, 0.0029867887496948242, 0.003096967935562134, 0.0032071471214294434, 0.003317326307296753, 0.0034275054931640625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 16.0, 29.0, 33.0, 46.0, 103.0, 132.0, 230.0, 365.0, 635.0, 1122.0, 2028.0, 3806.0, 7163.0, 15163.0, 33260.0, 84485.0, 253701.0, 1014393.0, 2021932.0, 507536.0, 148302.0, 53994.0, 23242.0, 10743.0, 5305.0, 2849.0, 1557.0, 847.0, 510.0, 261.0, 181.0, 107.0, 66.0, 51.0, 30.0, 15.0, 8.0, 6.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0091705322265625, -0.008886337280273438, -0.008602142333984375, -0.008317947387695312, -0.00803375244140625, -0.0077495574951171875, -0.007465362548828125, -0.0071811676025390625, -0.00689697265625, -0.0066127777099609375, -0.006328582763671875, -0.0060443878173828125, -0.00576019287109375, -0.0054759979248046875, -0.005191802978515625, -0.0049076080322265625, -0.0046234130859375, -0.0043392181396484375, -0.004055023193359375, -0.0037708282470703125, -0.00348663330078125, -0.0032024383544921875, -0.002918243408203125, -0.0026340484619140625, -0.002349853515625, -0.0020656585693359375, -0.001781463623046875, -0.0014972686767578125, -0.00121307373046875, -0.0009288787841796875, -0.000644683837890625, -0.0003604888916015625, -7.62939453125e-05, 0.0002079010009765625, 0.000492095947265625, 0.0007762908935546875, 0.00106048583984375, 0.0013446807861328125, 0.001628875732421875, 0.0019130706787109375, 0.002197265625, 0.0024814605712890625, 0.002765655517578125, 0.0030498504638671875, 0.00333404541015625, 0.0036182403564453125, 0.003902435302734375, 0.0041866302490234375, 0.0044708251953125, 0.0047550201416015625, 0.005039215087890625, 0.0053234100341796875, 0.00560760498046875, 0.0058917999267578125, 0.006175994873046875, 0.0064601898193359375, 0.006744384765625, 0.0070285797119140625, 0.007312774658203125, 0.0075969696044921875, 0.00788116455078125, 0.008165359497070312, 0.008449554443359375, 0.008733749389648438, 0.0090179443359375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 12.0, 12.0, 13.0, 21.0, 20.0, 21.0, 44.0, 65.0, 66.0, 91.0, 108.0, 132.0, 156.0, 189.0, 234.0, 282.0, 363.0, 385.0, 372.0, 260.0, 260.0, 181.0, 149.0, 138.0, 106.0, 71.0, 71.0, 57.0, 46.0, 19.0, 25.0, 30.0, 12.0, 12.0, 8.0, 5.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016937255859375, -0.00163191556930542, -0.0015701055526733398, -0.0015082955360412598, -0.0014464855194091797, -0.0013846755027770996, -0.0013228654861450195, -0.0012610554695129395, -0.0011992454528808594, -0.0011374354362487793, -0.0010756254196166992, -0.0010138154029846191, -0.0009520053863525391, -0.000890195369720459, -0.0008283853530883789, -0.0007665753364562988, -0.0007047653198242188, -0.0006429553031921387, -0.0005811452865600586, -0.0005193352699279785, -0.00045752525329589844, -0.00039571523666381836, -0.0003339052200317383, -0.0002720952033996582, -0.00021028518676757812, -0.00014847517013549805, -8.666515350341797e-05, -2.485513687133789e-05, 3.695487976074219e-05, 9.876489639282227e-05, 0.00016057491302490234, 0.00022238492965698242, 0.0002841949462890625, 0.0003460049629211426, 0.00040781497955322266, 0.00046962499618530273, 0.0005314350128173828, 0.0005932450294494629, 0.000655055046081543, 0.000716865062713623, 0.0007786750793457031, 0.0008404850959777832, 0.0009022951126098633, 0.0009641051292419434, 0.0010259151458740234, 0.0010877251625061035, 0.0011495351791381836, 0.0012113451957702637, 0.0012731552124023438, 0.0013349652290344238, 0.001396775245666504, 0.001458585262298584, 0.001520395278930664, 0.0015822052955627441, 0.0016440153121948242, 0.0017058253288269043, 0.0017676353454589844, 0.0018294453620910645, 0.0018912553787231445, 0.0019530653953552246, 0.0020148754119873047, 0.0020766854286193848, 0.002138495445251465, 0.002200305461883545, 0.002262115478515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 18.0, 6.0, 12.0, 14.0, 21.0, 21.0, 30.0, 45.0, 46.0, 55.0, 88.0, 94.0, 100.0, 86.0, 65.0, 55.0, 40.0, 39.0, 19.0, 21.0, 26.0, 16.0, 15.0, 9.0, 4.0, 5.0, 4.0, 3.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.003964461386203766, -0.0038198456168174744, -0.003675229847431183, -0.0035306140780448914, -0.0033859983086586, -0.0032413825392723083, -0.003096766769886017, -0.0029521510004997253, -0.002807535231113434, -0.0026629194617271423, -0.002518303692340851, -0.0023736879229545593, -0.002229072153568268, -0.0020844563841819763, -0.0019398406147956848, -0.0017952248454093933, -0.0016506090760231018, -0.0015059933066368103, -0.0013613775372505188, -0.0012167617678642273, -0.0010721459984779358, -0.0009275302290916443, -0.0007829144597053528, -0.0006382986903190613, -0.0004936829209327698, -0.00034906715154647827, -0.00020445138216018677, -5.9835612773895264e-05, 8.478015661239624e-05, 0.00022939592599868774, 0.00037401169538497925, 0.0005186274647712708, 0.0006632436998188496, 0.0008078594692051411, 0.0009524752385914326, 0.001097091007977724, 0.0012417067773640156, 0.001386322546750307, 0.0015309383161365986, 0.00167555408552289, 0.0018201698549091816, 0.001964785624295473, 0.0021094013936817646, 0.002254017163068056, 0.0023986329324543476, 0.002543248701840639, 0.0026878644712269306, 0.002832480240613222, 0.0029770960099995136, 0.003121711779385805, 0.0032663275487720966, 0.003410943318158388, 0.0035555590875446796, 0.003700174856930971, 0.0038447906263172626, 0.003989406395703554, 0.004134022165089846, 0.004278637934476137, 0.004423253703862429, 0.00456786947324872, 0.004712485242635012, 0.004857101012021303, 0.005001716781407595, 0.005146332550793886, 0.005290948320180178]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 8.0, 8.0, 8.0, 8.0, 6.0, 6.0, 7.0, 14.0, 14.0, 25.0, 24.0, 19.0, 23.0, 23.0, 25.0, 34.0, 36.0, 34.0, 38.0, 34.0, 36.0, 43.0, 45.0, 34.0, 38.0, 46.0, 42.0, 28.0, 38.0, 33.0, 26.0, 20.0, 30.0, 17.0, 15.0, 16.0, 13.0, 10.0, 12.0, 11.0, 10.0, 9.0, 8.0, 4.0, 2.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.0031083417125046253, -0.0030097756534814835, -0.0029112095944583416, -0.0028126435354351997, -0.002714077476412058, -0.002615511417388916, -0.0025169451255351305, -0.0024183790665119886, -0.0023198130074888468, -0.002221246948465705, -0.002122680889442563, -0.002024114830419421, -0.0019255486549809575, -0.0018269825959578156, -0.001728416420519352, -0.00162985036149621, -0.0015312843024730682, -0.0014327182434499264, -0.0013341521844267845, -0.0012355860089883208, -0.001137019949965179, -0.001038453890942037, -0.0009398877737112343, -0.0008413216564804316, -0.0007427555974572897, -0.0006441895384341478, -0.0005456234212033451, -0.00044705733307637274, -0.0003484912449494004, -0.00024992518592625856, -0.0001513590686954558, -5.2792951464653015e-05, 4.5773107558488846e-05, 0.00014433919568546116, 0.00024290528381243348, 0.0003414713719394058, 0.0004400374600663781, 0.00053860351908952, 0.0006371696363203228, 0.0007357357535511255, 0.0008343018125742674, 0.0009328678715974092, 0.0010314339306205511, 0.0011300001060590148, 0.0012285661650821567, 0.0013271322241052985, 0.0014256983995437622, 0.001524264458566904, 0.001622830517590046, 0.0017213965766131878, 0.0018199626356363297, 0.0019185288110747933, 0.0020170947536826134, 0.0021156608127057552, 0.0022142271045595407, 0.0023127931635826826, 0.0024113592226058245, 0.0025099252816289663, 0.002608491340652108, 0.00270705739967525, 0.0028056236915290356, 0.0029041897505521774, 0.0030027558095753193, 0.003101321868598461, 0.003199887927621603]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 9.0, 13.0, 23.0, 22.0, 31.0, 43.0, 73.0, 134.0, 164.0, 301.0, 451.0, 793.0, 1325.0, 2499.0, 4916.0, 10191.0, 24696.0, 79348.0, 490492.0, 332932.0, 61095.0, 20645.0, 8843.0, 4182.0, 2268.0, 1167.0, 698.0, 434.0, 249.0, 187.0, 106.0, 66.0, 44.0, 27.0, 24.0, 14.0, 9.0, 11.0, 10.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00457000732421875, -0.004422128200531006, -0.004274249076843262, -0.004126369953155518, -0.0039784908294677734, -0.0038306117057800293, -0.003682732582092285, -0.003534853458404541, -0.003386974334716797, -0.0032390952110290527, -0.0030912160873413086, -0.0029433369636535645, -0.0027954578399658203, -0.002647578716278076, -0.002499699592590332, -0.002351820468902588, -0.0022039413452148438, -0.0020560622215270996, -0.0019081830978393555, -0.0017603039741516113, -0.0016124248504638672, -0.001464545726776123, -0.001316666603088379, -0.0011687874794006348, -0.0010209083557128906, -0.0008730292320251465, -0.0007251501083374023, -0.0005772709846496582, -0.00042939186096191406, -0.0002815127372741699, -0.00013363361358642578, 1.424551010131836e-05, 0.0001621246337890625, 0.00031000375747680664, 0.0004578828811645508, 0.0006057620048522949, 0.0007536411285400391, 0.0009015202522277832, 0.0010493993759155273, 0.0011972784996032715, 0.0013451576232910156, 0.0014930367469787598, 0.001640915870666504, 0.001788794994354248, 0.0019366741180419922, 0.0020845532417297363, 0.0022324323654174805, 0.0023803114891052246, 0.0025281906127929688, 0.002676069736480713, 0.002823948860168457, 0.002971827983856201, 0.0031197071075439453, 0.0032675862312316895, 0.0034154653549194336, 0.0035633444786071777, 0.003711223602294922, 0.003859102725982666, 0.00400698184967041, 0.004154860973358154, 0.0043027400970458984, 0.004450619220733643, 0.004598498344421387, 0.004746377468109131, 0.004894256591796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 6.0, 6.0, 11.0, 6.0, 9.0, 7.0, 27.0, 15.0, 26.0, 23.0, 22.0, 19.0, 34.0, 34.0, 37.0, 42.0, 48.0, 40.0, 42.0, 40.0, 41.0, 57.0, 37.0, 36.0, 36.0, 32.0, 35.0, 29.0, 22.0, 18.0, 15.0, 22.0, 15.0, 13.0, 8.0, 11.0, 18.0, 9.0, 12.0, 2.0, 12.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.003513336181640625, -0.003403306007385254, -0.003293275833129883, -0.0031832456588745117, -0.0030732154846191406, -0.0029631853103637695, -0.0028531551361083984, -0.0027431249618530273, -0.0026330947875976562, -0.002523064613342285, -0.002413034439086914, -0.002303004264831543, -0.002192974090576172, -0.0020829439163208008, -0.0019729137420654297, -0.0018628835678100586, -0.0017528533935546875, -0.0016428232192993164, -0.0015327930450439453, -0.0014227628707885742, -0.0013127326965332031, -0.001202702522277832, -0.001092672348022461, -0.0009826421737670898, -0.0008726119995117188, -0.0007625818252563477, -0.0006525516510009766, -0.0005425214767456055, -0.0004324913024902344, -0.0003224611282348633, -0.0002124309539794922, -0.0001024007797241211, 7.62939453125e-06, 0.0001176595687866211, 0.0002276897430419922, 0.0003377199172973633, 0.0004477500915527344, 0.0005577802658081055, 0.0006678104400634766, 0.0007778406143188477, 0.0008878707885742188, 0.0009979009628295898, 0.001107931137084961, 0.001217961311340332, 0.0013279914855957031, 0.0014380216598510742, 0.0015480518341064453, 0.0016580820083618164, 0.0017681121826171875, 0.0018781423568725586, 0.0019881725311279297, 0.0020982027053833008, 0.002208232879638672, 0.002318263053894043, 0.002428293228149414, 0.002538323402404785, 0.0026483535766601562, 0.0027583837509155273, 0.0028684139251708984, 0.0029784440994262695, 0.0030884742736816406, 0.0031985044479370117, 0.003308534622192383, 0.003418564796447754, 0.003528594970703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 7.0, 10.0, 15.0, 17.0, 28.0, 24.0, 35.0, 52.0, 71.0, 90.0, 106.0, 182.0, 233.0, 274.0, 461.0, 668.0, 1013.0, 1659.0, 2898.0, 5302.0, 11764.0, 39399.0, 531727.0, 393518.0, 35376.0, 10960.0, 5097.0, 2769.0, 1614.0, 987.0, 661.0, 416.0, 311.0, 195.0, 163.0, 100.0, 81.0, 64.0, 40.0, 36.0, 36.0, 27.0, 14.0, 13.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.005641937255859375, -0.005459725856781006, -0.005277514457702637, -0.005095303058624268, -0.0049130916595458984, -0.004730880260467529, -0.00454866886138916, -0.004366457462310791, -0.004184246063232422, -0.004002034664154053, -0.0038198232650756836, -0.0036376118659973145, -0.0034554004669189453, -0.003273189067840576, -0.003090977668762207, -0.002908766269683838, -0.0027265548706054688, -0.0025443434715270996, -0.0023621320724487305, -0.0021799206733703613, -0.001997709274291992, -0.001815497875213623, -0.001633286476135254, -0.0014510750770568848, -0.0012688636779785156, -0.0010866522789001465, -0.0009044408798217773, -0.0007222294807434082, -0.0005400180816650391, -0.0003578066825866699, -0.00017559528350830078, 6.616115570068359e-06, 0.0001888275146484375, 0.00037103891372680664, 0.0005532503128051758, 0.0007354617118835449, 0.0009176731109619141, 0.0010998845100402832, 0.0012820959091186523, 0.0014643073081970215, 0.0016465187072753906, 0.0018287301063537598, 0.002010941505432129, 0.002193152904510498, 0.002375364303588867, 0.0025575757026672363, 0.0027397871017456055, 0.0029219985008239746, 0.0031042098999023438, 0.003286421298980713, 0.003468632698059082, 0.003650844097137451, 0.0038330554962158203, 0.0040152668952941895, 0.004197478294372559, 0.004379689693450928, 0.004561901092529297, 0.004744112491607666, 0.004926323890686035, 0.005108535289764404, 0.0052907466888427734, 0.005472958087921143, 0.005655169486999512, 0.005837380886077881, 0.00601959228515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 9.0, 8.0, 18.0, 15.0, 13.0, 23.0, 27.0, 33.0, 24.0, 51.0, 31.0, 34.0, 36.0, 40.0, 43.0, 47.0, 46.0, 41.0, 43.0, 30.0, 46.0, 45.0, 45.0, 32.0, 22.0, 22.0, 27.0, 25.0, 23.0, 24.0, 10.0, 9.0, 6.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0028629302978515625, -0.002786785364151001, -0.0027106404304504395, -0.002634495496749878, -0.0025583505630493164, -0.002482205629348755, -0.0024060606956481934, -0.002329915761947632, -0.0022537708282470703, -0.002177625894546509, -0.0021014809608459473, -0.0020253360271453857, -0.0019491910934448242, -0.0018730461597442627, -0.0017969012260437012, -0.0017207562923431396, -0.0016446113586425781, -0.0015684664249420166, -0.001492321491241455, -0.0014161765575408936, -0.001340031623840332, -0.0012638866901397705, -0.001187741756439209, -0.0011115968227386475, -0.001035451889038086, -0.0009593069553375244, -0.0008831620216369629, -0.0008070170879364014, -0.0007308721542358398, -0.0006547272205352783, -0.0005785822868347168, -0.0005024373531341553, -0.00042629241943359375, -0.0003501474857330322, -0.0002740025520324707, -0.00019785761833190918, -0.00012171268463134766, -4.556775093078613e-05, 3.057718276977539e-05, 0.00010672211647033691, 0.00018286705017089844, 0.00025901198387145996, 0.0003351569175720215, 0.000411301851272583, 0.00048744678497314453, 0.0005635917186737061, 0.0006397366523742676, 0.0007158815860748291, 0.0007920265197753906, 0.0008681714534759521, 0.0009443163871765137, 0.0010204613208770752, 0.0010966062545776367, 0.0011727511882781982, 0.0012488961219787598, 0.0013250410556793213, 0.0014011859893798828, 0.0014773309230804443, 0.0015534758567810059, 0.0016296207904815674, 0.001705765724182129, 0.0017819106578826904, 0.001858055591583252, 0.0019342005252838135, 0.002010345458984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 5.0, 13.0, 9.0, 18.0, 22.0, 18.0, 36.0, 56.0, 79.0, 94.0, 141.0, 188.0, 257.0, 405.0, 584.0, 972.0, 1650.0, 2924.0, 5727.0, 12982.0, 45307.0, 780713.0, 154418.0, 23425.0, 8442.0, 4090.0, 2260.0, 1279.0, 794.0, 535.0, 316.0, 220.0, 153.0, 123.0, 80.0, 47.0, 55.0, 28.0, 25.0, 15.0, 14.0, 8.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0009050369262695312, -0.000875622034072876, -0.0008462071418762207, -0.0008167922496795654, -0.0007873773574829102, -0.0007579624652862549, -0.0007285475730895996, -0.0006991326808929443, -0.0006697177886962891, -0.0006403028964996338, -0.0006108880043029785, -0.0005814731121063232, -0.000552058219909668, -0.0005226433277130127, -0.0004932284355163574, -0.00046381354331970215, -0.0004343986511230469, -0.0004049837589263916, -0.00037556886672973633, -0.00034615397453308105, -0.0003167390823364258, -0.0002873241901397705, -0.00025790929794311523, -0.00022849440574645996, -0.0001990795135498047, -0.00016966462135314941, -0.00014024972915649414, -0.00011083483695983887, -8.14199447631836e-05, -5.200505256652832e-05, -2.2590160369873047e-05, 6.8247318267822266e-06, 3.62396240234375e-05, 6.565451622009277e-05, 9.506940841674805e-05, 0.00012448430061340332, 0.0001538991928100586, 0.00018331408500671387, 0.00021272897720336914, 0.00024214386940002441, 0.0002715587615966797, 0.00030097365379333496, 0.00033038854598999023, 0.0003598034381866455, 0.0003892183303833008, 0.00041863322257995605, 0.00044804811477661133, 0.0004774630069732666, 0.0005068778991699219, 0.0005362927913665771, 0.0005657076835632324, 0.0005951225757598877, 0.000624537467956543, 0.0006539523601531982, 0.0006833672523498535, 0.0007127821445465088, 0.0007421970367431641, 0.0007716119289398193, 0.0008010268211364746, 0.0008304417133331299, 0.0008598566055297852, 0.0008892714977264404, 0.0009186863899230957, 0.000948101282119751, 0.0009775161743164062]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 18.0, 11.0, 11.0, 14.0, 37.0, 25.0, 32.0, 36.0, 75.0, 30.0, 58.0, 43.0, 104.0, 57.0, 54.0, 97.0, 35.0, 37.0, 28.0, 54.0, 22.0, 14.0, 13.0, 22.0, 8.0, 7.0, 6.0, 10.0, 1.0, 4.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-06, -2.2491440176963806e-06, -2.173706889152527e-06, -2.098269760608673e-06, -2.0228326320648193e-06, -1.9473955035209656e-06, -1.8719583749771118e-06, -1.796521246433258e-06, -1.7210841178894043e-06, -1.6456469893455505e-06, -1.5702098608016968e-06, -1.494772732257843e-06, -1.4193356037139893e-06, -1.3438984751701355e-06, -1.2684613466262817e-06, -1.193024218082428e-06, -1.1175870895385742e-06, -1.0421499609947205e-06, -9.667128324508667e-07, -8.912757039070129e-07, -8.158385753631592e-07, -7.404014468193054e-07, -6.649643182754517e-07, -5.895271897315979e-07, -5.140900611877441e-07, -4.386529326438904e-07, -3.632158041000366e-07, -2.8777867555618286e-07, -2.123415470123291e-07, -1.3690441846847534e-07, -6.146728992462158e-08, 1.3969838619232178e-08, 8.940696716308594e-08, 1.648440957069397e-07, 2.4028122425079346e-07, 3.157183527946472e-07, 3.91155481338501e-07, 4.6659260988235474e-07, 5.420297384262085e-07, 6.174668669700623e-07, 6.92903995513916e-07, 7.683411240577698e-07, 8.437782526016235e-07, 9.192153811454773e-07, 9.94652509689331e-07, 1.0700896382331848e-06, 1.1455267667770386e-06, 1.2209638953208923e-06, 1.296401023864746e-06, 1.3718381524085999e-06, 1.4472752809524536e-06, 1.5227124094963074e-06, 1.5981495380401611e-06, 1.6735866665840149e-06, 1.7490237951278687e-06, 1.8244609236717224e-06, 1.8998980522155762e-06, 1.97533518075943e-06, 2.0507723093032837e-06, 2.1262094378471375e-06, 2.201646566390991e-06, 2.277083694934845e-06, 2.3525208234786987e-06, 2.4279579520225525e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 9.0, 7.0, 18.0, 26.0, 27.0, 50.0, 59.0, 94.0, 137.0, 203.0, 308.0, 545.0, 875.0, 1527.0, 2504.0, 4507.0, 8427.0, 17190.0, 41192.0, 141639.0, 605703.0, 145183.0, 41571.0, 17204.0, 8458.0, 4602.0, 2622.0, 1443.0, 903.0, 530.0, 322.0, 231.0, 125.0, 98.0, 68.0, 40.0, 27.0, 23.0, 12.0, 11.0, 9.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012159347534179688, -0.0011773407459259033, -0.0011387467384338379, -0.0011001527309417725, -0.001061558723449707, -0.0010229647159576416, -0.0009843707084655762, -0.0009457767009735107, -0.0009071826934814453, -0.0008685886859893799, -0.0008299946784973145, -0.000791400671005249, -0.0007528066635131836, -0.0007142126560211182, -0.0006756186485290527, -0.0006370246410369873, -0.0005984306335449219, -0.0005598366260528564, -0.000521242618560791, -0.0004826486110687256, -0.00044405460357666016, -0.0004054605960845947, -0.0003668665885925293, -0.00032827258110046387, -0.00028967857360839844, -0.000251084566116333, -0.00021249055862426758, -0.00017389655113220215, -0.00013530254364013672, -9.670853614807129e-05, -5.811452865600586e-05, -1.952052116394043e-05, 1.9073486328125e-05, 5.766749382019043e-05, 9.626150131225586e-05, 0.0001348555088043213, 0.00017344951629638672, 0.00021204352378845215, 0.0002506375312805176, 0.000289231538772583, 0.00032782554626464844, 0.00036641955375671387, 0.0004050135612487793, 0.0004436075687408447, 0.00048220157623291016, 0.0005207955837249756, 0.000559389591217041, 0.0005979835987091064, 0.0006365776062011719, 0.0006751716136932373, 0.0007137656211853027, 0.0007523596286773682, 0.0007909536361694336, 0.000829547643661499, 0.0008681416511535645, 0.0009067356586456299, 0.0009453296661376953, 0.0009839236736297607, 0.0010225176811218262, 0.0010611116886138916, 0.001099705696105957, 0.0011382997035980225, 0.0011768937110900879, 0.0012154877185821533, 0.0012540817260742188]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 8.0, 5.0, 9.0, 3.0, 10.0, 16.0, 17.0, 27.0, 46.0, 51.0, 86.0, 141.0, 213.0, 138.0, 65.0, 54.0, 29.0, 15.0, 11.0, 5.0, 4.0, 5.0, 5.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004067420959472656, -0.00039487332105636597, -0.0003830045461654663, -0.00037113577127456665, -0.000359266996383667, -0.00034739822149276733, -0.0003355294466018677, -0.000323660671710968, -0.00031179189682006836, -0.0002999231219291687, -0.00028805434703826904, -0.0002761855721473694, -0.0002643167972564697, -0.00025244802236557007, -0.0002405792474746704, -0.00022871047258377075, -0.0002168416976928711, -0.00020497292280197144, -0.00019310414791107178, -0.00018123537302017212, -0.00016936659812927246, -0.0001574978232383728, -0.00014562904834747314, -0.00013376027345657349, -0.00012189149856567383, -0.00011002272367477417, -9.815394878387451e-05, -8.628517389297485e-05, -7.44163990020752e-05, -6.254762411117554e-05, -5.067884922027588e-05, -3.881007432937622e-05, -2.6941299438476562e-05, -1.5072524547576904e-05, -3.203749656677246e-06, 8.665025234222412e-06, 2.053380012512207e-05, 3.240257501602173e-05, 4.427134990692139e-05, 5.6140124797821045e-05, 6.80088996887207e-05, 7.987767457962036e-05, 9.174644947052002e-05, 0.00010361522436141968, 0.00011548399925231934, 0.000127352774143219, 0.00013922154903411865, 0.0001510903239250183, 0.00016295909881591797, 0.00017482787370681763, 0.00018669664859771729, 0.00019856542348861694, 0.0002104341983795166, 0.00022230297327041626, 0.00023417174816131592, 0.0002460405230522156, 0.00025790929794311523, 0.0002697780728340149, 0.00028164684772491455, 0.0002935156226158142, 0.00030538439750671387, 0.0003172531723976135, 0.0003291219472885132, 0.00034099072217941284, 0.0003528594970703125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 5.0, 9.0, 6.0, 9.0, 9.0, 14.0, 28.0, 22.0, 28.0, 38.0, 67.0, 65.0, 78.0, 104.0, 102.0, 72.0, 66.0, 52.0, 50.0, 22.0, 27.0, 30.0, 29.0, 8.0, 11.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.004126824904233217, -0.003975533880293369, -0.0038242428563535213, -0.0036729518324136734, -0.0035216608084738255, -0.0033703697845339775, -0.003219078527763486, -0.003067787503823638, -0.00291649647988379, -0.002765205455943942, -0.002613914432004094, -0.002462623408064246, -0.0023113321512937546, -0.0021600411273539066, -0.0020087501034140587, -0.0018574590794742107, -0.0017061680555343628, -0.0015548770315945148, -0.001403586007654667, -0.0012522948672994971, -0.0011010038433596492, -0.0009497128194198012, -0.0007984217372722924, -0.0006471306551247835, -0.0004958396311849356, -0.00034454857814125717, -0.00019325752509757876, -4.196647205390036e-05, 0.00010932458098977804, 0.000260615604929626, 0.00041190668707713485, 0.0005631977692246437, 0.000714489258825779, 0.0008657802827656269, 0.0010170713067054749, 0.0011683624470606446, 0.0013196534710004926, 0.0014709444949403405, 0.0016222356352955103, 0.0017735266592353582, 0.0019248176831752062, 0.002076108707115054, 0.002227399731054902, 0.00237869075499475, 0.0025299820117652416, 0.0026812730357050896, 0.0028325640596449375, 0.0029838550835847855, 0.0031351461075246334, 0.0032864371314644814, 0.0034377281554043293, 0.0035890191793441772, 0.003740310203284025, 0.003891601227223873, 0.004042892251163721, 0.004194183275103569, 0.004345474764704704, 0.004496765788644552, 0.0046480568125844, 0.004799347836524248, 0.004950638860464096, 0.005101929884403944, 0.005253220908343792, 0.005404512397944927, 0.005555802956223488]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 7.0, 6.0, 9.0, 7.0, 4.0, 15.0, 29.0, 18.0, 18.0, 24.0, 16.0, 25.0, 36.0, 34.0, 31.0, 37.0, 33.0, 38.0, 38.0, 46.0, 37.0, 36.0, 44.0, 38.0, 39.0, 30.0, 50.0, 23.0, 25.0, 18.0, 23.0, 26.0, 9.0, 15.0, 17.0, 10.0, 15.0, 7.0, 9.0, 9.0, 3.0, 5.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.0031068657990545034, -0.003007764695212245, -0.0029086635913699865, -0.0028095622546970844, -0.002710461150854826, -0.0026113600470125675, -0.002512258943170309, -0.0024131578393280506, -0.002314056735485792, -0.0022149556316435337, -0.0021158545278012753, -0.002016753423959017, -0.0019176520872861147, -0.0018185509834438562, -0.0017194498796015978, -0.0016203487757593393, -0.0015212474390864372, -0.0014221463352441788, -0.0013230451149865985, -0.00122394401114434, -0.0011248427908867598, -0.0010257416870445013, -0.0009266405832022429, -0.0008275394211523235, -0.0007284382591024041, -0.0006293370970524848, -0.0005302359350025654, -0.00043113483116030693, -0.00033203366911038756, -0.0002329325070604682, -0.00013383140321820974, -3.473024116829038e-05, 6.437068805098534e-05, 0.00016347183554898947, 0.0002625729830469936, 0.0003616741159930825, 0.0004607752780430019, 0.0005598764400929213, 0.0006589775439351797, 0.0007580787059850991, 0.0008571798680350184, 0.0009562810300849378, 0.0010553821921348572, 0.0011544832959771156, 0.001253584399819374, 0.0013526856200769544, 0.0014517867239192128, 0.001550887944176793, 0.0016499890480190516, 0.00174909015186131, 0.0018481913721188903, 0.0019472924759611487, 0.002046393696218729, 0.0021454948000609875, 0.002244595903903246, 0.0023436970077455044, 0.002442798111587763, 0.0025418992154300213, 0.0026410003192722797, 0.002740101423114538, 0.0028392027597874403, 0.0029383038636296988, 0.003037404967471957, 0.0031365060713142157, 0.0032356074079871178]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 18.0, 14.0, 29.0, 34.0, 65.0, 80.0, 118.0, 173.0, 225.0, 353.0, 515.0, 684.0, 1013.0, 1449.0, 2160.0, 3283.0, 4915.0, 7532.0, 11861.0, 19055.0, 31434.0, 52649.0, 93591.0, 171239.0, 248007.0, 169350.0, 92562.0, 52111.0, 30950.0, 18898.0, 11676.0, 7444.0, 4924.0, 3171.0, 2171.0, 1480.0, 1058.0, 691.0, 466.0, 308.0, 240.0, 180.0, 104.0, 95.0, 54.0, 36.0, 23.0, 24.0, 15.0, 5.0, 11.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.006862640380859375, -0.006657719612121582, -0.006452798843383789, -0.006247878074645996, -0.006042957305908203, -0.00583803653717041, -0.005633115768432617, -0.005428194999694824, -0.005223274230957031, -0.005018353462219238, -0.004813432693481445, -0.004608511924743652, -0.004403591156005859, -0.004198670387268066, -0.0039937496185302734, -0.0037888288497924805, -0.0035839080810546875, -0.0033789873123168945, -0.0031740665435791016, -0.0029691457748413086, -0.0027642250061035156, -0.0025593042373657227, -0.0023543834686279297, -0.0021494626998901367, -0.0019445419311523438, -0.0017396211624145508, -0.0015347003936767578, -0.0013297796249389648, -0.0011248588562011719, -0.0009199380874633789, -0.0007150173187255859, -0.000510096549987793, -0.00030517578125, -0.00010025501251220703, 0.00010466575622558594, 0.0003095865249633789, 0.0005145072937011719, 0.0007194280624389648, 0.0009243488311767578, 0.0011292695999145508, 0.0013341903686523438, 0.0015391111373901367, 0.0017440319061279297, 0.0019489526748657227, 0.0021538734436035156, 0.0023587942123413086, 0.0025637149810791016, 0.0027686357498168945, 0.0029735565185546875, 0.0031784772872924805, 0.0033833980560302734, 0.0035883188247680664, 0.0037932395935058594, 0.003998160362243652, 0.004203081130981445, 0.004408001899719238, 0.004612922668457031, 0.004817843437194824, 0.005022764205932617, 0.00522768497467041, 0.005432605743408203, 0.005637526512145996, 0.005842447280883789, 0.006047368049621582, 0.006252288818359375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 2.0, 7.0, 7.0, 9.0, 14.0, 18.0, 15.0, 24.0, 22.0, 22.0, 27.0, 26.0, 35.0, 27.0, 39.0, 25.0, 39.0, 50.0, 33.0, 50.0, 46.0, 53.0, 42.0, 49.0, 39.0, 30.0, 31.0, 25.0, 24.0, 17.0, 26.0, 13.0, 18.0, 16.0, 8.0, 11.0, 11.0, 7.0, 7.0, 3.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.003086090087890625, -0.002991616725921631, -0.0028971433639526367, -0.0028026700019836426, -0.0027081966400146484, -0.0026137232780456543, -0.00251924991607666, -0.002424776554107666, -0.002330303192138672, -0.0022358298301696777, -0.0021413564682006836, -0.0020468831062316895, -0.0019524097442626953, -0.0018579363822937012, -0.001763463020324707, -0.0016689896583557129, -0.0015745162963867188, -0.0014800429344177246, -0.0013855695724487305, -0.0012910962104797363, -0.0011966228485107422, -0.001102149486541748, -0.001007676124572754, -0.0009132027626037598, -0.0008187294006347656, -0.0007242560386657715, -0.0006297826766967773, -0.0005353093147277832, -0.00044083595275878906, -0.0003463625907897949, -0.0002518892288208008, -0.00015741586685180664, -6.29425048828125e-05, 3.153085708618164e-05, 0.00012600421905517578, 0.00022047758102416992, 0.00031495094299316406, 0.0004094243049621582, 0.0005038976669311523, 0.0005983710289001465, 0.0006928443908691406, 0.0007873177528381348, 0.0008817911148071289, 0.000976264476776123, 0.0010707378387451172, 0.0011652112007141113, 0.0012596845626831055, 0.0013541579246520996, 0.0014486312866210938, 0.0015431046485900879, 0.001637578010559082, 0.0017320513725280762, 0.0018265247344970703, 0.0019209980964660645, 0.0020154714584350586, 0.0021099448204040527, 0.002204418182373047, 0.002298891544342041, 0.002393364906311035, 0.0024878382682800293, 0.0025823116302490234, 0.0026767849922180176, 0.0027712583541870117, 0.002865731716156006, 0.002960205078125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 12.0, 16.0, 6.0, 23.0, 24.0, 46.0, 53.0, 62.0, 109.0, 157.0, 202.0, 302.0, 448.0, 649.0, 1051.0, 1586.0, 2500.0, 3769.0, 5866.0, 9335.0, 15184.0, 25315.0, 43026.0, 76624.0, 143393.0, 246883.0, 208672.0, 112260.0, 61158.0, 34548.0, 20819.0, 12561.0, 7703.0, 4875.0, 3069.0, 2081.0, 1370.0, 868.0, 564.0, 413.0, 270.0, 218.0, 155.0, 92.0, 64.0, 53.0, 29.0, 23.0, 13.0, 11.0, 12.0, 8.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006855010986328125, -0.0066394805908203125, -0.0064239501953125, -0.0062084197998046875, -0.005992889404296875, -0.0057773590087890625, -0.00556182861328125, -0.0053462982177734375, -0.005130767822265625, -0.0049152374267578125, -0.00469970703125, -0.0044841766357421875, -0.004268646240234375, -0.0040531158447265625, -0.00383758544921875, -0.0036220550537109375, -0.003406524658203125, -0.0031909942626953125, -0.0029754638671875, -0.0027599334716796875, -0.002544403076171875, -0.0023288726806640625, -0.00211334228515625, -0.0018978118896484375, -0.001682281494140625, -0.0014667510986328125, -0.001251220703125, -0.0010356903076171875, -0.000820159912109375, -0.0006046295166015625, -0.00038909912109375, -0.0001735687255859375, 4.1961669921875e-05, 0.0002574920654296875, 0.0004730224609375, 0.0006885528564453125, 0.000904083251953125, 0.0011196136474609375, 0.00133514404296875, 0.0015506744384765625, 0.001766204833984375, 0.0019817352294921875, 0.002197265625, 0.0024127960205078125, 0.002628326416015625, 0.0028438568115234375, 0.00305938720703125, 0.0032749176025390625, 0.003490447998046875, 0.0037059783935546875, 0.0039215087890625, 0.0041370391845703125, 0.004352569580078125, 0.0045680999755859375, 0.00478363037109375, 0.0049991607666015625, 0.005214691162109375, 0.0054302215576171875, 0.005645751953125, 0.0058612823486328125, 0.006076812744140625, 0.0062923431396484375, 0.00650787353515625, 0.0067234039306640625, 0.006938934326171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 7.0, 5.0, 7.0, 12.0, 13.0, 12.0, 14.0, 16.0, 15.0, 26.0, 23.0, 23.0, 24.0, 35.0, 33.0, 42.0, 35.0, 49.0, 42.0, 48.0, 40.0, 36.0, 44.0, 46.0, 50.0, 43.0, 31.0, 26.0, 22.0, 24.0, 28.0, 33.0, 22.0, 12.0, 9.0, 11.0, 10.0, 7.0, 8.0, 7.0, 3.0, 0.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017499923706054688, -0.0016845911741256714, -0.001619189977645874, -0.0015537887811660767, -0.0014883875846862793, -0.001422986388206482, -0.0013575851917266846, -0.0012921839952468872, -0.0012267827987670898, -0.0011613816022872925, -0.0010959804058074951, -0.0010305792093276978, -0.0009651780128479004, -0.000899776816368103, -0.0008343756198883057, -0.0007689744234085083, -0.0007035732269287109, -0.0006381720304489136, -0.0005727708339691162, -0.0005073696374893188, -0.0004419684410095215, -0.0003765672445297241, -0.00031116604804992676, -0.0002457648515701294, -0.00018036365509033203, -0.00011496245861053467, -4.9561262130737305e-05, 1.583993434906006e-05, 8.124113082885742e-05, 0.00014664232730865479, 0.00021204352378845215, 0.0002774447202682495, 0.0003428459167480469, 0.00040824711322784424, 0.0004736483097076416, 0.000539049506187439, 0.0006044507026672363, 0.0006698518991470337, 0.0007352530956268311, 0.0008006542921066284, 0.0008660554885864258, 0.0009314566850662231, 0.0009968578815460205, 0.0010622590780258179, 0.0011276602745056152, 0.0011930614709854126, 0.00125846266746521, 0.0013238638639450073, 0.0013892650604248047, 0.001454666256904602, 0.0015200674533843994, 0.0015854686498641968, 0.0016508698463439941, 0.0017162710428237915, 0.0017816722393035889, 0.0018470734357833862, 0.0019124746322631836, 0.001977875828742981, 0.0020432770252227783, 0.0021086782217025757, 0.002174079418182373, 0.0022394806146621704, 0.0023048818111419678, 0.002370283007621765, 0.0024356842041015625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 10.0, 10.0, 18.0, 24.0, 29.0, 34.0, 70.0, 98.0, 133.0, 185.0, 254.0, 373.0, 455.0, 611.0, 812.0, 1126.0, 1478.0, 2105.0, 2941.0, 4433.0, 7131.0, 13559.0, 40005.0, 308253.0, 565738.0, 57371.0, 16714.0, 8087.0, 4873.0, 3168.0, 2291.0, 1639.0, 1209.0, 863.0, 654.0, 542.0, 319.0, 255.0, 196.0, 141.0, 107.0, 74.0, 56.0, 36.0, 24.0, 22.0, 13.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012347102165222168, -0.0011962652206420898, -0.0011578202247619629, -0.001119375228881836, -0.001080930233001709, -0.001042485237121582, -0.001004040241241455, -0.0009655952453613281, -0.0009271502494812012, -0.0008887052536010742, -0.0008502602577209473, -0.0008118152618408203, -0.0007733702659606934, -0.0007349252700805664, -0.0006964802742004395, -0.0006580352783203125, -0.0006195902824401855, -0.0005811452865600586, -0.0005427002906799316, -0.0005042552947998047, -0.00046581029891967773, -0.0004273653030395508, -0.00038892030715942383, -0.0003504753112792969, -0.0003120303153991699, -0.00027358531951904297, -0.00023514032363891602, -0.00019669532775878906, -0.0001582503318786621, -0.00011980533599853516, -8.13603401184082e-05, -4.291534423828125e-05, -4.470348358154297e-06, 3.3974647521972656e-05, 7.241964340209961e-05, 0.00011086463928222656, 0.00014930963516235352, 0.00018775463104248047, 0.00022619962692260742, 0.0002646446228027344, 0.00030308961868286133, 0.0003415346145629883, 0.00037997961044311523, 0.0004184246063232422, 0.00045686960220336914, 0.0004953145980834961, 0.000533759593963623, 0.00057220458984375, 0.000610649585723877, 0.0006490945816040039, 0.0006875395774841309, 0.0007259845733642578, 0.0007644295692443848, 0.0008028745651245117, 0.0008413195610046387, 0.0008797645568847656, 0.0009182095527648926, 0.0009566545486450195, 0.0009950995445251465, 0.0010335445404052734, 0.0010719895362854004, 0.0011104345321655273, 0.0011488795280456543, 0.0011873245239257812]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 6.0, 0.0, 8.0, 0.0, 24.0, 0.0, 37.0, 0.0, 60.0, 0.0, 74.0, 0.0, 108.0, 0.0, 136.0, 0.0, 136.0, 0.0, 101.0, 0.0, 0.0, 102.0, 0.0, 75.0, 0.0, 49.0, 0.0, 32.0, 0.0, 21.0, 0.0, 13.0, 0.0, 12.0, 0.0, 6.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.055940270423889e-07, -7.767230272293091e-07, -7.478520274162292e-07, -7.189810276031494e-07, -6.901100277900696e-07, -6.612390279769897e-07, -6.323680281639099e-07, -6.034970283508301e-07, -5.746260285377502e-07, -5.457550287246704e-07, -5.168840289115906e-07, -4.880130290985107e-07, -4.591420292854309e-07, -4.302710294723511e-07, -4.0140002965927124e-07, -3.725290298461914e-07, -3.4365803003311157e-07, -3.1478703022003174e-07, -2.859160304069519e-07, -2.5704503059387207e-07, -2.2817403078079224e-07, -1.993030309677124e-07, -1.7043203115463257e-07, -1.4156103134155273e-07, -1.126900315284729e-07, -8.381903171539307e-08, -5.494803190231323e-08, -2.60770320892334e-08, 2.7939677238464355e-09, 3.166496753692627e-08, 6.05359673500061e-08, 8.940696716308594e-08, 1.1827796697616577e-07, 1.471489667892456e-07, 1.7601996660232544e-07, 2.0489096641540527e-07, 2.337619662284851e-07, 2.6263296604156494e-07, 2.915039658546448e-07, 3.203749656677246e-07, 3.4924596548080444e-07, 3.781169652938843e-07, 4.069879651069641e-07, 4.3585896492004395e-07, 4.647299647331238e-07, 4.936009645462036e-07, 5.224719643592834e-07, 5.513429641723633e-07, 5.802139639854431e-07, 6.09084963798523e-07, 6.379559636116028e-07, 6.668269634246826e-07, 6.956979632377625e-07, 7.245689630508423e-07, 7.534399628639221e-07, 7.82310962677002e-07, 8.111819624900818e-07, 8.400529623031616e-07, 8.689239621162415e-07, 8.977949619293213e-07, 9.266659617424011e-07, 9.55536961555481e-07, 9.844079613685608e-07, 1.0132789611816406e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 16.0, 31.0, 37.0, 26.0, 41.0, 73.0, 91.0, 109.0, 151.0, 172.0, 194.0, 311.0, 353.0, 497.0, 669.0, 891.0, 1231.0, 1686.0, 2447.0, 3624.0, 5980.0, 11909.0, 41921.0, 804767.0, 130792.0, 17820.0, 7856.0, 4510.0, 2887.0, 1956.0, 1394.0, 996.0, 769.0, 505.0, 418.0, 284.0, 242.0, 194.0, 151.0, 128.0, 99.0, 68.0, 66.0, 57.0, 31.0, 19.0, 10.0, 18.0, 12.0, 9.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0022525787353515625, -0.0021792352199554443, -0.002105891704559326, -0.002032548189163208, -0.00195920467376709, -0.0018858611583709717, -0.0018125176429748535, -0.0017391741275787354, -0.0016658306121826172, -0.001592487096786499, -0.0015191435813903809, -0.0014458000659942627, -0.0013724565505981445, -0.0012991130352020264, -0.0012257695198059082, -0.00115242600440979, -0.0010790824890136719, -0.0010057389736175537, -0.0009323954582214355, -0.0008590519428253174, -0.0007857084274291992, -0.0007123649120330811, -0.0006390213966369629, -0.0005656778812408447, -0.0004923343658447266, -0.0004189908504486084, -0.00034564733505249023, -0.00027230381965637207, -0.0001989603042602539, -0.00012561678886413574, -5.227327346801758e-05, 2.1070241928100586e-05, 9.441375732421875e-05, 0.00016775727272033691, 0.00024110078811645508, 0.00031444430351257324, 0.0003877878189086914, 0.00046113133430480957, 0.0005344748497009277, 0.0006078183650970459, 0.0006811618804931641, 0.0007545053958892822, 0.0008278489112854004, 0.0009011924266815186, 0.0009745359420776367, 0.0010478794574737549, 0.001121222972869873, 0.0011945664882659912, 0.0012679100036621094, 0.0013412535190582275, 0.0014145970344543457, 0.0014879405498504639, 0.001561284065246582, 0.0016346275806427002, 0.0017079710960388184, 0.0017813146114349365, 0.0018546581268310547, 0.0019280016422271729, 0.002001345157623291, 0.002074688673019409, 0.0021480321884155273, 0.0022213757038116455, 0.0022947192192077637, 0.002368062734603882, 0.00244140625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 5.0, 4.0, 13.0, 12.0, 22.0, 50.0, 174.0, 398.0, 175.0, 69.0, 13.0, 9.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007390975952148438, -0.0007182508707046509, -0.000697404146194458, -0.0006765574216842651, -0.0006557106971740723, -0.0006348639726638794, -0.0006140172481536865, -0.0005931705236434937, -0.0005723237991333008, -0.0005514770746231079, -0.000530630350112915, -0.0005097836256027222, -0.0004889369010925293, -0.0004680901765823364, -0.00044724345207214355, -0.0004263967275619507, -0.0004055500030517578, -0.00038470327854156494, -0.00036385655403137207, -0.0003430098295211792, -0.00032216310501098633, -0.00030131638050079346, -0.0002804696559906006, -0.0002596229314804077, -0.00023877620697021484, -0.00021792948246002197, -0.0001970827579498291, -0.00017623603343963623, -0.00015538930892944336, -0.0001345425844192505, -0.00011369585990905762, -9.284913539886475e-05, -7.200241088867188e-05, -5.1155686378479004e-05, -3.0308961868286133e-05, -9.462237358093262e-06, 1.138448715209961e-05, 3.223121166229248e-05, 5.307793617248535e-05, 7.392466068267822e-05, 9.47713851928711e-05, 0.00011561810970306396, 0.00013646483421325684, 0.0001573115587234497, 0.00017815828323364258, 0.00019900500774383545, 0.00021985173225402832, 0.0002406984567642212, 0.00026154518127441406, 0.00028239190578460693, 0.0003032386302947998, 0.0003240853548049927, 0.00034493207931518555, 0.0003657788038253784, 0.0003866255283355713, 0.00040747225284576416, 0.00042831897735595703, 0.0004491657018661499, 0.0004700124263763428, 0.0004908591508865356, 0.0005117058753967285, 0.0005325525999069214, 0.0005533993244171143, 0.0005742460489273071, 0.0005950927734375]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 1.0, 6.0, 1.0, 4.0, 5.0, 3.0, 11.0, 5.0, 8.0, 11.0, 16.0, 28.0, 28.0, 33.0, 62.0, 71.0, 80.0, 95.0, 112.0, 87.0, 63.0, 53.0, 40.0, 36.0, 33.0, 19.0, 26.0, 17.0, 6.0, 10.0, 5.0, 5.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036887770984321833, -0.003537248121574521, -0.003385719144716859, -0.0032341901678591967, -0.0030826611910015345, -0.0029311322141438723, -0.0027796030044555664, -0.002628074027597904, -0.002476545050740242, -0.00232501607388258, -0.0021734870970249176, -0.0020219581201672554, -0.0018704291433095932, -0.001718900166451931, -0.001567371073178947, -0.0014158420963212848, -0.0012643132358789444, -0.0011127842590212822, -0.00096125528216362, -0.0008097262470982969, -0.0006581972702406347, -0.0005066682933829725, -0.00035513925831764936, -0.00020361028145998716, -5.208130460232496e-05, 9.944768680725247e-05, 0.0002509766782168299, 0.00040250568417832255, 0.0005540346610359848, 0.000705563637893647, 0.0008570926729589701, 0.0010086216498166323, 0.0011601503938436508, 0.001311679370701313, 0.0014632083475589752, 0.0016147373244166374, 0.0017662663012742996, 0.0019177952781319618, 0.002069324254989624, 0.0022208532318472862, 0.0023723822087049484, 0.0025239111855626106, 0.002675440162420273, 0.002826969139277935, 0.0029784981161355972, 0.0031300270929932594, 0.0032815560698509216, 0.003433085046708584, 0.0035846142563968897, 0.003736143233254552, 0.003887672210112214, 0.00403920141980052, 0.004190730396658182, 0.004342259373515844, 0.0044937883503735065, 0.004645317327231169, 0.004796846304088831, 0.004948375280946493, 0.005099904257804155, 0.0052514332346618176, 0.00540296221151948, 0.005554491188377142, 0.005706020165234804, 0.005857549142092466, 0.0060090781189501286]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 14.0, 19.0, 16.0, 29.0, 32.0, 26.0, 37.0, 31.0, 39.0, 36.0, 34.0, 57.0, 46.0, 33.0, 46.0, 36.0, 39.0, 35.0, 27.0, 38.0, 28.0, 24.0, 22.0, 20.0, 29.0, 22.0, 13.0, 12.0, 9.0, 9.0, 12.0, 11.0, 6.0, 4.0, 8.0, 6.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002762011718004942, -0.0026647301856428385, -0.0025674488861113787, -0.002470167353749275, -0.0023728858213871717, -0.0022756042890250683, -0.0021783229894936085, -0.002081041457131505, -0.0019837599247694016, -0.00188647850882262, -0.0017891969764605165, -0.0016919155605137348, -0.0015946340281516314, -0.0014973526122048497, -0.001400071196258068, -0.0013027896638959646, -0.0012055083643645048, -0.0011082269484177232, -0.0010109454160556197, -0.0009136640001088381, -0.0008163825259543955, -0.000719101051799953, -0.0006218196358531713, -0.0005245381616987288, -0.00042725668754428625, -0.0003299752133898437, -0.0002326937683392316, -0.00013541232328861952, -3.813084913417697e-05, 5.915062502026558e-05, 0.00015643204096704721, 0.00025371351512148976, 0.00035099522210657597, 0.0004482766962610185, 0.0005455581704154611, 0.0006428395863622427, 0.0007401210605166852, 0.0008374025346711278, 0.0009346839506179094, 0.001031965482980013, 0.0011292468989267945, 0.0012265283148735762, 0.0013238098472356796, 0.0014210912631824613, 0.001518372679129243, 0.0016156542114913464, 0.001712935627438128, 0.0018102170433849096, 0.001907498575747013, 0.0020047801081091166, 0.0021020614076405764, 0.00219934294000268, 0.0022966244723647833, 0.0023939060047268867, 0.0024911873042583466, 0.00258846883662045, 0.0026857503689825535, 0.002783031901344657, 0.0028803132008761168, 0.00297759473323822, 0.0030748762656003237, 0.003172157797962427, 0.003269439097493887, 0.0033667206298559904, 0.0034640019293874502]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 7.0, 14.0, 22.0, 26.0, 54.0, 72.0, 107.0, 146.0, 266.0, 401.0, 586.0, 915.0, 1382.0, 2093.0, 3331.0, 5248.0, 8243.0, 13509.0, 23208.0, 41987.0, 86655.0, 219073.0, 805767.0, 1871148.0, 737537.0, 196787.0, 78059.0, 39327.0, 21981.0, 12967.0, 7875.0, 5086.0, 3358.0, 2161.0, 1430.0, 1031.0, 726.0, 479.0, 327.0, 249.0, 176.0, 118.0, 103.0, 67.0, 53.0, 36.0, 19.0, 22.0, 9.0, 17.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.005176544189453125, -0.00498807430267334, -0.004799604415893555, -0.0046111345291137695, -0.004422664642333984, -0.004234194755554199, -0.004045724868774414, -0.003857254981994629, -0.0036687850952148438, -0.0034803152084350586, -0.0032918453216552734, -0.0031033754348754883, -0.002914905548095703, -0.002726435661315918, -0.002537965774536133, -0.0023494958877563477, -0.0021610260009765625, -0.0019725561141967773, -0.0017840862274169922, -0.001595616340637207, -0.0014071464538574219, -0.0012186765670776367, -0.0010302066802978516, -0.0008417367935180664, -0.0006532669067382812, -0.0004647970199584961, -0.00027632713317871094, -8.785724639892578e-05, 0.00010061264038085938, 0.00028908252716064453, 0.0004775524139404297, 0.0006660223007202148, 0.0008544921875, 0.0010429620742797852, 0.0012314319610595703, 0.0014199018478393555, 0.0016083717346191406, 0.0017968416213989258, 0.001985311508178711, 0.002173781394958496, 0.0023622512817382812, 0.0025507211685180664, 0.0027391910552978516, 0.0029276609420776367, 0.003116130828857422, 0.003304600715637207, 0.003493070602416992, 0.0036815404891967773, 0.0038700103759765625, 0.004058480262756348, 0.004246950149536133, 0.004435420036315918, 0.004623889923095703, 0.004812359809875488, 0.0050008296966552734, 0.005189299583435059, 0.005377769470214844, 0.005566239356994629, 0.005754709243774414, 0.005943179130554199, 0.006131649017333984, 0.0063201189041137695, 0.006508588790893555, 0.00669705867767334, 0.006885528564453125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 4.0, 4.0, 13.0, 9.0, 11.0, 16.0, 18.0, 8.0, 21.0, 29.0, 22.0, 27.0, 29.0, 30.0, 45.0, 34.0, 46.0, 37.0, 59.0, 45.0, 40.0, 44.0, 51.0, 45.0, 38.0, 41.0, 26.0, 26.0, 26.0, 14.0, 27.0, 22.0, 16.0, 13.0, 6.0, 15.0, 10.0, 6.0, 7.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024242401123046875, -0.0023370087146759033, -0.002249777317047119, -0.002162545919418335, -0.0020753145217895508, -0.0019880831241607666, -0.0019008517265319824, -0.0018136203289031982, -0.001726388931274414, -0.0016391575336456299, -0.0015519261360168457, -0.0014646947383880615, -0.0013774633407592773, -0.0012902319431304932, -0.001203000545501709, -0.0011157691478729248, -0.0010285377502441406, -0.0009413063526153564, -0.0008540749549865723, -0.0007668435573577881, -0.0006796121597290039, -0.0005923807621002197, -0.0005051493644714355, -0.00041791796684265137, -0.0003306865692138672, -0.000243455171585083, -0.00015622377395629883, -6.899237632751465e-05, 1.823902130126953e-05, 0.00010547041893005371, 0.0001927018165588379, 0.00027993321418762207, 0.00036716461181640625, 0.00045439600944519043, 0.0005416274070739746, 0.0006288588047027588, 0.000716090202331543, 0.0008033215999603271, 0.0008905529975891113, 0.0009777843952178955, 0.0010650157928466797, 0.0011522471904754639, 0.001239478588104248, 0.0013267099857330322, 0.0014139413833618164, 0.0015011727809906006, 0.0015884041786193848, 0.001675635576248169, 0.0017628669738769531, 0.0018500983715057373, 0.0019373297691345215, 0.0020245611667633057, 0.00211179256439209, 0.002199023962020874, 0.002286255359649658, 0.0023734867572784424, 0.0024607181549072266, 0.0025479495525360107, 0.002635180950164795, 0.002722412347793579, 0.0028096437454223633, 0.0028968751430511475, 0.0029841065406799316, 0.003071337938308716, 0.0031585693359375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 4.0, 8.0, 14.0, 14.0, 18.0, 28.0, 68.0, 89.0, 107.0, 171.0, 242.0, 331.0, 491.0, 774.0, 1138.0, 1693.0, 2742.0, 4307.0, 6920.0, 11168.0, 19020.0, 33023.0, 60435.0, 117609.0, 252060.0, 653217.0, 1621303.0, 811980.0, 299426.0, 136183.0, 68324.0, 36971.0, 21087.0, 12466.0, 7512.0, 4667.0, 2887.0, 1997.0, 1289.0, 822.0, 548.0, 365.0, 254.0, 153.0, 119.0, 72.0, 56.0, 37.0, 22.0, 22.0, 12.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.00553131103515625, -0.005366683006286621, -0.005202054977416992, -0.005037426948547363, -0.004872798919677734, -0.0047081708908081055, -0.0045435428619384766, -0.004378914833068848, -0.004214286804199219, -0.00404965877532959, -0.003885030746459961, -0.003720402717590332, -0.003555774688720703, -0.0033911466598510742, -0.0032265186309814453, -0.0030618906021118164, -0.0028972625732421875, -0.0027326345443725586, -0.0025680065155029297, -0.0024033784866333008, -0.002238750457763672, -0.002074122428894043, -0.001909494400024414, -0.0017448663711547852, -0.0015802383422851562, -0.0014156103134155273, -0.0012509822845458984, -0.0010863542556762695, -0.0009217262268066406, -0.0007570981979370117, -0.0005924701690673828, -0.0004278421401977539, -0.000263214111328125, -9.85860824584961e-05, 6.604194641113281e-05, 0.00023066997528076172, 0.0003952980041503906, 0.0005599260330200195, 0.0007245540618896484, 0.0008891820907592773, 0.0010538101196289062, 0.0012184381484985352, 0.001383066177368164, 0.001547694206237793, 0.0017123222351074219, 0.0018769502639770508, 0.0020415782928466797, 0.0022062063217163086, 0.0023708343505859375, 0.0025354623794555664, 0.0027000904083251953, 0.0028647184371948242, 0.003029346466064453, 0.003193974494934082, 0.003358602523803711, 0.00352323055267334, 0.0036878585815429688, 0.0038524866104125977, 0.0040171146392822266, 0.0041817426681518555, 0.004346370697021484, 0.004510998725891113, 0.004675626754760742, 0.004840254783630371, 0.0050048828125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 20.0, 17.0, 28.0, 40.0, 37.0, 50.0, 73.0, 84.0, 128.0, 117.0, 168.0, 188.0, 230.0, 333.0, 403.0, 428.0, 356.0, 292.0, 226.0, 185.0, 112.0, 120.0, 84.0, 69.0, 64.0, 38.0, 40.0, 31.0, 19.0, 15.0, 12.0, 9.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017709732055664062, -0.00171583890914917, -0.0016607046127319336, -0.0016055703163146973, -0.001550436019897461, -0.0014953017234802246, -0.0014401674270629883, -0.001385033130645752, -0.0013298988342285156, -0.0012747645378112793, -0.001219630241394043, -0.0011644959449768066, -0.0011093616485595703, -0.001054227352142334, -0.0009990930557250977, -0.0009439587593078613, -0.000888824462890625, -0.0008336901664733887, -0.0007785558700561523, -0.000723421573638916, -0.0006682872772216797, -0.0006131529808044434, -0.000558018684387207, -0.0005028843879699707, -0.0004477500915527344, -0.00039261579513549805, -0.0003374814987182617, -0.0002823472023010254, -0.00022721290588378906, -0.00017207860946655273, -0.0001169443130493164, -6.181001663208008e-05, -6.67572021484375e-06, 4.845857620239258e-05, 0.0001035928726196289, 0.00015872716903686523, 0.00021386146545410156, 0.0002689957618713379, 0.0003241300582885742, 0.00037926435470581055, 0.0004343986511230469, 0.0004895329475402832, 0.0005446672439575195, 0.0005998015403747559, 0.0006549358367919922, 0.0007100701332092285, 0.0007652044296264648, 0.0008203387260437012, 0.0008754730224609375, 0.0009306073188781738, 0.0009857416152954102, 0.0010408759117126465, 0.0010960102081298828, 0.0011511445045471191, 0.0012062788009643555, 0.0012614130973815918, 0.0013165473937988281, 0.0013716816902160645, 0.0014268159866333008, 0.0014819502830505371, 0.0015370845794677734, 0.0015922188758850098, 0.001647353172302246, 0.0017024874687194824, 0.0017576217651367188]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 8.0, 8.0, 6.0, 10.0, 14.0, 21.0, 40.0, 29.0, 43.0, 65.0, 82.0, 93.0, 123.0, 108.0, 101.0, 68.0, 45.0, 32.0, 31.0, 14.0, 17.0, 14.0, 13.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005335601046681404, -0.005135165993124247, -0.004934730473905802, -0.004734295420348644, -0.004533859901130199, -0.004333424847573042, -0.004132989794015884, -0.00393255427479744, -0.003732119221240282, -0.003531683934852481, -0.0033312486484646797, -0.003130813594907522, -0.002930378308519721, -0.00272994302213192, -0.0025295079685747623, -0.002329072682186961, -0.00212863739579916, -0.0019282021094113588, -0.0017277669394388795, -0.0015273317694664001, -0.001326896483078599, -0.0011264611966907978, -0.0009260260267183185, -0.0007255908567458391, -0.000525155570358038, -0.0003247203421778977, -0.00012428511399775743, 7.615011418238282e-05, 0.0002765853423625231, 0.00047702062875032425, 0.0006774557987228036, 0.0008778909686952829, 0.001078326255083084, 0.0012787615414708853, 0.0014791967114433646, 0.001679631881415844, 0.0018800671678036451, 0.0020805024541914463, 0.002280937507748604, 0.002481372794136405, 0.002681808080524206, 0.0028822433669120073, 0.0030826786532998085, 0.003283113706856966, 0.003483548993244767, 0.0036839842796325684, 0.003884419333189726, 0.004084854386746883, 0.004285289905965328, 0.004485724959522486, 0.0046861604787409306, 0.004886595532298088, 0.005087031051516533, 0.00528746610507369, 0.005487901158630848, 0.005688336677849293, 0.00588877173140645, 0.006089206784963608, 0.006289642304182053, 0.00649007735773921, 0.006690512411296368, 0.0068909479305148125, 0.00709138298407197, 0.0072918180376291275, 0.007492253556847572]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 13.0, 14.0, 14.0, 12.0, 7.0, 15.0, 24.0, 20.0, 16.0, 30.0, 27.0, 29.0, 41.0, 35.0, 42.0, 36.0, 41.0, 49.0, 48.0, 37.0, 47.0, 28.0, 38.0, 39.0, 27.0, 31.0, 30.0, 23.0, 22.0, 23.0, 14.0, 20.0, 16.0, 14.0, 10.0, 17.0, 13.0, 3.0, 7.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002904309192672372, -0.0028063601348549128, -0.0027084110770374537, -0.0026104620192199945, -0.0025125129614025354, -0.0024145639035850763, -0.0023166146129369736, -0.0022186655551195145, -0.0021207164973020554, -0.0020227674394845963, -0.0019248183816671371, -0.001826869323849678, -0.001728920266032219, -0.0016309712082147598, -0.001533022033981979, -0.0014350729761645198, -0.0013371240347623825, -0.0012391749769449234, -0.0011412259191274643, -0.0010432768613100052, -0.0009453277452848852, -0.0008473786874674261, -0.000749429571442306, -0.0006514805136248469, -0.0005535314558073878, -0.0004555823979899287, -0.00035763331106863916, -0.0002596842241473496, -0.0001617351663298905, -6.378610851243138e-05, 3.416300751268864e-05, 0.00013211206533014774, 0.0002300608903169632, 0.0003280099481344223, 0.00042595903505571187, 0.0005239081219770014, 0.0006218571797944605, 0.0007198062376119196, 0.0008177553536370397, 0.0009157044114544988, 0.0010136534692719579, 0.001111602527089417, 0.001209551584906876, 0.001307500759139657, 0.0014054498169571161, 0.0015033988747745752, 0.0016013479325920343, 0.0016992969904094934, 0.0017972460482269526, 0.0018951951060444117, 0.0019931441638618708, 0.00209109322167933, 0.002189042279496789, 0.002286991337314248, 0.002384940627962351, 0.00248288968577981, 0.002580838743597269, 0.002678787801414728, 0.0027767368592321873, 0.0028746859170496464, 0.0029726349748671055, 0.0030705840326845646, 0.0031685330905020237, 0.003266482148319483, 0.003364431206136942]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 11.0, 8.0, 3.0, 11.0, 8.0, 23.0, 30.0, 59.0, 67.0, 103.0, 137.0, 202.0, 262.0, 383.0, 590.0, 783.0, 1172.0, 1787.0, 2675.0, 4201.0, 6873.0, 11074.0, 19080.0, 33616.0, 64800.0, 143071.0, 350956.0, 214949.0, 87171.0, 43502.0, 23775.0, 13724.0, 8358.0, 5125.0, 3298.0, 2106.0, 1457.0, 981.0, 614.0, 452.0, 319.0, 223.0, 147.0, 110.0, 69.0, 64.0, 53.0, 26.0, 20.0, 9.0, 15.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0], "bins": [-0.0013484954833984375, -0.001307263970375061, -0.0012660324573516846, -0.001224800944328308, -0.0011835694313049316, -0.0011423379182815552, -0.0011011064052581787, -0.0010598748922348022, -0.0010186433792114258, -0.0009774118661880493, -0.0009361803531646729, -0.0008949488401412964, -0.0008537173271179199, -0.0008124858140945435, -0.000771254301071167, -0.0007300227880477905, -0.0006887912750244141, -0.0006475597620010376, -0.0006063282489776611, -0.0005650967359542847, -0.0005238652229309082, -0.00048263370990753174, -0.0004414021968841553, -0.0004001706838607788, -0.00035893917083740234, -0.0003177076578140259, -0.0002764761447906494, -0.00023524463176727295, -0.00019401311874389648, -0.00015278160572052002, -0.00011155009269714355, -7.031857967376709e-05, -2.9087066650390625e-05, 1.214444637298584e-05, 5.3375959396362305e-05, 9.460747241973877e-05, 0.00013583898544311523, 0.0001770704984664917, 0.00021830201148986816, 0.00025953352451324463, 0.0003007650375366211, 0.00034199655055999756, 0.000383228063583374, 0.0004244595766067505, 0.00046569108963012695, 0.0005069226026535034, 0.0005481541156768799, 0.0005893856287002563, 0.0006306171417236328, 0.0006718486547470093, 0.0007130801677703857, 0.0007543116807937622, 0.0007955431938171387, 0.0008367747068405151, 0.0008780062198638916, 0.0009192377328872681, 0.0009604692459106445, 0.001001700758934021, 0.0010429322719573975, 0.001084163784980774, 0.0011253952980041504, 0.0011666268110275269, 0.0012078583240509033, 0.0012490898370742798, 0.0012903213500976562]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 7.0, 13.0, 7.0, 11.0, 9.0, 15.0, 14.0, 12.0, 17.0, 25.0, 17.0, 25.0, 26.0, 35.0, 36.0, 34.0, 37.0, 46.0, 44.0, 52.0, 35.0, 38.0, 45.0, 37.0, 45.0, 39.0, 34.0, 32.0, 24.0, 24.0, 19.0, 13.0, 22.0, 21.0, 14.0, 15.0, 16.0, 13.0, 10.0, 6.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0031280517578125, -0.0030224621295928955, -0.002916872501373291, -0.0028112828731536865, -0.002705693244934082, -0.0026001036167144775, -0.002494513988494873, -0.0023889243602752686, -0.002283334732055664, -0.0021777451038360596, -0.002072155475616455, -0.0019665658473968506, -0.001860976219177246, -0.0017553865909576416, -0.0016497969627380371, -0.0015442073345184326, -0.0014386177062988281, -0.0013330280780792236, -0.0012274384498596191, -0.0011218488216400146, -0.0010162591934204102, -0.0009106695652008057, -0.0008050799369812012, -0.0006994903087615967, -0.0005939006805419922, -0.0004883110523223877, -0.0003827214241027832, -0.0002771317958831787, -0.00017154216766357422, -6.595253944396973e-05, 3.9637088775634766e-05, 0.00014522671699523926, 0.00025081634521484375, 0.00035640597343444824, 0.00046199560165405273, 0.0005675852298736572, 0.0006731748580932617, 0.0007787644863128662, 0.0008843541145324707, 0.0009899437427520752, 0.0010955333709716797, 0.0012011229991912842, 0.0013067126274108887, 0.0014123022556304932, 0.0015178918838500977, 0.0016234815120697021, 0.0017290711402893066, 0.0018346607685089111, 0.0019402503967285156, 0.00204584002494812, 0.0021514296531677246, 0.002257019281387329, 0.0023626089096069336, 0.002468198537826538, 0.0025737881660461426, 0.002679377794265747, 0.0027849674224853516, 0.002890557050704956, 0.0029961466789245605, 0.003101736307144165, 0.0032073259353637695, 0.003312915563583374, 0.0034185051918029785, 0.003524094820022583, 0.0036296844482421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 9.0, 7.0, 17.0, 20.0, 24.0, 32.0, 41.0, 70.0, 121.0, 192.0, 403.0, 699.0, 1299.0, 2629.0, 5613.0, 13341.0, 37474.0, 172457.0, 653951.0, 111446.0, 28523.0, 10810.0, 4666.0, 2187.0, 1108.0, 583.0, 326.0, 176.0, 103.0, 57.0, 38.0, 34.0, 24.0, 11.0, 9.0, 18.0, 6.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002597808837890625, -0.002512305974960327, -0.0024268031120300293, -0.0023413002490997314, -0.0022557973861694336, -0.0021702945232391357, -0.002084791660308838, -0.00199928879737854, -0.0019137859344482422, -0.0018282830715179443, -0.0017427802085876465, -0.0016572773456573486, -0.0015717744827270508, -0.001486271619796753, -0.001400768756866455, -0.0013152658939361572, -0.0012297630310058594, -0.0011442601680755615, -0.0010587573051452637, -0.0009732544422149658, -0.000887751579284668, -0.0008022487163543701, -0.0007167458534240723, -0.0006312429904937744, -0.0005457401275634766, -0.0004602372646331787, -0.00037473440170288086, -0.000289231538772583, -0.00020372867584228516, -0.0001182258129119873, -3.272294998168945e-05, 5.27799129486084e-05, 0.00013828277587890625, 0.0002237856388092041, 0.00030928850173950195, 0.0003947913646697998, 0.00048029422760009766, 0.0005657970905303955, 0.0006512999534606934, 0.0007368028163909912, 0.0008223056793212891, 0.0009078085422515869, 0.0009933114051818848, 0.0010788142681121826, 0.0011643171310424805, 0.0012498199939727783, 0.0013353228569030762, 0.001420825719833374, 0.0015063285827636719, 0.0015918314456939697, 0.0016773343086242676, 0.0017628371715545654, 0.0018483400344848633, 0.0019338428974151611, 0.002019345760345459, 0.002104848623275757, 0.0021903514862060547, 0.0022758543491363525, 0.0023613572120666504, 0.0024468600749969482, 0.002532362937927246, 0.002617865800857544, 0.002703368663787842, 0.0027888715267181396, 0.0028743743896484375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 11.0, 4.0, 10.0, 7.0, 18.0, 10.0, 20.0, 26.0, 24.0, 31.0, 41.0, 53.0, 23.0, 27.0, 45.0, 33.0, 34.0, 53.0, 44.0, 36.0, 36.0, 36.0, 34.0, 41.0, 44.0, 28.0, 42.0, 36.0, 27.0, 22.0, 15.0, 17.0, 9.0, 14.0, 11.0, 6.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021305084228515625, -0.002063244581222534, -0.001995980739593506, -0.0019287168979644775, -0.0018614530563354492, -0.001794189214706421, -0.0017269253730773926, -0.0016596615314483643, -0.001592397689819336, -0.0015251338481903076, -0.0014578700065612793, -0.001390606164932251, -0.0013233423233032227, -0.0012560784816741943, -0.001188814640045166, -0.0011215507984161377, -0.0010542869567871094, -0.000987023115158081, -0.0009197592735290527, -0.0008524954319000244, -0.0007852315902709961, -0.0007179677486419678, -0.0006507039070129395, -0.0005834400653839111, -0.0005161762237548828, -0.0004489123821258545, -0.00038164854049682617, -0.00031438469886779785, -0.00024712085723876953, -0.0001798570156097412, -0.00011259317398071289, -4.532933235168457e-05, 2.193450927734375e-05, 8.919835090637207e-05, 0.0001564621925354004, 0.0002237260341644287, 0.00029098987579345703, 0.00035825371742248535, 0.00042551755905151367, 0.000492781400680542, 0.0005600452423095703, 0.0006273090839385986, 0.000694572925567627, 0.0007618367671966553, 0.0008291006088256836, 0.0008963644504547119, 0.0009636282920837402, 0.0010308921337127686, 0.0010981559753417969, 0.0011654198169708252, 0.0012326836585998535, 0.0012999475002288818, 0.0013672113418579102, 0.0014344751834869385, 0.0015017390251159668, 0.0015690028667449951, 0.0016362667083740234, 0.0017035305500030518, 0.00177079439163208, 0.0018380582332611084, 0.0019053220748901367, 0.001972585916519165, 0.0020398497581481934, 0.0021071135997772217, 0.00217437744140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 3.0, 2.0, 9.0, 12.0, 23.0, 21.0, 31.0, 37.0, 31.0, 43.0, 78.0, 73.0, 107.0, 126.0, 181.0, 234.0, 361.0, 492.0, 703.0, 1400.0, 3883.0, 15905.0, 206034.0, 783348.0, 25553.0, 5317.0, 1755.0, 811.0, 531.0, 371.0, 246.0, 174.0, 141.0, 115.0, 84.0, 64.0, 42.0, 37.0, 36.0, 24.0, 16.0, 16.0, 19.0, 18.0, 11.0, 5.0, 6.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-0.0007410049438476562, -0.0007186383008956909, -0.0006962716579437256, -0.0006739050149917603, -0.0006515383720397949, -0.0006291717290878296, -0.0006068050861358643, -0.0005844384431838989, -0.0005620718002319336, -0.0005397051572799683, -0.0005173385143280029, -0.0004949718713760376, -0.00047260522842407227, -0.00045023858547210693, -0.0004278719425201416, -0.00040550529956817627, -0.00038313865661621094, -0.0003607720136642456, -0.0003384053707122803, -0.00031603872776031494, -0.0002936720848083496, -0.0002713054418563843, -0.00024893879890441895, -0.0002265721559524536, -0.00020420551300048828, -0.00018183887004852295, -0.00015947222709655762, -0.00013710558414459229, -0.00011473894119262695, -9.237229824066162e-05, -7.000565528869629e-05, -4.763901233673096e-05, -2.5272369384765625e-05, -2.905726432800293e-06, 1.946091651916504e-05, 4.182755947113037e-05, 6.41942024230957e-05, 8.656084537506104e-05, 0.00010892748832702637, 0.0001312941312789917, 0.00015366077423095703, 0.00017602741718292236, 0.0001983940601348877, 0.00022076070308685303, 0.00024312734603881836, 0.0002654939889907837, 0.000287860631942749, 0.00031022727489471436, 0.0003325939178466797, 0.000354960560798645, 0.00037732720375061035, 0.0003996938467025757, 0.000422060489654541, 0.00044442713260650635, 0.0004667937755584717, 0.000489160418510437, 0.0005115270614624023, 0.0005338937044143677, 0.000556260347366333, 0.0005786269903182983, 0.0006009936332702637, 0.000623360276222229, 0.0006457269191741943, 0.0006680935621261597, 0.000690460205078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 9.0, 3.0, 2.0, 5.0, 8.0, 4.0, 11.0, 15.0, 12.0, 39.0, 44.0, 23.0, 73.0, 34.0, 79.0, 82.0, 39.0, 82.0, 68.0, 45.0, 82.0, 58.0, 16.0, 43.0, 17.0, 23.0, 20.0, 12.0, 24.0, 12.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.9420480132102966e-06, -2.8442591428756714e-06, -2.746470272541046e-06, -2.648681402206421e-06, -2.5508925318717957e-06, -2.4531036615371704e-06, -2.355314791202545e-06, -2.25752592086792e-06, -2.1597370505332947e-06, -2.0619481801986694e-06, -1.964159309864044e-06, -1.866370439529419e-06, -1.7685815691947937e-06, -1.6707926988601685e-06, -1.5730038285255432e-06, -1.475214958190918e-06, -1.3774260878562927e-06, -1.2796372175216675e-06, -1.1818483471870422e-06, -1.084059476852417e-06, -9.862706065177917e-07, -8.884817361831665e-07, -7.906928658485413e-07, -6.92903995513916e-07, -5.951151251792908e-07, -4.973262548446655e-07, -3.995373845100403e-07, -3.0174851417541504e-07, -2.039596438407898e-07, -1.0617077350616455e-07, -8.381903171539307e-09, 8.940696716308594e-08, 1.8719583749771118e-07, 2.849847078323364e-07, 3.8277357816696167e-07, 4.805624485015869e-07, 5.783513188362122e-07, 6.761401891708374e-07, 7.739290595054626e-07, 8.717179298400879e-07, 9.695068001747131e-07, 1.0672956705093384e-06, 1.1650845408439636e-06, 1.2628734111785889e-06, 1.3606622815132141e-06, 1.4584511518478394e-06, 1.5562400221824646e-06, 1.6540288925170898e-06, 1.751817762851715e-06, 1.8496066331863403e-06, 1.9473955035209656e-06, 2.045184373855591e-06, 2.142973244190216e-06, 2.2407621145248413e-06, 2.3385509848594666e-06, 2.436339855194092e-06, 2.534128725528717e-06, 2.6319175958633423e-06, 2.7297064661979675e-06, 2.8274953365325928e-06, 2.925284206867218e-06, 3.0230730772018433e-06, 3.1208619475364685e-06, 3.2186508178710938e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 4.0, 11.0, 6.0, 14.0, 30.0, 37.0, 48.0, 54.0, 90.0, 113.0, 178.0, 238.0, 326.0, 496.0, 815.0, 1377.0, 2928.0, 8026.0, 25410.0, 100287.0, 645088.0, 200403.0, 41512.0, 12092.0, 4251.0, 1786.0, 969.0, 614.0, 371.0, 288.0, 202.0, 147.0, 83.0, 73.0, 58.0, 37.0, 22.0, 14.0, 13.0, 11.0, 11.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006785392761230469, -0.0006584003567695618, -0.0006382614374160767, -0.0006181225180625916, -0.0005979835987091064, -0.0005778446793556213, -0.0005577057600021362, -0.0005375668406486511, -0.000517427921295166, -0.0004972890019416809, -0.0004771500825881958, -0.0004570111632347107, -0.0004368722438812256, -0.0004167333245277405, -0.00039659440517425537, -0.00037645548582077026, -0.00035631656646728516, -0.00033617764711380005, -0.00031603872776031494, -0.00029589980840682983, -0.0002757608890533447, -0.0002556219696998596, -0.0002354830503463745, -0.0002153441309928894, -0.0001952052116394043, -0.0001750662922859192, -0.00015492737293243408, -0.00013478845357894897, -0.00011464953422546387, -9.451061487197876e-05, -7.437169551849365e-05, -5.4232776165008545e-05, -3.409385681152344e-05, -1.395493745803833e-05, 6.183981895446777e-06, 2.6322901248931885e-05, 4.646182060241699e-05, 6.66007399559021e-05, 8.673965930938721e-05, 0.00010687857866287231, 0.00012701749801635742, 0.00014715641736984253, 0.00016729533672332764, 0.00018743425607681274, 0.00020757317543029785, 0.00022771209478378296, 0.00024785101413726807, 0.0002679899334907532, 0.0002881288528442383, 0.0003082677721977234, 0.0003284066915512085, 0.0003485456109046936, 0.0003686845302581787, 0.0003888234496116638, 0.0004089623689651489, 0.00042910128831863403, 0.00044924020767211914, 0.00046937912702560425, 0.0004895180463790894, 0.0005096569657325745, 0.0005297958850860596, 0.0005499348044395447, 0.0005700737237930298, 0.0005902126431465149, 0.0006103515625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 23.0, 67.0, 101.0, 205.0, 290.0, 133.0, 76.0, 49.0, 17.0, 5.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017535686492919922, -0.00016957707703113556, -0.0001637972891330719, -0.00015801750123500824, -0.00015223771333694458, -0.00014645792543888092, -0.00014067813754081726, -0.0001348983496427536, -0.00012911856174468994, -0.00012333877384662628, -0.00011755898594856262, -0.00011177919805049896, -0.0001059994101524353, -0.00010021962225437164, -9.443983435630798e-05, -8.866004645824432e-05, -8.288025856018066e-05, -7.7100470662117e-05, -7.132068276405334e-05, -6.554089486598969e-05, -5.9761106967926025e-05, -5.3981319069862366e-05, -4.8201531171798706e-05, -4.2421743273735046e-05, -3.664195537567139e-05, -3.086216747760773e-05, -2.5082379579544067e-05, -1.9302591681480408e-05, -1.3522803783416748e-05, -7.743015885353088e-06, -1.9632279872894287e-06, 3.816559910774231e-06, 9.59634780883789e-06, 1.537613570690155e-05, 2.115592360496521e-05, 2.693571150302887e-05, 3.271549940109253e-05, 3.849528729915619e-05, 4.427507519721985e-05, 5.005486309528351e-05, 5.583465099334717e-05, 6.161443889141083e-05, 6.739422678947449e-05, 7.317401468753815e-05, 7.89538025856018e-05, 8.473359048366547e-05, 9.051337838172913e-05, 9.629316627979279e-05, 0.00010207295417785645, 0.0001078527420759201, 0.00011363252997398376, 0.00011941231787204742, 0.00012519210577011108, 0.00013097189366817474, 0.0001367516815662384, 0.00014253146946430206, 0.00014831125736236572, 0.00015409104526042938, 0.00015987083315849304, 0.0001656506210565567, 0.00017143040895462036, 0.00017721019685268402, 0.00018298998475074768, 0.00018876977264881134, 0.000194549560546875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 8.0, 14.0, 35.0, 25.0, 29.0, 50.0, 63.0, 83.0, 95.0, 120.0, 105.0, 98.0, 70.0, 43.0, 31.0, 33.0, 15.0, 17.0, 12.0, 11.0, 12.0, 3.0, 1.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005497945472598076, -0.005298672243952751, -0.005099398549646139, -0.0049001253210008144, -0.004700851626694202, -0.004501578398048878, -0.004302304703742266, -0.004103031475096941, -0.003903757780790329, -0.0037044843193143606, -0.0035052108578383923, -0.003305937396362424, -0.0031066639348864555, -0.002907390706241131, -0.002708117011934519, -0.002508843783289194, -0.0023095703218132257, -0.0021102968603372574, -0.001911023398861289, -0.0017117499373853207, -0.0015124764759093523, -0.0013132031308487058, -0.0011139296693727374, -0.000914656207896769, -0.0007153827464208007, -0.0005161092849448323, -0.0003168358525726944, -0.00011756242020055652, 8.171104127541184e-05, 0.0002809844445437193, 0.00048025790601968765, 0.000679531367495656, 0.0008788048289716244, 0.0010780782904475927, 0.001277351751923561, 0.0014766252133995295, 0.0016758986748754978, 0.0018751720199361444, 0.0020744455978274345, 0.0022737188264727592, 0.0024729925207793713, 0.0026722659822553396, 0.002871539443731308, 0.0030708129052072763, 0.0032700863666832447, 0.0034693595953285694, 0.0036686332896351814, 0.003867906518280506, 0.004067179746925831, 0.0042664529755711555, 0.0044657266698777676, 0.004664999898523092, 0.004864273592829704, 0.005063546821475029, 0.005262820515781641, 0.005462093744426966, 0.005661367438733578, 0.0058606406673789024, 0.0060599143616855145, 0.006259187590330839, 0.006458461284637451, 0.006657734513282776, 0.006857008207589388, 0.007056281436234713, 0.007255555130541325]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 11.0, 10.0, 14.0, 11.0, 14.0, 8.0, 18.0, 22.0, 19.0, 16.0, 36.0, 21.0, 33.0, 37.0, 33.0, 42.0, 41.0, 46.0, 45.0, 47.0, 37.0, 48.0, 25.0, 46.0, 31.0, 26.0, 33.0, 32.0, 24.0, 22.0, 22.0, 13.0, 16.0, 18.0, 14.0, 12.0, 17.0, 10.0, 4.0, 7.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029267724603414536, -0.0028281693812459707, -0.002729566302150488, -0.002630963223055005, -0.0025323601439595222, -0.0024337570648640394, -0.0023351539857685566, -0.00223655067384243, -0.002137947827577591, -0.002039344748482108, -0.0019407416693866253, -0.0018421385902911425, -0.0017435355111956596, -0.0016449324321001768, -0.0015463292365893722, -0.0014477261574938893, -0.0013491229619830847, -0.0012505198828876019, -0.001151916803792119, -0.0010533137246966362, -0.0009547105873934925, -0.0008561075082980096, -0.0007575043709948659, -0.0006589012918993831, -0.0005602982128039002, -0.0004616951337084174, -0.00036309202550910413, -0.00026448891730979085, -0.00016588583821430802, -6.72827591188252e-05, 3.132037818431854e-05, 0.00012992345727980137, 0.0002285265363752842, 0.000327129615470767, 0.0004257327236700803, 0.0005243358318693936, 0.0006229389109648764, 0.0007215419900603592, 0.000820145127363503, 0.0009187482064589858, 0.0010173512855544686, 0.0011159543646499515, 0.0012145574437454343, 0.001313160639256239, 0.0014117637183517218, 0.0015103667974472046, 0.0016089698765426874, 0.0017075729556381702, 0.001806176034733653, 0.001904779113829136, 0.0020033821929246187, 0.0021019852720201015, 0.0022005883511155844, 0.002299191430211067, 0.0023977947421371937, 0.002496397588402033, 0.0025950009003281593, 0.002693603979423642, 0.002792207058519125, 0.002890810137614608, 0.0029894132167100906, 0.0030880162958055735, 0.0031866193749010563, 0.0032852226868271828, 0.003383825533092022]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 16.0, 20.0, 28.0, 39.0, 56.0, 77.0, 111.0, 151.0, 250.0, 329.0, 504.0, 655.0, 925.0, 1348.0, 1904.0, 2728.0, 3997.0, 6026.0, 9154.0, 13876.0, 21755.0, 35040.0, 58570.0, 99503.0, 164752.0, 214287.0, 160906.0, 97058.0, 57419.0, 34381.0, 21328.0, 13790.0, 8721.0, 5893.0, 3985.0, 2682.0, 1942.0, 1284.0, 918.0, 660.0, 416.0, 314.0, 237.0, 182.0, 116.0, 71.0, 53.0, 26.0, 24.0, 14.0, 10.0, 11.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.005603790283203125, -0.005425751209259033, -0.005247712135314941, -0.00506967306137085, -0.004891633987426758, -0.004713594913482666, -0.004535555839538574, -0.004357516765594482, -0.004179477691650391, -0.004001438617706299, -0.003823399543762207, -0.0036453604698181152, -0.0034673213958740234, -0.0032892823219299316, -0.00311124324798584, -0.002933204174041748, -0.0027551651000976562, -0.0025771260261535645, -0.0023990869522094727, -0.002221047878265381, -0.002043008804321289, -0.0018649697303771973, -0.0016869306564331055, -0.0015088915824890137, -0.0013308525085449219, -0.00115281343460083, -0.0009747743606567383, -0.0007967352867126465, -0.0006186962127685547, -0.0004406571388244629, -0.0002626180648803711, -8.45789909362793e-05, 9.34600830078125e-05, 0.0002714991569519043, 0.0004495382308959961, 0.0006275773048400879, 0.0008056163787841797, 0.0009836554527282715, 0.0011616945266723633, 0.001339733600616455, 0.0015177726745605469, 0.0016958117485046387, 0.0018738508224487305, 0.0020518898963928223, 0.002229928970336914, 0.002407968044281006, 0.0025860071182250977, 0.0027640461921691895, 0.0029420852661132812, 0.003120124340057373, 0.003298163414001465, 0.0034762024879455566, 0.0036542415618896484, 0.0038322806358337402, 0.004010319709777832, 0.004188358783721924, 0.004366397857666016, 0.004544436931610107, 0.004722476005554199, 0.004900515079498291, 0.005078554153442383, 0.005256593227386475, 0.005434632301330566, 0.005612671375274658, 0.00579071044921875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 6.0, 5.0, 9.0, 7.0, 8.0, 14.0, 12.0, 14.0, 20.0, 23.0, 18.0, 24.0, 34.0, 24.0, 37.0, 33.0, 42.0, 38.0, 43.0, 48.0, 41.0, 53.0, 42.0, 36.0, 42.0, 33.0, 26.0, 36.0, 24.0, 33.0, 20.0, 17.0, 17.0, 18.0, 15.0, 15.0, 12.0, 10.0, 14.0, 10.0, 10.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0029773712158203125, -0.0028819739818573, -0.002786576747894287, -0.0026911795139312744, -0.0025957822799682617, -0.002500385046005249, -0.0024049878120422363, -0.0023095905780792236, -0.002214193344116211, -0.0021187961101531982, -0.0020233988761901855, -0.0019280016422271729, -0.0018326044082641602, -0.0017372071743011475, -0.0016418099403381348, -0.001546412706375122, -0.0014510154724121094, -0.0013556182384490967, -0.001260221004486084, -0.0011648237705230713, -0.0010694265365600586, -0.0009740293025970459, -0.0008786320686340332, -0.0007832348346710205, -0.0006878376007080078, -0.0005924403667449951, -0.0004970431327819824, -0.0004016458988189697, -0.00030624866485595703, -0.00021085143089294434, -0.00011545419692993164, -2.0056962966918945e-05, 7.534027099609375e-05, 0.00017073750495910645, 0.00026613473892211914, 0.00036153197288513184, 0.00045692920684814453, 0.0005523264408111572, 0.0006477236747741699, 0.0007431209087371826, 0.0008385181427001953, 0.000933915376663208, 0.0010293126106262207, 0.0011247098445892334, 0.001220107078552246, 0.0013155043125152588, 0.0014109015464782715, 0.0015062987804412842, 0.0016016960144042969, 0.0016970932483673096, 0.0017924904823303223, 0.001887887716293335, 0.0019832849502563477, 0.0020786821842193604, 0.002174079418182373, 0.0022694766521453857, 0.0023648738861083984, 0.002460271120071411, 0.002555668354034424, 0.0026510655879974365, 0.0027464628219604492, 0.002841860055923462, 0.0029372572898864746, 0.0030326545238494873, 0.0031280517578125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 14.0, 19.0, 35.0, 54.0, 81.0, 96.0, 163.0, 228.0, 298.0, 486.0, 701.0, 981.0, 1485.0, 2117.0, 3000.0, 4390.0, 6456.0, 9569.0, 14590.0, 21876.0, 34407.0, 54877.0, 89237.0, 146910.0, 215329.0, 166051.0, 101173.0, 61762.0, 38495.0, 24360.0, 16054.0, 10571.0, 7107.0, 4804.0, 3312.0, 2323.0, 1611.0, 1117.0, 768.0, 515.0, 358.0, 244.0, 177.0, 117.0, 79.0, 51.0, 36.0, 33.0, 14.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0057830810546875, -0.0056002140045166016, -0.005417346954345703, -0.005234479904174805, -0.005051612854003906, -0.004868745803833008, -0.004685878753662109, -0.004503011703491211, -0.0043201446533203125, -0.004137277603149414, -0.003954410552978516, -0.003771543502807617, -0.0035886764526367188, -0.0034058094024658203, -0.003222942352294922, -0.0030400753021240234, -0.002857208251953125, -0.0026743412017822266, -0.002491474151611328, -0.0023086071014404297, -0.0021257400512695312, -0.0019428730010986328, -0.0017600059509277344, -0.001577138900756836, -0.0013942718505859375, -0.001211404800415039, -0.0010285377502441406, -0.0008456707000732422, -0.0006628036499023438, -0.0004799365997314453, -0.0002970695495605469, -0.00011420249938964844, 6.866455078125e-05, 0.00025153160095214844, 0.0004343986511230469, 0.0006172657012939453, 0.0008001327514648438, 0.0009829998016357422, 0.0011658668518066406, 0.001348733901977539, 0.0015316009521484375, 0.001714468002319336, 0.0018973350524902344, 0.002080202102661133, 0.0022630691528320312, 0.0024459362030029297, 0.002628803253173828, 0.0028116703033447266, 0.002994537353515625, 0.0031774044036865234, 0.003360271453857422, 0.0035431385040283203, 0.0037260055541992188, 0.003908872604370117, 0.004091739654541016, 0.004274606704711914, 0.0044574737548828125, 0.004640340805053711, 0.004823207855224609, 0.005006074905395508, 0.005188941955566406, 0.005371809005737305, 0.005554676055908203, 0.0057375431060791016, 0.00592041015625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 3.0, 2.0, 17.0, 15.0, 14.0, 15.0, 17.0, 16.0, 20.0, 27.0, 28.0, 24.0, 34.0, 33.0, 30.0, 43.0, 38.0, 46.0, 37.0, 46.0, 40.0, 46.0, 43.0, 34.0, 35.0, 32.0, 38.0, 27.0, 27.0, 28.0, 19.0, 17.0, 16.0, 15.0, 14.0, 9.0, 15.0, 8.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0020847320556640625, -0.002018958330154419, -0.0019531846046447754, -0.0018874108791351318, -0.0018216371536254883, -0.0017558634281158447, -0.0016900897026062012, -0.0016243159770965576, -0.001558542251586914, -0.0014927685260772705, -0.001426994800567627, -0.0013612210750579834, -0.0012954473495483398, -0.0012296736240386963, -0.0011638998985290527, -0.0010981261730194092, -0.0010323524475097656, -0.0009665787220001221, -0.0009008049964904785, -0.000835031270980835, -0.0007692575454711914, -0.0007034838199615479, -0.0006377100944519043, -0.0005719363689422607, -0.0005061626434326172, -0.00044038891792297363, -0.0003746151924133301, -0.0003088414669036865, -0.00024306774139404297, -0.00017729401588439941, -0.00011152029037475586, -4.5746564865112305e-05, 2.002716064453125e-05, 8.58008861541748e-05, 0.00015157461166381836, 0.00021734833717346191, 0.00028312206268310547, 0.000348895788192749, 0.0004146695137023926, 0.00048044323921203613, 0.0005462169647216797, 0.0006119906902313232, 0.0006777644157409668, 0.0007435381412506104, 0.0008093118667602539, 0.0008750855922698975, 0.000940859317779541, 0.0010066330432891846, 0.0010724067687988281, 0.0011381804943084717, 0.0012039542198181152, 0.0012697279453277588, 0.0013355016708374023, 0.001401275396347046, 0.0014670491218566895, 0.001532822847366333, 0.0015985965728759766, 0.0016643702983856201, 0.0017301440238952637, 0.0017959177494049072, 0.0018616914749145508, 0.0019274652004241943, 0.001993238925933838, 0.0020590126514434814, 0.002124786376953125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 12.0, 8.0, 19.0, 26.0, 34.0, 47.0, 56.0, 62.0, 102.0, 127.0, 198.0, 275.0, 416.0, 531.0, 841.0, 1545.0, 3236.0, 8316.0, 26606.0, 111031.0, 653158.0, 183969.0, 37941.0, 10939.0, 4079.0, 1879.0, 934.0, 665.0, 427.0, 296.0, 217.0, 139.0, 95.0, 86.0, 54.0, 44.0, 40.0, 25.0, 17.0, 16.0, 9.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00431060791015625, -0.004174351692199707, -0.004038095474243164, -0.003901839256286621, -0.003765583038330078, -0.003629326820373535, -0.003493070602416992, -0.0033568143844604492, -0.0032205581665039062, -0.0030843019485473633, -0.0029480457305908203, -0.0028117895126342773, -0.0026755332946777344, -0.0025392770767211914, -0.0024030208587646484, -0.0022667646408081055, -0.0021305084228515625, -0.0019942522048950195, -0.0018579959869384766, -0.0017217397689819336, -0.0015854835510253906, -0.0014492273330688477, -0.0013129711151123047, -0.0011767148971557617, -0.0010404586791992188, -0.0009042024612426758, -0.0007679462432861328, -0.0006316900253295898, -0.0004954338073730469, -0.0003591775894165039, -0.00022292137145996094, -8.666515350341797e-05, 4.9591064453125e-05, 0.00018584728240966797, 0.00032210350036621094, 0.0004583597183227539, 0.0005946159362792969, 0.0007308721542358398, 0.0008671283721923828, 0.0010033845901489258, 0.0011396408081054688, 0.0012758970260620117, 0.0014121532440185547, 0.0015484094619750977, 0.0016846656799316406, 0.0018209218978881836, 0.0019571781158447266, 0.0020934343338012695, 0.0022296905517578125, 0.0023659467697143555, 0.0025022029876708984, 0.0026384592056274414, 0.0027747154235839844, 0.0029109716415405273, 0.0030472278594970703, 0.0031834840774536133, 0.0033197402954101562, 0.0034559965133666992, 0.003592252731323242, 0.003728508949279785, 0.003864765167236328, 0.004001021385192871, 0.004137277603149414, 0.004273533821105957, 0.0044097900390625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 0.0, 8.0, 0.0, 14.0, 0.0, 14.0, 0.0, 36.0, 0.0, 31.0, 0.0, 37.0, 0.0, 64.0, 0.0, 74.0, 0.0, 102.0, 0.0, 98.0, 0.0, 109.0, 0.0, 93.0, 0.0, 79.0, 0.0, 68.0, 0.0, 54.0, 0.0, 32.0, 0.0, 34.0, 0.0, 19.0, 0.0, 15.0, 0.0, 15.0, 0.0, 7.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.834766387939453e-07, -9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 12.0, 9.0, 14.0, 24.0, 21.0, 32.0, 31.0, 50.0, 68.0, 87.0, 110.0, 146.0, 226.0, 270.0, 400.0, 533.0, 739.0, 1172.0, 1840.0, 2776.0, 4432.0, 7355.0, 12713.0, 24260.0, 51683.0, 146124.0, 502333.0, 172220.0, 57530.0, 26115.0, 13811.0, 7878.0, 4591.0, 2876.0, 1919.0, 1265.0, 813.0, 569.0, 397.0, 278.0, 190.0, 149.0, 120.0, 96.0, 83.0, 40.0, 45.0, 37.0, 24.0, 13.0, 15.0, 7.0, 5.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.002529144287109375, -0.002446383237838745, -0.0023636221885681152, -0.0022808611392974854, -0.0021981000900268555, -0.0021153390407562256, -0.0020325779914855957, -0.0019498169422149658, -0.001867055892944336, -0.001784294843673706, -0.0017015337944030762, -0.0016187727451324463, -0.0015360116958618164, -0.0014532506465911865, -0.0013704895973205566, -0.0012877285480499268, -0.0012049674987792969, -0.001122206449508667, -0.0010394454002380371, -0.0009566843509674072, -0.0008739233016967773, -0.0007911622524261475, -0.0007084012031555176, -0.0006256401538848877, -0.0005428791046142578, -0.00046011805534362793, -0.00037735700607299805, -0.00029459595680236816, -0.00021183490753173828, -0.0001290738582611084, -4.6312808990478516e-05, 3.644824028015137e-05, 0.00011920928955078125, 0.00020197033882141113, 0.000284731388092041, 0.0003674924373626709, 0.0004502534866333008, 0.0005330145359039307, 0.0006157755851745605, 0.0006985366344451904, 0.0007812976837158203, 0.0008640587329864502, 0.0009468197822570801, 0.00102958083152771, 0.0011123418807983398, 0.0011951029300689697, 0.0012778639793395996, 0.0013606250286102295, 0.0014433860778808594, 0.0015261471271514893, 0.0016089081764221191, 0.001691669225692749, 0.001774430274963379, 0.0018571913242340088, 0.0019399523735046387, 0.0020227134227752686, 0.0021054744720458984, 0.0021882355213165283, 0.002270996570587158, 0.002353757619857788, 0.002436518669128418, 0.002519279718399048, 0.0026020407676696777, 0.0026848018169403076, 0.0027675628662109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 12.0, 9.0, 15.0, 24.0, 30.0, 31.0, 39.0, 83.0, 93.0, 93.0, 102.0, 108.0, 83.0, 72.0, 54.0, 28.0, 30.0, 18.0, 12.0, 16.0, 12.0, 3.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005865097045898438, -0.0005658045411109924, -0.0005450993776321411, -0.0005243942141532898, -0.0005036890506744385, -0.00048298388719558716, -0.00046227872371673584, -0.0004415735602378845, -0.0004208683967590332, -0.0004001632332801819, -0.00037945806980133057, -0.00035875290632247925, -0.00033804774284362793, -0.0003173425793647766, -0.0002966374158859253, -0.000275932252407074, -0.00025522708892822266, -0.00023452192544937134, -0.00021381676197052002, -0.0001931115984916687, -0.00017240643501281738, -0.00015170127153396606, -0.00013099610805511475, -0.00011029094457626343, -8.958578109741211e-05, -6.888061761856079e-05, -4.817545413970947e-05, -2.7470290660858154e-05, -6.765127182006836e-06, 1.3940036296844482e-05, 3.46451997756958e-05, 5.535036325454712e-05, 7.605552673339844e-05, 9.676069021224976e-05, 0.00011746585369110107, 0.0001381710171699524, 0.0001588761806488037, 0.00017958134412765503, 0.00020028650760650635, 0.00022099167108535767, 0.00024169683456420898, 0.0002624019980430603, 0.0002831071615219116, 0.00030381232500076294, 0.00032451748847961426, 0.0003452226519584656, 0.0003659278154373169, 0.0003866329789161682, 0.00040733814239501953, 0.00042804330587387085, 0.00044874846935272217, 0.0004694536328315735, 0.0004901587963104248, 0.0005108639597892761, 0.0005315691232681274, 0.0005522742867469788, 0.0005729794502258301, 0.0005936846137046814, 0.0006143897771835327, 0.000635094940662384, 0.0006558001041412354, 0.0006765052676200867, 0.000697210431098938, 0.0007179155945777893, 0.0007386207580566406]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 7.0, 17.0, 13.0, 13.0, 29.0, 35.0, 41.0, 65.0, 68.0, 96.0, 104.0, 105.0, 101.0, 59.0, 51.0, 49.0, 42.0, 28.0, 16.0, 13.0, 13.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0064142560586333275, -0.00620603421702981, -0.00599781284108758, -0.005789590999484062, -0.005581369623541832, -0.0053731477819383144, -0.005164925940334797, -0.004956704564392567, -0.004748482722789049, -0.004540260881185532, -0.004332039505243301, -0.004123817663639784, -0.003915595822036266, -0.003707374446094036, -0.0034991526044905186, -0.0032909309957176447, -0.003082709386944771, -0.002874487778171897, -0.002666266169399023, -0.0024580443277955055, -0.0022498227190226316, -0.0020416011102497578, -0.001833379385061562, -0.0016251576598733664, -0.0014169360511004925, -0.0012087144423276186, -0.001000492717139423, -0.0007922710501588881, -0.0005840493831783533, -0.00037582777440547943, -0.00016760604921728373, 4.061567597091198e-05, 0.00024883681908249855, 0.00045705848606303334, 0.0006652801530435681, 0.0008735018200241029, 0.0010817234870046377, 0.0012899450957775116, 0.0014981668209657073, 0.001706388546153903, 0.0019146101549267769, 0.0021228317636996508, 0.0023310533724725246, 0.002539275214076042, 0.002747496822848916, 0.00295571843162179, 0.0031639402732253075, 0.0033721618819981813, 0.0035803834907710552, 0.003788605099543929, 0.003996826708316803, 0.0042050485499203205, 0.004413270391523838, 0.004621491767466068, 0.004829713609069586, 0.005037935450673103, 0.0052461568266153336, 0.005454378668218851, 0.005662600044161081, 0.005870821885764599, 0.006079043261706829, 0.006287265103310347, 0.006495486944913864, 0.006703708320856094, 0.006911930162459612]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 8.0, 7.0, 6.0, 7.0, 12.0, 11.0, 11.0, 15.0, 21.0, 23.0, 26.0, 40.0, 32.0, 32.0, 31.0, 38.0, 32.0, 49.0, 47.0, 48.0, 52.0, 44.0, 48.0, 41.0, 37.0, 41.0, 30.0, 27.0, 24.0, 20.0, 18.0, 20.0, 22.0, 16.0, 12.0, 14.0, 6.0, 12.0, 9.0, 2.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003445139154791832, -0.0033185624051839113, -0.0031919858884066343, -0.0030654091387987137, -0.002938832389190793, -0.0028122556395828724, -0.0026856791228055954, -0.0025591023731976748, -0.002432525623589754, -0.0023059488739818335, -0.0021793723572045565, -0.002052795607596636, -0.0019262188579887152, -0.0017996422247961164, -0.0016730655916035175, -0.0015464888419955969, -0.00141991232521832, -0.001293335692025721, -0.0011667589424178004, -0.0010401823092252016, -0.0009136056178249419, -0.0007870289264246821, -0.0006604522932320833, -0.0005338756018318236, -0.00040729891043156385, -0.0002807222190313041, -0.00015414555673487484, -2.7568894438445568e-05, 9.900779696181417e-05, 0.0002255844883620739, 0.0003521611215546727, 0.00047873781295493245, 0.0006053145043551922, 0.0007318911957554519, 0.0008584678871557117, 0.0009850445203483105, 0.0011116212699562311, 0.00123819790314883, 0.0013647745363414288, 0.0014913512859493494, 0.0016179279191419482, 0.001744504552334547, 0.0018710813019424677, 0.0019976580515503883, 0.0021242345683276653, 0.002250811317935586, 0.0023773880675435066, 0.0025039645843207836, 0.0026305413339287043, 0.002757118083536625, 0.002883694600313902, 0.0030102713499218225, 0.003136848099529743, 0.00326342461630702, 0.003390001365914941, 0.0035165781155228615, 0.0036431546323001385, 0.003769731381908059, 0.003896307898685336, 0.004022884648293257, 0.004149461165070534, 0.004276038147509098, 0.004402614664286375, 0.004529191181063652, 0.004655768163502216]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 9.0, 14.0, 10.0, 16.0, 11.0, 25.0, 21.0, 23.0, 33.0, 27.0, 57.0, 55.0, 60.0, 70.0, 73.0, 113.0, 151.0, 348.0, 1140.0, 3803.0, 515640.0, 1322.0, 422.0, 177.0, 105.0, 74.0, 75.0, 61.0, 44.0, 48.0, 51.0, 37.0, 25.0, 22.0, 19.0, 16.0, 18.0, 11.0, 7.0, 8.0, 6.0, 8.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08651912957429886, -0.08382194489240646, -0.08112476021051407, -0.07842757552862167, -0.07573039084672928, -0.07303320616483688, -0.07033602893352509, -0.06763884425163269, -0.0649416595697403, -0.0622444748878479, -0.059547290205955505, -0.05685010552406311, -0.054152920842170715, -0.05145573616027832, -0.048758555203676224, -0.04606137052178383, -0.043364182114601135, -0.04066699743270874, -0.037969812750816345, -0.03527262806892395, -0.032575443387031555, -0.02987826056778431, -0.027181077748537064, -0.02448389306664467, -0.021786708384752274, -0.01908952370285988, -0.016392339020967484, -0.013695156201720238, -0.010997971519827843, -0.008300786837935448, -0.005603604018688202, -0.002906419336795807, -0.00020923465490341187, 0.002487949561327696, 0.0051851337775588036, 0.007882317528128624, 0.010579502210021019, 0.013276686891913414, 0.01597386971116066, 0.018671054393053055, 0.02136823907494545, 0.024065423756837845, 0.02676260843873024, 0.029459791257977486, 0.03215697407722473, 0.034854158759117126, 0.03755134344100952, 0.040248528122901917, 0.04294571280479431, 0.04564289748668671, 0.0483400821685791, 0.0510372668504715, 0.05373445153236389, 0.05643163621425629, 0.05912881717085838, 0.06182600185275078, 0.06452319025993347, 0.06722037494182587, 0.06991755962371826, 0.07261474430561066, 0.07531192898750305, 0.07800911366939545, 0.08070629835128784, 0.08340348303318024, 0.08610066026449203]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 8.0, 7.0, 15.0, 9.0, 18.0, 18.0, 23.0, 29.0, 29.0, 42.0, 34.0, 22.0, 39.0, 37.0, 47.0, 45.0, 42.0, 1073.0, 58.0, 44.0, 44.0, 37.0, 35.0, 33.0, 30.0, 31.0, 21.0, 17.0, 23.0, 14.0, 15.0, 15.0, 13.0, 10.0, 7.0, 9.0, 5.0, 1.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09995340555906296, -0.09629634022712708, -0.0926392674446106, -0.08898220211267471, -0.08532513678073883, -0.08166806399822235, -0.07801099866628647, -0.07435393333435059, -0.0706968605518341, -0.06703979521989822, -0.06338272243738174, -0.05972565710544586, -0.05606858804821968, -0.0524115189909935, -0.04875445365905762, -0.045097384601831436, -0.041440315544605255, -0.037783246487379074, -0.03412617743015289, -0.03046911209821701, -0.02681204304099083, -0.02315497398376465, -0.019497906789183617, -0.015840839594602585, -0.012183770537376404, -0.008526702411472797, -0.004869634285569191, -0.0012125661596655846, 0.002444501966238022, 0.006101571023464203, 0.009758638218045235, 0.013415705412626266, 0.017072781920433044, 0.020729850977659225, 0.024386918172240257, 0.02804398536682129, 0.03170105442404747, 0.03535812348127365, 0.039015188813209534, 0.042672257870435715, 0.046329326927661896, 0.04998639598488808, 0.05364346504211426, 0.05730053037405014, 0.06095759943127632, 0.0646146684885025, 0.06827173382043839, 0.07192879915237427, 0.07558587193489075, 0.07924293726682663, 0.08290001004934311, 0.08655707538127899, 0.09021414816379547, 0.09387121349573135, 0.09752827882766724, 0.10118535161018372, 0.1048424169421196, 0.10849948227405548, 0.11215655505657196, 0.11581362038850784, 0.11947068572044373, 0.1231277585029602, 0.12678483128547668, 0.13044188916683197, 0.13409896194934845]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 3.0, 6.0, 8.0, 5.0, 12.0, 13.0, 11.0, 19.0, 35.0, 39.0, 51.0, 80.0, 126.0, 218.0, 341.0, 419.0, 565.0, 774.0, 911.0, 1082.0, 1441.0, 2445.0, 2573.0, 31199214.0, 19487.0, 21513.0, 1813.0, 255.0, 228.0, 546.0, 58.0, 46.0, 41.0, 34.0, 28.0, 15.0, 9.0, 5.0, 5.0, 3.0, 1.0], "bins": [-21232.0, -20778.1875, -20324.375, -19870.5625, -19416.75, -18962.9375, -18509.125, -18055.3125, -17601.5, -17147.6875, -16693.875, -16240.0625, -15786.25, -15332.4375, -14878.625, -14424.8125, -13971.0, -13517.1875, -13063.375, -12609.5625, -12155.75, -11701.9375, -11248.125, -10794.3125, -10340.5, -9886.6875, -9432.875, -8979.0625, -8525.25, -8071.4375, -7617.625, -7163.8125, -6710.0, -6256.1875, -5802.375, -5348.5625, -4894.75, -4440.9375, -3987.125, -3533.3125, -3079.5, -2625.6875, -2171.875, -1718.0625, -1264.25, -810.4375, -356.625, 97.1875, 551.0, 1004.8125, 1458.625, 1912.4375, 2366.25, 2820.0625, 3273.875, 3727.6875, 4181.5, 4635.3125, 5089.125, 5542.9375, 5996.75, 6450.5625, 6904.375, 7358.1875, 7812.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 11.0, 17.0, 38.0, 56.0, 73.0, 95.0, 141.0, 224.0, 359.0, 573.0, 902.0, 1405.0, 2250.0, 3410.0, 5437.0, 8812.0, 14278.0, 23575.0, 40810.0, 68910.0, 122204.0, 231381.0, 573084.0, 3884417.0, 729828.0, 259875.0, 133051.0, 75141.0, 43483.0, 25799.0, 16030.0, 9810.0, 5945.0, 3601.0, 2243.0, 1499.0, 945.0, 586.0, 379.0, 250.0, 167.0, 103.0, 69.0, 61.0, 40.0, 16.0, 13.0, 12.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-117.0625, -113.2333984375, -109.404296875, -105.5751953125, -101.74609375, -97.9169921875, -94.087890625, -90.2587890625, -86.4296875, -82.6005859375, -78.771484375, -74.9423828125, -71.11328125, -67.2841796875, -63.455078125, -59.6259765625, -55.796875, -51.9677734375, -48.138671875, -44.3095703125, -40.48046875, -36.6513671875, -32.822265625, -28.9931640625, -25.1640625, -21.3349609375, -17.505859375, -13.6767578125, -9.84765625, -6.0185546875, -2.189453125, 1.6396484375, 5.46875, 9.2978515625, 13.126953125, 16.9560546875, 20.78515625, 24.6142578125, 28.443359375, 32.2724609375, 36.1015625, 39.9306640625, 43.759765625, 47.5888671875, 51.41796875, 55.2470703125, 59.076171875, 62.9052734375, 66.734375, 70.5634765625, 74.392578125, 78.2216796875, 82.05078125, 85.8798828125, 89.708984375, 93.5380859375, 97.3671875, 101.1962890625, 105.025390625, 108.8544921875, 112.68359375, 116.5126953125, 120.341796875, 124.1708984375, 128.0]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 6.0, 8.0, 7.0, 7.0, 10.0, 12.0, 15.0, 13.0, 16.0, 24.0, 29.0, 38.0, 64.0, 76.0, 119.0, 192.0, 347.0, 556.0, 86.0, 63.0, 50.0, 40.0, 34.0, 27.0, 22.0, 22.0, 24.0, 18.0, 13.0, 13.0, 17.0, 10.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-235.375, -228.72265625, -222.0703125, -215.41796875, -208.765625, -202.11328125, -195.4609375, -188.80859375, -182.15625, -175.50390625, -168.8515625, -162.19921875, -155.546875, -148.89453125, -142.2421875, -135.58984375, -128.9375, -122.28515625, -115.6328125, -108.98046875, -102.328125, -95.67578125, -89.0234375, -82.37109375, -75.71875, -69.06640625, -62.4140625, -55.76171875, -49.109375, -42.45703125, -35.8046875, -29.15234375, -22.5, -15.84765625, -9.1953125, -2.54296875, 4.109375, 10.76171875, 17.4140625, 24.06640625, 30.71875, 37.37109375, 44.0234375, 50.67578125, 57.328125, 63.98046875, 70.6328125, 77.28515625, 83.9375, 90.58984375, 97.2421875, 103.89453125, 110.546875, 117.19921875, 123.8515625, 130.50390625, 137.15625, 143.80859375, 150.4609375, 157.11328125, 163.765625, 170.41796875, 177.0703125, 183.72265625, 190.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 0.0, 6.0, 4.0, 14.0, 9.0, 23.0, 34.0, 26.0, 45.0, 68.0, 82.0, 114.0, 210.0, 254.0, 313.0, 545.0, 781.0, 1195.0, 1771.0, 2653.0, 4667.0, 7440.0, 13170.0, 25264.0, 56603.0, 151797.0, 897629.0, 4732145.0, 243519.0, 77212.0, 33418.0, 16467.0, 9105.0, 5178.0, 3165.0, 2066.0, 1401.0, 899.0, 626.0, 449.0, 279.0, 220.0, 147.0, 132.0, 75.0, 57.0, 41.0, 39.0, 27.0, 21.0, 9.0, 9.0, 0.0, 6.0, 9.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-260.25, -251.90234375, -243.5546875, -235.20703125, -226.859375, -218.51171875, -210.1640625, -201.81640625, -193.46875, -185.12109375, -176.7734375, -168.42578125, -160.078125, -151.73046875, -143.3828125, -135.03515625, -126.6875, -118.33984375, -109.9921875, -101.64453125, -93.296875, -84.94921875, -76.6015625, -68.25390625, -59.90625, -51.55859375, -43.2109375, -34.86328125, -26.515625, -18.16796875, -9.8203125, -1.47265625, 6.875, 15.22265625, 23.5703125, 31.91796875, 40.265625, 48.61328125, 56.9609375, 65.30859375, 73.65625, 82.00390625, 90.3515625, 98.69921875, 107.046875, 115.39453125, 123.7421875, 132.08984375, 140.4375, 148.78515625, 157.1328125, 165.48046875, 173.828125, 182.17578125, 190.5234375, 198.87109375, 207.21875, 215.56640625, 223.9140625, 232.26171875, 240.609375, 248.95703125, 257.3046875, 265.65234375, 274.0]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 1.0, 5.0, 3.0, 5.0, 10.0, 9.0, 15.0, 21.0, 20.0, 26.0, 44.0, 69.0, 126.0, 184.0, 464.0, 577.0, 111.0, 57.0, 56.0, 42.0, 29.0, 21.0, 26.0, 16.0, 13.0, 9.0, 8.0, 6.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-369.25, -357.41015625, -345.5703125, -333.73046875, -321.890625, -310.05078125, -298.2109375, -286.37109375, -274.53125, -262.69140625, -250.8515625, -239.01171875, -227.171875, -215.33203125, -203.4921875, -191.65234375, -179.8125, -167.97265625, -156.1328125, -144.29296875, -132.453125, -120.61328125, -108.7734375, -96.93359375, -85.09375, -73.25390625, -61.4140625, -49.57421875, -37.734375, -25.89453125, -14.0546875, -2.21484375, 9.625, 21.46484375, 33.3046875, 45.14453125, 56.984375, 68.82421875, 80.6640625, 92.50390625, 104.34375, 116.18359375, 128.0234375, 139.86328125, 151.703125, 163.54296875, 175.3828125, 187.22265625, 199.0625, 210.90234375, 222.7421875, 234.58203125, 246.421875, 258.26171875, 270.1015625, 281.94140625, 293.78125, 305.62109375, 317.4609375, 329.30078125, 341.140625, 352.98046875, 364.8203125, 376.66015625, 388.5]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [9.0, 0.0, 2.0, 4.0, 12.0, 6.0, 0.0, 9.0, 5.0, 10.0, 8.0, 35.0, 38.0, 44.0, 25.0, 76.0, 52.0, 50.0, 104.0, 143.0, 161.0, 240.0, 372.0, 486.0, 758.0, 1135.0, 1954.0, 3409.0, 7142.0, 18364.0, 90722.0, 6096800.0, 43651.0, 12555.0, 5493.0, 2799.0, 1455.0, 1001.0, 582.0, 419.0, 321.0, 226.0, 188.0, 121.0, 96.0, 77.0, 70.0, 49.0, 49.0, 38.0, 10.0, 10.0, 11.0, 3.0, 17.0, 1.0, 6.0, 5.0, 19.0, 0.0, 0.0, 6.0, 0.0, 3.0], "bins": [-2332.0, -2257.5625, -2183.125, -2108.6875, -2034.25, -1959.8125, -1885.375, -1810.9375, -1736.5, -1662.0625, -1587.625, -1513.1875, -1438.75, -1364.3125, -1289.875, -1215.4375, -1141.0, -1066.5625, -992.125, -917.6875, -843.25, -768.8125, -694.375, -619.9375, -545.5, -471.0625, -396.625, -322.1875, -247.75, -173.3125, -98.875, -24.4375, 50.0, 124.4375, 198.875, 273.3125, 347.75, 422.1875, 496.625, 571.0625, 645.5, 719.9375, 794.375, 868.8125, 943.25, 1017.6875, 1092.125, 1166.5625, 1241.0, 1315.4375, 1389.875, 1464.3125, 1538.75, 1613.1875, 1687.625, 1762.0625, 1836.5, 1910.9375, 1985.375, 2059.8125, 2134.25, 2208.6875, 2283.125, 2357.5625, 2432.0]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 10.0, 15.0, 10.0, 13.0, 17.0, 19.0, 25.0, 32.0, 60.0, 125.0, 291.0, 943.0, 157.0, 72.0, 42.0, 32.0, 21.0, 14.0, 15.0, 17.0, 11.0, 10.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-772.0, -747.5546875, -723.109375, -698.6640625, -674.21875, -649.7734375, -625.328125, -600.8828125, -576.4375, -551.9921875, -527.546875, -503.1015625, -478.65625, -454.2109375, -429.765625, -405.3203125, -380.875, -356.4296875, -331.984375, -307.5390625, -283.09375, -258.6484375, -234.203125, -209.7578125, -185.3125, -160.8671875, -136.421875, -111.9765625, -87.53125, -63.0859375, -38.640625, -14.1953125, 10.25, 34.6953125, 59.140625, 83.5859375, 108.03125, 132.4765625, 156.921875, 181.3671875, 205.8125, 230.2578125, 254.703125, 279.1484375, 303.59375, 328.0390625, 352.484375, 376.9296875, 401.375, 425.8203125, 450.265625, 474.7109375, 499.15625, 523.6015625, 548.046875, 572.4921875, 596.9375, 621.3828125, 645.828125, 670.2734375, 694.71875, 719.1640625, 743.609375, 768.0546875, 792.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 7.0, 14.0, 19.0, 35.0, 656.0, 240.0, 18.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-14771.30078125, -14502.5732421875, -14233.845703125, -13965.1181640625, -13696.390625, -13427.6630859375, -13158.935546875, -12890.20703125, -12621.48046875, -12352.7529296875, -12084.025390625, -11815.2978515625, -11546.5703125, -11277.8427734375, -11009.115234375, -10740.38671875, -10471.6591796875, -10202.931640625, -9934.2041015625, -9665.4765625, -9396.7490234375, -9128.021484375, -8859.2939453125, -8590.56640625, -8321.837890625, -8053.1103515625, -7784.3828125, -7515.6552734375, -7246.927734375, -6978.2001953125, -6709.47216796875, -6440.74462890625, -6172.017578125, -5903.2900390625, -5634.5625, -5365.8349609375, -5097.107421875, -4828.3798828125, -4559.65185546875, -4290.92431640625, -4022.197021484375, -3753.469482421875, -3484.74169921875, -3216.01416015625, -2947.28662109375, -2678.55908203125, -2409.83154296875, -2141.103759765625, -1872.376220703125, -1603.648681640625, -1334.9210205078125, -1066.193359375, -797.4658203125, -528.73828125, -260.0106201171875, 8.717041015625, 277.444580078125, 546.1721801757812, 814.8997802734375, 1083.62744140625, 1352.35498046875, 1621.08251953125, 1889.8101806640625, 2158.537841796875, 2427.265380859375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 9.0, 9.0, 13.0, 18.0, 23.0, 36.0, 759.0, 32.0, 18.0, 19.0, 13.0, 11.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5487.4111328125, -5358.158203125, -5228.9052734375, -5099.65234375, -4970.3994140625, -4841.146484375, -4711.8935546875, -4582.640625, -4453.3876953125, -4324.134765625, -4194.8818359375, -4065.62890625, -3936.3759765625, -3807.123046875, -3677.870361328125, -3548.617431640625, -3419.36474609375, -3290.11181640625, -3160.85888671875, -3031.60595703125, -2902.35302734375, -2773.10009765625, -2643.847412109375, -2514.594482421875, -2385.341552734375, -2256.088623046875, -2126.835693359375, -1997.5828857421875, -1868.3299560546875, -1739.0770263671875, -1609.82421875, -1480.5712890625, -1351.318359375, -1222.0654296875, -1092.8125, -963.5596923828125, -834.3067626953125, -705.0538330078125, -575.8009643554688, -446.548095703125, -317.295166015625, -188.04226684570312, -58.78936767578125, 70.46353149414062, 199.7164306640625, 328.9693603515625, 458.22222900390625, 587.47509765625, 716.72802734375, 845.98095703125, 975.2338256835938, 1104.4866943359375, 1233.7396240234375, 1362.9925537109375, 1492.245361328125, 1621.498291015625, 1750.751220703125, 1880.004150390625, 2009.257080078125, 2138.510009765625, 2267.7626953125, 2397.015625, 2526.2685546875, 2655.521484375, 2784.7744140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 17.0, 17.0, 15.0, 24.0, 37.0, 41.0, 69.0, 107.0, 130.0, 188.0, 259.0, 355.0, 534.0, 745.0, 1228.0, 2434.0, 5570.0, 17802.0, 127353.0, 3825317.0, 177984.0, 20937.0, 6863.0, 2857.0, 1398.0, 691.0, 389.0, 229.0, 160.0, 93.0, 89.0, 75.0, 58.0, 44.0, 42.0, 30.0, 25.0, 10.0, 13.0, 12.0, 11.0, 9.0, 8.0, 9.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.859375, -23.989013671875, -23.11865234375, -22.248291015625, -21.3779296875, -20.507568359375, -19.63720703125, -18.766845703125, -17.896484375, -17.026123046875, -16.15576171875, -15.285400390625, -14.4150390625, -13.544677734375, -12.67431640625, -11.803955078125, -10.93359375, -10.063232421875, -9.19287109375, -8.322509765625, -7.4521484375, -6.581787109375, -5.71142578125, -4.841064453125, -3.970703125, -3.100341796875, -2.22998046875, -1.359619140625, -0.4892578125, 0.381103515625, 1.25146484375, 2.121826171875, 2.9921875, 3.862548828125, 4.73291015625, 5.603271484375, 6.4736328125, 7.343994140625, 8.21435546875, 9.084716796875, 9.955078125, 10.825439453125, 11.69580078125, 12.566162109375, 13.4365234375, 14.306884765625, 15.17724609375, 16.047607421875, 16.91796875, 17.788330078125, 18.65869140625, 19.529052734375, 20.3994140625, 21.269775390625, 22.14013671875, 23.010498046875, 23.880859375, 24.751220703125, 25.62158203125, 26.491943359375, 27.3623046875, 28.232666015625, 29.10302734375, 29.973388671875, 30.84375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 10.0, 27.0, 40.0, 52.0, 82.0, 138.0, 163.0, 157.0, 125.0, 105.0, 44.0, 25.0, 11.0, 5.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.064453125, -1.031005859375, -0.99755859375, -0.964111328125, -0.9306640625, -0.897216796875, -0.86376953125, -0.830322265625, -0.796875, -0.763427734375, -0.72998046875, -0.696533203125, -0.6630859375, -0.629638671875, -0.59619140625, -0.562744140625, -0.529296875, -0.495849609375, -0.46240234375, -0.428955078125, -0.3955078125, -0.362060546875, -0.32861328125, -0.295166015625, -0.26171875, -0.228271484375, -0.19482421875, -0.161376953125, -0.1279296875, -0.094482421875, -0.06103515625, -0.027587890625, 0.005859375, 0.039306640625, 0.07275390625, 0.106201171875, 0.1396484375, 0.173095703125, 0.20654296875, 0.239990234375, 0.2734375, 0.306884765625, 0.34033203125, 0.373779296875, 0.4072265625, 0.440673828125, 0.47412109375, 0.507568359375, 0.541015625, 0.574462890625, 0.60791015625, 0.641357421875, 0.6748046875, 0.708251953125, 0.74169921875, 0.775146484375, 0.80859375, 0.842041015625, 0.87548828125, 0.908935546875, 0.9423828125, 0.975830078125, 1.00927734375, 1.042724609375, 1.076171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 12.0, 14.0, 33.0, 30.0, 59.0, 68.0, 94.0, 151.0, 284.0, 491.0, 996.0, 2268.0, 7460.0, 36503.0, 510620.0, 3533991.0, 83406.0, 11938.0, 3187.0, 1196.0, 544.0, 286.0, 175.0, 128.0, 88.0, 51.0, 54.0, 29.0, 16.0, 20.0, 14.0, 16.0, 10.0, 10.0, 11.0, 1.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.203125, -17.481201171875, -16.75927734375, -16.037353515625, -15.3154296875, -14.593505859375, -13.87158203125, -13.149658203125, -12.427734375, -11.705810546875, -10.98388671875, -10.261962890625, -9.5400390625, -8.818115234375, -8.09619140625, -7.374267578125, -6.65234375, -5.930419921875, -5.20849609375, -4.486572265625, -3.7646484375, -3.042724609375, -2.32080078125, -1.598876953125, -0.876953125, -0.155029296875, 0.56689453125, 1.288818359375, 2.0107421875, 2.732666015625, 3.45458984375, 4.176513671875, 4.8984375, 5.620361328125, 6.34228515625, 7.064208984375, 7.7861328125, 8.508056640625, 9.22998046875, 9.951904296875, 10.673828125, 11.395751953125, 12.11767578125, 12.839599609375, 13.5615234375, 14.283447265625, 15.00537109375, 15.727294921875, 16.44921875, 17.171142578125, 17.89306640625, 18.614990234375, 19.3369140625, 20.058837890625, 20.78076171875, 21.502685546875, 22.224609375, 22.946533203125, 23.66845703125, 24.390380859375, 25.1123046875, 25.834228515625, 26.55615234375, 27.278076171875, 28.0]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 13.0, 7.0, 9.0, 12.0, 12.0, 13.0, 17.0, 25.0, 23.0, 52.0, 58.0, 61.0, 82.0, 104.0, 116.0, 166.0, 211.0, 270.0, 397.0, 953.0, 434.0, 280.0, 215.0, 160.0, 100.0, 70.0, 58.0, 40.0, 31.0, 16.0, 22.0, 9.0, 9.0, 10.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.7929840087890625, -2.718780517578125, -2.6445770263671875, -2.57037353515625, -2.4961700439453125, -2.421966552734375, -2.3477630615234375, -2.2735595703125, -2.1993560791015625, -2.125152587890625, -2.0509490966796875, -1.97674560546875, -1.9025421142578125, -1.828338623046875, -1.7541351318359375, -1.679931640625, -1.6057281494140625, -1.531524658203125, -1.4573211669921875, -1.38311767578125, -1.3089141845703125, -1.234710693359375, -1.1605072021484375, -1.0863037109375, -1.0121002197265625, -0.937896728515625, -0.8636932373046875, -0.78948974609375, -0.7152862548828125, -0.641082763671875, -0.5668792724609375, -0.49267578125, -0.4184722900390625, -0.344268798828125, -0.2700653076171875, -0.19586181640625, -0.1216583251953125, -0.047454833984375, 0.0267486572265625, 0.1009521484375, 0.1751556396484375, 0.249359130859375, 0.3235626220703125, 0.39776611328125, 0.4719696044921875, 0.546173095703125, 0.6203765869140625, 0.694580078125, 0.7687835693359375, 0.842987060546875, 0.9171905517578125, 0.99139404296875, 1.0655975341796875, 1.139801025390625, 1.2140045166015625, 1.2882080078125, 1.3624114990234375, 1.436614990234375, 1.5108184814453125, 1.58502197265625, 1.6592254638671875, 1.733428955078125, 1.8076324462890625, 1.8818359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 7.0, 8.0, 34.0, 104.0, 326.0, 509.0, 24.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.809326171875, -265.9299621582031, -260.0505676269531, -254.17120361328125, -248.29183959960938, -242.41246032714844, -236.5330810546875, -230.65371704101562, -224.7743377685547, -218.89495849609375, -213.01559448242188, -207.13621520996094, -201.2568359375, -195.37747192382812, -189.4980926513672, -183.61871337890625, -177.73934936523438, -171.85997009277344, -165.98060607910156, -160.10122680664062, -154.22186279296875, -148.3424835205078, -142.46310424804688, -136.583740234375, -130.70436096191406, -124.82498931884766, -118.94561767578125, -113.06623840332031, -107.1868667602539, -101.3074951171875, -95.42811584472656, -89.54874420166016, -83.66937255859375, -77.79000091552734, -71.91062927246094, -66.03125, -60.151878356933594, -54.27250671386719, -48.393131256103516, -42.513755798339844, -36.63438415527344, -30.7550106048584, -24.87563705444336, -18.99626350402832, -13.116889953613281, -7.237516403198242, -1.3581428527832031, 4.521232604980469, 10.400604248046875, 16.279977798461914, 22.159351348876953, 28.038724899291992, 33.91809844970703, 39.79747009277344, 45.67684555053711, 51.55622100830078, 57.43559265136719, 63.314964294433594, 69.1943359375, 75.07371520996094, 80.95308685302734, 86.83245849609375, 92.71183776855469, 98.5912094116211, 104.4705810546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 9.0, 16.0, 18.0, 21.0, 43.0, 38.0, 63.0, 64.0, 98.0, 91.0, 94.0, 94.0, 74.0, 76.0, 55.0, 42.0, 32.0, 20.0, 24.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.99345016479492, -46.60926818847656, -45.2250862121582, -43.840904235839844, -42.456722259521484, -41.072540283203125, -39.688358306884766, -38.304176330566406, -36.91999435424805, -35.53581237792969, -34.15163040161133, -32.76744842529297, -31.38326644897461, -29.99908447265625, -28.61490249633789, -27.23072052001953, -25.84653663635254, -24.46235466003418, -23.07817268371582, -21.69399070739746, -20.3098087310791, -18.925626754760742, -17.54144287109375, -16.15726089477539, -14.773079872131348, -13.388897895812988, -12.004715919494629, -10.620532989501953, -9.236351013183594, -7.852169513702393, -6.467987060546875, -5.083805084228516, -3.6996231079101562, -2.315441131591797, -0.9312589168548584, 0.4529232978820801, 1.8371052742004395, 3.221287250518799, 4.605469703674316, 5.989651679992676, 7.373833656311035, 8.758015632629395, 10.142197608947754, 11.52638053894043, 12.910562515258789, 14.294744491577148, 15.678926467895508, 17.063108444213867, 18.447290420532227, 19.831472396850586, 21.215654373168945, 22.599836349487305, 23.984018325805664, 25.368200302124023, 26.752384185791016, 28.136566162109375, 29.520748138427734, 30.904930114746094, 32.28911209106445, 33.67329406738281, 35.05747604370117, 36.44165802001953, 37.82583999633789, 39.21002197265625, 40.59420394897461]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 12.0, 13.0, 30.0, 16.0, 25.0, 30.0, 52.0, 80.0, 75.0, 129.0, 151.0, 260.0, 373.0, 546.0, 858.0, 1379.0, 2524.0, 5013.0, 14703.0, 70060.0, 665135.0, 236220.0, 33180.0, 8859.0, 3653.0, 1863.0, 1052.0, 688.0, 445.0, 304.0, 217.0, 156.0, 122.0, 65.0, 49.0, 63.0, 38.0, 23.0, 21.0, 18.0, 14.0, 5.0, 4.0, 2.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.5, -8.24072265625, -7.9814453125, -7.72216796875, -7.462890625, -7.20361328125, -6.9443359375, -6.68505859375, -6.42578125, -6.16650390625, -5.9072265625, -5.64794921875, -5.388671875, -5.12939453125, -4.8701171875, -4.61083984375, -4.3515625, -4.09228515625, -3.8330078125, -3.57373046875, -3.314453125, -3.05517578125, -2.7958984375, -2.53662109375, -2.27734375, -2.01806640625, -1.7587890625, -1.49951171875, -1.240234375, -0.98095703125, -0.7216796875, -0.46240234375, -0.203125, 0.05615234375, 0.3154296875, 0.57470703125, 0.833984375, 1.09326171875, 1.3525390625, 1.61181640625, 1.87109375, 2.13037109375, 2.3896484375, 2.64892578125, 2.908203125, 3.16748046875, 3.4267578125, 3.68603515625, 3.9453125, 4.20458984375, 4.4638671875, 4.72314453125, 4.982421875, 5.24169921875, 5.5009765625, 5.76025390625, 6.01953125, 6.27880859375, 6.5380859375, 6.79736328125, 7.056640625, 7.31591796875, 7.5751953125, 7.83447265625, 8.09375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 11.0, 27.0, 48.0, 65.0, 98.0, 127.0, 136.0, 155.0, 112.0, 64.0, 62.0, 22.0, 20.0, 8.0, 4.0, 0.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2568359375, -1.2257919311523438, -1.1947479248046875, -1.1637039184570312, -1.132659912109375, -1.1016159057617188, -1.0705718994140625, -1.0395278930664062, -1.00848388671875, -0.9774398803710938, -0.9463958740234375, -0.9153518676757812, -0.884307861328125, -0.8532638549804688, -0.8222198486328125, -0.7911758422851562, -0.7601318359375, -0.7290878295898438, -0.6980438232421875, -0.6669998168945312, -0.635955810546875, -0.6049118041992188, -0.5738677978515625, -0.5428237915039062, -0.51177978515625, -0.48073577880859375, -0.4496917724609375, -0.41864776611328125, -0.387603759765625, -0.35655975341796875, -0.3255157470703125, -0.29447174072265625, -0.263427734375, -0.23238372802734375, -0.2013397216796875, -0.17029571533203125, -0.139251708984375, -0.10820770263671875, -0.0771636962890625, -0.04611968994140625, -0.01507568359375, 0.01596832275390625, 0.0470123291015625, 0.07805633544921875, 0.109100341796875, 0.14014434814453125, 0.1711883544921875, 0.20223236083984375, 0.2332763671875, 0.26432037353515625, 0.2953643798828125, 0.32640838623046875, 0.357452392578125, 0.38849639892578125, 0.4195404052734375, 0.45058441162109375, 0.48162841796875, 0.5126724243164062, 0.5437164306640625, 0.5747604370117188, 0.605804443359375, 0.6368484497070312, 0.6678924560546875, 0.6989364624023438, 0.72998046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 12.0, 12.0, 18.0, 36.0, 55.0, 154.0, 326.0, 883.0, 2650.0, 14076.0, 413344.0, 596855.0, 15669.0, 2924.0, 876.0, 338.0, 141.0, 70.0, 40.0, 18.0, 17.0, 12.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.09375, -27.31396484375, -26.5341796875, -25.75439453125, -24.974609375, -24.19482421875, -23.4150390625, -22.63525390625, -21.85546875, -21.07568359375, -20.2958984375, -19.51611328125, -18.736328125, -17.95654296875, -17.1767578125, -16.39697265625, -15.6171875, -14.83740234375, -14.0576171875, -13.27783203125, -12.498046875, -11.71826171875, -10.9384765625, -10.15869140625, -9.37890625, -8.59912109375, -7.8193359375, -7.03955078125, -6.259765625, -5.47998046875, -4.7001953125, -3.92041015625, -3.140625, -2.36083984375, -1.5810546875, -0.80126953125, -0.021484375, 0.75830078125, 1.5380859375, 2.31787109375, 3.09765625, 3.87744140625, 4.6572265625, 5.43701171875, 6.216796875, 6.99658203125, 7.7763671875, 8.55615234375, 9.3359375, 10.11572265625, 10.8955078125, 11.67529296875, 12.455078125, 13.23486328125, 14.0146484375, 14.79443359375, 15.57421875, 16.35400390625, 17.1337890625, 17.91357421875, 18.693359375, 19.47314453125, 20.2529296875, 21.03271484375, 21.8125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 12.0, 20.0, 23.0, 23.0, 37.0, 33.0, 33.0, 63.0, 68.0, 65.0, 72.0, 70.0, 63.0, 65.0, 56.0, 45.0, 52.0, 44.0, 30.0, 25.0, 16.0, 21.0, 16.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.2115478515625, -5.020751953125, -4.8299560546875, -4.63916015625, -4.4483642578125, -4.257568359375, -4.0667724609375, -3.8759765625, -3.6851806640625, -3.494384765625, -3.3035888671875, -3.11279296875, -2.9219970703125, -2.731201171875, -2.5404052734375, -2.349609375, -2.1588134765625, -1.968017578125, -1.7772216796875, -1.58642578125, -1.3956298828125, -1.204833984375, -1.0140380859375, -0.8232421875, -0.6324462890625, -0.441650390625, -0.2508544921875, -0.06005859375, 0.1307373046875, 0.321533203125, 0.5123291015625, 0.703125, 0.8939208984375, 1.084716796875, 1.2755126953125, 1.46630859375, 1.6571044921875, 1.847900390625, 2.0386962890625, 2.2294921875, 2.4202880859375, 2.611083984375, 2.8018798828125, 2.99267578125, 3.1834716796875, 3.374267578125, 3.5650634765625, 3.755859375, 3.9466552734375, 4.137451171875, 4.3282470703125, 4.51904296875, 4.7098388671875, 4.900634765625, 5.0914306640625, 5.2822265625, 5.4730224609375, 5.663818359375, 5.8546142578125, 6.04541015625, 6.2362060546875, 6.427001953125, 6.6177978515625, 6.80859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 6.0, 3.0, 6.0, 11.0, 9.0, 20.0, 16.0, 37.0, 76.0, 183.0, 414.0, 1239.0, 12699.0, 1027252.0, 5032.0, 951.0, 288.0, 138.0, 62.0, 47.0, 18.0, 12.0, 13.0, 7.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.25, -157.52734375, -152.8046875, -148.08203125, -143.359375, -138.63671875, -133.9140625, -129.19140625, -124.46875, -119.74609375, -115.0234375, -110.30078125, -105.578125, -100.85546875, -96.1328125, -91.41015625, -86.6875, -81.96484375, -77.2421875, -72.51953125, -67.796875, -63.07421875, -58.3515625, -53.62890625, -48.90625, -44.18359375, -39.4609375, -34.73828125, -30.015625, -25.29296875, -20.5703125, -15.84765625, -11.125, -6.40234375, -1.6796875, 3.04296875, 7.765625, 12.48828125, 17.2109375, 21.93359375, 26.65625, 31.37890625, 36.1015625, 40.82421875, 45.546875, 50.26953125, 54.9921875, 59.71484375, 64.4375, 69.16015625, 73.8828125, 78.60546875, 83.328125, 88.05078125, 92.7734375, 97.49609375, 102.21875, 106.94140625, 111.6640625, 116.38671875, 121.109375, 125.83203125, 130.5546875, 135.27734375, 140.0]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 3.0, 4.0, 3.0, 7.0, 14.0, 19.0, 49.0, 183.0, 401.0, 184.0, 64.0, 27.0, 17.0, 8.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008707046508789062, -0.0008210986852645874, -0.0007714927196502686, -0.0007218867540359497, -0.0006722807884216309, -0.000622674822807312, -0.0005730688571929932, -0.0005234628915786743, -0.00047385692596435547, -0.0004242509603500366, -0.0003746449947357178, -0.0003250390291213989, -0.0002754330635070801, -0.00022582709789276123, -0.00017622113227844238, -0.00012661516666412354, -7.700920104980469e-05, -2.740323543548584e-05, 2.2202730178833008e-05, 7.180869579315186e-05, 0.0001214146614074707, 0.00017102062702178955, 0.0002206265926361084, 0.00027023255825042725, 0.0003198385238647461, 0.00036944448947906494, 0.0004190504550933838, 0.00046865642070770264, 0.0005182623863220215, 0.0005678683519363403, 0.0006174743175506592, 0.000667080283164978, 0.0007166862487792969, 0.0007662922143936157, 0.0008158981800079346, 0.0008655041456222534, 0.0009151101112365723, 0.0009647160768508911, 0.00101432204246521, 0.0010639280080795288, 0.0011135339736938477, 0.0011631399393081665, 0.0012127459049224854, 0.0012623518705368042, 0.001311957836151123, 0.001361563801765442, 0.0014111697673797607, 0.0014607757329940796, 0.0015103816986083984, 0.0015599876642227173, 0.0016095936298370361, 0.001659199595451355, 0.0017088055610656738, 0.0017584115266799927, 0.0018080174922943115, 0.0018576234579086304, 0.0019072294235229492, 0.001956835389137268, 0.002006441354751587, 0.0020560473203659058, 0.0021056532859802246, 0.0021552592515945435, 0.0022048652172088623, 0.002254471182823181, 0.0023040771484375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 6.0, 9.0, 6.0, 12.0, 15.0, 11.0, 39.0, 36.0, 50.0, 70.0, 76.0, 147.0, 219.0, 375.0, 601.0, 1132.0, 2358.0, 5451.0, 18366.0, 810817.0, 185539.0, 13937.0, 4726.0, 1999.0, 1034.0, 542.0, 297.0, 193.0, 152.0, 95.0, 68.0, 31.0, 39.0, 23.0, 20.0, 19.0, 14.0, 7.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.8125, -25.916015625, -25.01953125, -24.123046875, -23.2265625, -22.330078125, -21.43359375, -20.537109375, -19.640625, -18.744140625, -17.84765625, -16.951171875, -16.0546875, -15.158203125, -14.26171875, -13.365234375, -12.46875, -11.572265625, -10.67578125, -9.779296875, -8.8828125, -7.986328125, -7.08984375, -6.193359375, -5.296875, -4.400390625, -3.50390625, -2.607421875, -1.7109375, -0.814453125, 0.08203125, 0.978515625, 1.875, 2.771484375, 3.66796875, 4.564453125, 5.4609375, 6.357421875, 7.25390625, 8.150390625, 9.046875, 9.943359375, 10.83984375, 11.736328125, 12.6328125, 13.529296875, 14.42578125, 15.322265625, 16.21875, 17.115234375, 18.01171875, 18.908203125, 19.8046875, 20.701171875, 21.59765625, 22.494140625, 23.390625, 24.287109375, 25.18359375, 26.080078125, 26.9765625, 27.873046875, 28.76953125, 29.666015625, 30.5625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 5.0, 7.0, 7.0, 9.0, 11.0, 17.0, 32.0, 61.0, 252.0, 354.0, 124.0, 33.0, 20.0, 11.0, 11.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-18.5625, -18.064453125, -17.56640625, -17.068359375, -16.5703125, -16.072265625, -15.57421875, -15.076171875, -14.578125, -14.080078125, -13.58203125, -13.083984375, -12.5859375, -12.087890625, -11.58984375, -11.091796875, -10.59375, -10.095703125, -9.59765625, -9.099609375, -8.6015625, -8.103515625, -7.60546875, -7.107421875, -6.609375, -6.111328125, -5.61328125, -5.115234375, -4.6171875, -4.119140625, -3.62109375, -3.123046875, -2.625, -2.126953125, -1.62890625, -1.130859375, -0.6328125, -0.134765625, 0.36328125, 0.861328125, 1.359375, 1.857421875, 2.35546875, 2.853515625, 3.3515625, 3.849609375, 4.34765625, 4.845703125, 5.34375, 5.841796875, 6.33984375, 6.837890625, 7.3359375, 7.833984375, 8.33203125, 8.830078125, 9.328125, 9.826171875, 10.32421875, 10.822265625, 11.3203125, 11.818359375, 12.31640625, 12.814453125, 13.3125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 6.0, 20.0, 63.0, 132.0, 394.0, 264.0, 75.0, 23.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.96810913085938, -172.7336883544922, -165.499267578125, -158.2648468017578, -151.03042602539062, -143.7960205078125, -136.56158447265625, -129.32717895507812, -122.09275817871094, -114.85833740234375, -107.62391662597656, -100.38949584960938, -93.15508270263672, -85.92066192626953, -78.68624114990234, -71.45182800292969, -64.21739959716797, -56.98297882080078, -49.74856185913086, -42.51414108276367, -35.27972412109375, -28.045303344726562, -20.810882568359375, -13.576465606689453, -6.342044830322266, 0.8923745155334473, 8.12679386138916, 15.361213684082031, 22.595632553100586, 29.83005142211914, 37.06447219848633, 44.29888916015625, 51.53330993652344, 58.767730712890625, 66.00215148925781, 73.236572265625, 80.47098541259766, 87.70540618896484, 94.93982696533203, 102.17424011230469, 109.40866088867188, 116.64308166503906, 123.87750244140625, 131.11192321777344, 138.34634399414062, 145.58074951171875, 152.815185546875, 160.04959106445312, 167.28402709960938, 174.51844787597656, 181.75286865234375, 188.98728942871094, 196.22171020507812, 203.45611572265625, 210.6905517578125, 217.92495727539062, 225.1593780517578, 232.393798828125, 239.6282196044922, 246.86264038085938, 254.09706115722656, 261.33148193359375, 268.5658874511719, 275.8003234863281, 283.03472900390625]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 17.0, 16.0, 27.0, 36.0, 56.0, 73.0, 86.0, 102.0, 100.0, 97.0, 92.0, 72.0, 61.0, 42.0, 39.0, 18.0, 10.0, 12.0, 3.0, 5.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.634521484375, -71.15935516357422, -68.68419647216797, -66.20903015136719, -63.73386764526367, -61.258705139160156, -58.783538818359375, -56.30837631225586, -53.833213806152344, -51.35805130004883, -48.88288497924805, -46.40772247314453, -43.932559967041016, -41.4573974609375, -38.98223114013672, -36.5070686340332, -34.03190231323242, -31.556737899780273, -29.081575393676758, -26.60641098022461, -24.131248474121094, -21.656084060668945, -19.180919647216797, -16.70575714111328, -14.230592727661133, -11.7554292678833, -9.280265808105469, -6.80510139465332, -4.329937934875488, -1.8547744750976562, 0.6203899383544922, 3.095552444458008, 5.570716857910156, 8.045880317687988, 10.52104377746582, 12.996208190917969, 15.4713716506958, 17.946535110473633, 20.42169952392578, 22.896862030029297, 25.372026443481445, 27.847190856933594, 30.32235336303711, 32.797515869140625, 35.272682189941406, 37.74784469604492, 40.22300720214844, 42.69817352294922, 45.173336029052734, 47.64849853515625, 50.12366485595703, 52.59882736206055, 55.07398986816406, 57.549156188964844, 60.02431869506836, 62.499481201171875, 64.97464752197266, 67.44981384277344, 69.92497253417969, 72.40013885498047, 74.87530517578125, 77.3504638671875, 79.82563018798828, 82.30079650878906, 84.77595520019531]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 9.0, 14.0, 21.0, 33.0, 131.0, 717.0, 4183262.0, 9850.0, 160.0, 37.0, 20.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2039.0, -1987.765625, -1936.53125, -1885.296875, -1834.0625, -1782.828125, -1731.59375, -1680.359375, -1629.125, -1577.890625, -1526.65625, -1475.421875, -1424.1875, -1372.953125, -1321.71875, -1270.484375, -1219.25, -1168.015625, -1116.78125, -1065.546875, -1014.3125, -963.078125, -911.84375, -860.609375, -809.375, -758.140625, -706.90625, -655.671875, -604.4375, -553.203125, -501.96875, -450.734375, -399.5, -348.265625, -297.03125, -245.796875, -194.5625, -143.328125, -92.09375, -40.859375, 10.375, 61.609375, 112.84375, 164.078125, 215.3125, 266.546875, 317.78125, 369.015625, 420.25, 471.484375, 522.71875, 573.953125, 625.1875, 676.421875, 727.65625, 778.890625, 830.125, 881.359375, 932.59375, 983.828125, 1035.0625, 1086.296875, 1137.53125, 1188.765625, 1240.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 13.0, 9.0, 28.0, 25.0, 60.0, 73.0, 91.0, 108.0, 114.0, 102.0, 104.0, 80.0, 59.0, 36.0, 27.0, 21.0, 12.0, 8.0, 3.0, 6.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.3743438720703125, -1.340484619140625, -1.3066253662109375, -1.27276611328125, -1.2389068603515625, -1.205047607421875, -1.1711883544921875, -1.1373291015625, -1.1034698486328125, -1.069610595703125, -1.0357513427734375, -1.00189208984375, -0.9680328369140625, -0.934173583984375, -0.9003143310546875, -0.866455078125, -0.8325958251953125, -0.798736572265625, -0.7648773193359375, -0.73101806640625, -0.6971588134765625, -0.663299560546875, -0.6294403076171875, -0.5955810546875, -0.5617218017578125, -0.527862548828125, -0.4940032958984375, -0.46014404296875, -0.4262847900390625, -0.392425537109375, -0.3585662841796875, -0.32470703125, -0.2908477783203125, -0.256988525390625, -0.2231292724609375, -0.18927001953125, -0.1554107666015625, -0.121551513671875, -0.0876922607421875, -0.0538330078125, -0.0199737548828125, 0.013885498046875, 0.0477447509765625, 0.08160400390625, 0.1154632568359375, 0.149322509765625, 0.1831817626953125, 0.217041015625, 0.2509002685546875, 0.284759521484375, 0.3186187744140625, 0.35247802734375, 0.3863372802734375, 0.420196533203125, 0.4540557861328125, 0.4879150390625, 0.5217742919921875, 0.555633544921875, 0.5894927978515625, 0.62335205078125, 0.6572113037109375, 0.691070556640625, 0.7249298095703125, 0.7587890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 11.0, 26.0, 108.0, 382.0, 4183171.0, 9476.0, 447.0, 266.0, 174.0, 110.0, 52.0, 33.0, 17.0, 6.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.0, -89.484375, -73.96875, -58.453125, -42.9375, -27.421875, -11.90625, 3.609375, 19.125, 34.640625, 50.15625, 65.671875, 81.1875, 96.703125, 112.21875, 127.734375, 143.25, 158.765625, 174.28125, 189.796875, 205.3125, 220.828125, 236.34375, 251.859375, 267.375, 282.890625, 298.40625, 313.921875, 329.4375, 344.953125, 360.46875, 375.984375, 391.5, 407.015625, 422.53125, 438.046875, 453.5625, 469.078125, 484.59375, 500.109375, 515.625, 531.140625, 546.65625, 562.171875, 577.6875, 593.203125, 608.71875, 624.234375, 639.75, 655.265625, 670.78125, 686.296875, 701.8125, 717.328125, 732.84375, 748.359375, 763.875, 779.390625, 794.90625, 810.421875, 825.9375, 841.453125, 856.96875, 872.484375, 888.0]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 32.0, 43.0, 83.0, 246.0, 1566.0, 974.0, 462.0, 282.0, 184.0, 82.0, 50.0, 26.0, 16.0, 12.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.732391357421875, -2.58001708984375, -2.427642822265625, -2.2752685546875, -2.122894287109375, -1.97052001953125, -1.818145751953125, -1.665771484375, -1.513397216796875, -1.36102294921875, -1.208648681640625, -1.0562744140625, -0.903900146484375, -0.75152587890625, -0.599151611328125, -0.44677734375, -0.294403076171875, -0.14202880859375, 0.010345458984375, 0.1627197265625, 0.315093994140625, 0.46746826171875, 0.619842529296875, 0.772216796875, 0.924591064453125, 1.07696533203125, 1.229339599609375, 1.3817138671875, 1.534088134765625, 1.68646240234375, 1.838836669921875, 1.9912109375, 2.143585205078125, 2.29595947265625, 2.448333740234375, 2.6007080078125, 2.753082275390625, 2.90545654296875, 3.057830810546875, 3.210205078125, 3.362579345703125, 3.51495361328125, 3.667327880859375, 3.8197021484375, 3.972076416015625, 4.12445068359375, 4.276824951171875, 4.42919921875, 4.581573486328125, 4.73394775390625, 4.886322021484375, 5.0386962890625, 5.191070556640625, 5.34344482421875, 5.495819091796875, 5.648193359375, 5.800567626953125, 5.95294189453125, 6.105316162109375, 6.2576904296875, 6.410064697265625, 6.56243896484375, 6.714813232421875, 6.8671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [612.0, 391.0, 16.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.79662322998047, 3.957538604736328, 64.71170043945312, 125.46585845947266, 186.22003173828125, 246.97418212890625, 307.72833251953125, 368.4825134277344, 429.2366638183594, 489.9908142089844, 550.7449951171875, 611.4991455078125, 672.2532958984375, 733.0074462890625, 793.7615966796875, 854.5158081054688, 915.2699584960938, 976.0241088867188, 1036.7783203125, 1097.532470703125, 1158.28662109375, 1219.040771484375, 1279.794921875, 1340.549072265625, 1401.30322265625, 1462.057373046875, 1522.8115234375, 1583.565673828125, 1644.31982421875, 1705.073974609375, 1765.828125, 1826.5823974609375, 1887.3365478515625, 1948.0906982421875, 2008.8448486328125, 2069.59912109375, 2130.353271484375, 2191.107421875, 2251.861572265625, 2312.61572265625, 2373.369873046875, 2434.1240234375, 2494.878173828125, 2555.63232421875, 2616.386474609375, 2677.140625, 2737.894775390625, 2798.64892578125, 2859.403076171875, 2920.1572265625, 2980.911376953125, 3041.66552734375, 3102.419677734375, 3163.173828125, 3223.927978515625, 3284.68212890625, 3345.4365234375, 3406.190673828125, 3466.94482421875, 3527.698974609375, 3588.453125, 3649.207275390625, 3709.96142578125, 3770.715576171875, 3831.4697265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 15.0, 28.0, 42.0, 81.0, 107.0, 146.0, 165.0, 142.0, 112.0, 82.0, 40.0, 19.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.37444305419922, -54.753570556640625, -50.13269805908203, -45.51182556152344, -40.890953063964844, -36.27008056640625, -31.649208068847656, -27.028335571289062, -22.40746307373047, -17.786590576171875, -13.165718078613281, -8.544845581054688, -3.9239730834960938, 0.6968994140625, 5.317771911621094, 9.938644409179688, 14.559516906738281, 19.180389404296875, 23.80126190185547, 28.422134399414062, 33.043006896972656, 37.66387939453125, 42.284751892089844, 46.90562438964844, 51.52649688720703, 56.147369384765625, 60.76824188232422, 65.38911437988281, 70.0099868774414, 74.630859375, 79.2517318725586, 83.87260437011719, 88.49346923828125, 93.11434173583984, 97.73521423339844, 102.35608673095703, 106.97695922851562, 111.59783172607422, 116.21870422363281, 120.8395767211914, 125.46044921875, 130.08132934570312, 134.7021942138672, 139.32305908203125, 143.94393920898438, 148.5648193359375, 153.18568420410156, 157.80654907226562, 162.42742919921875, 167.04830932617188, 171.66917419433594, 176.2900390625, 180.91091918945312, 185.53179931640625, 190.1526641845703, 194.77352905273438, 199.3944091796875, 204.01528930664062, 208.6361541748047, 213.25701904296875, 217.87789916992188, 222.498779296875, 227.11964416503906, 231.74050903320312, 236.36138916015625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 6.0, 5.0, 13.0, 17.0, 16.0, 29.0, 33.0, 51.0, 67.0, 94.0, 157.0, 239.0, 376.0, 630.0, 1151.0, 1975.0, 3994.0, 8749.0, 22778.0, 79935.0, 537640.0, 304284.0, 54487.0, 17206.0, 7057.0, 3252.0, 1685.0, 1023.0, 558.0, 357.0, 205.0, 141.0, 98.0, 68.0, 48.0, 30.0, 24.0, 17.0, 20.0, 11.0, 5.0, 9.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.77587890625, -10.4267578125, -10.07763671875, -9.728515625, -9.37939453125, -9.0302734375, -8.68115234375, -8.33203125, -7.98291015625, -7.6337890625, -7.28466796875, -6.935546875, -6.58642578125, -6.2373046875, -5.88818359375, -5.5390625, -5.18994140625, -4.8408203125, -4.49169921875, -4.142578125, -3.79345703125, -3.4443359375, -3.09521484375, -2.74609375, -2.39697265625, -2.0478515625, -1.69873046875, -1.349609375, -1.00048828125, -0.6513671875, -0.30224609375, 0.046875, 0.39599609375, 0.7451171875, 1.09423828125, 1.443359375, 1.79248046875, 2.1416015625, 2.49072265625, 2.83984375, 3.18896484375, 3.5380859375, 3.88720703125, 4.236328125, 4.58544921875, 4.9345703125, 5.28369140625, 5.6328125, 5.98193359375, 6.3310546875, 6.68017578125, 7.029296875, 7.37841796875, 7.7275390625, 8.07666015625, 8.42578125, 8.77490234375, 9.1240234375, 9.47314453125, 9.822265625, 10.17138671875, 10.5205078125, 10.86962890625, 11.21875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 7.0, 9.0, 15.0, 22.0, 37.0, 34.0, 56.0, 78.0, 82.0, 85.0, 107.0, 112.0, 91.0, 74.0, 58.0, 44.0, 27.0, 20.0, 13.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.380859375, -1.3483505249023438, -1.3158416748046875, -1.2833328247070312, -1.250823974609375, -1.2183151245117188, -1.1858062744140625, -1.1532974243164062, -1.12078857421875, -1.0882797241210938, -1.0557708740234375, -1.0232620239257812, -0.990753173828125, -0.9582443237304688, -0.9257354736328125, -0.8932266235351562, -0.8607177734375, -0.8282089233398438, -0.7957000732421875, -0.7631912231445312, -0.730682373046875, -0.6981735229492188, -0.6656646728515625, -0.6331558227539062, -0.60064697265625, -0.5681381225585938, -0.5356292724609375, -0.5031204223632812, -0.470611572265625, -0.43810272216796875, -0.4055938720703125, -0.37308502197265625, -0.340576171875, -0.30806732177734375, -0.2755584716796875, -0.24304962158203125, -0.210540771484375, -0.17803192138671875, -0.1455230712890625, -0.11301422119140625, -0.08050537109375, -0.04799652099609375, -0.0154876708984375, 0.01702117919921875, 0.049530029296875, 0.08203887939453125, 0.1145477294921875, 0.14705657958984375, 0.1795654296875, 0.21207427978515625, 0.2445831298828125, 0.27709197998046875, 0.309600830078125, 0.34210968017578125, 0.3746185302734375, 0.40712738037109375, 0.43963623046875, 0.47214508056640625, 0.5046539306640625, 0.5371627807617188, 0.569671630859375, 0.6021804809570312, 0.6346893310546875, 0.6671981811523438, 0.69970703125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 10.0, 6.0, 8.0, 16.0, 16.0, 16.0, 29.0, 39.0, 39.0, 99.0, 340.0, 3429.0, 206081.0, 828438.0, 9057.0, 628.0, 104.0, 46.0, 22.0, 20.0, 24.0, 14.0, 11.0, 14.0, 14.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.55322265625, -35.4501953125, -34.34716796875, -33.244140625, -32.14111328125, -31.0380859375, -29.93505859375, -28.83203125, -27.72900390625, -26.6259765625, -25.52294921875, -24.419921875, -23.31689453125, -22.2138671875, -21.11083984375, -20.0078125, -18.90478515625, -17.8017578125, -16.69873046875, -15.595703125, -14.49267578125, -13.3896484375, -12.28662109375, -11.18359375, -10.08056640625, -8.9775390625, -7.87451171875, -6.771484375, -5.66845703125, -4.5654296875, -3.46240234375, -2.359375, -1.25634765625, -0.1533203125, 0.94970703125, 2.052734375, 3.15576171875, 4.2587890625, 5.36181640625, 6.46484375, 7.56787109375, 8.6708984375, 9.77392578125, 10.876953125, 11.97998046875, 13.0830078125, 14.18603515625, 15.2890625, 16.39208984375, 17.4951171875, 18.59814453125, 19.701171875, 20.80419921875, 21.9072265625, 23.01025390625, 24.11328125, 25.21630859375, 26.3193359375, 27.42236328125, 28.525390625, 29.62841796875, 30.7314453125, 31.83447265625, 32.9375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 8.0, 11.0, 18.0, 20.0, 23.0, 25.0, 21.0, 23.0, 29.0, 41.0, 42.0, 38.0, 46.0, 53.0, 41.0, 54.0, 44.0, 55.0, 49.0, 32.0, 28.0, 32.0, 29.0, 29.0, 19.0, 26.0, 22.0, 24.0, 20.0, 17.0, 7.0, 11.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.029296875, -2.92852783203125, -2.8277587890625, -2.72698974609375, -2.626220703125, -2.52545166015625, -2.4246826171875, -2.32391357421875, -2.22314453125, -2.12237548828125, -2.0216064453125, -1.92083740234375, -1.820068359375, -1.71929931640625, -1.6185302734375, -1.51776123046875, -1.4169921875, -1.31622314453125, -1.2154541015625, -1.11468505859375, -1.013916015625, -0.91314697265625, -0.8123779296875, -0.71160888671875, -0.61083984375, -0.51007080078125, -0.4093017578125, -0.30853271484375, -0.207763671875, -0.10699462890625, -0.0062255859375, 0.09454345703125, 0.1953125, 0.29608154296875, 0.3968505859375, 0.49761962890625, 0.598388671875, 0.69915771484375, 0.7999267578125, 0.90069580078125, 1.00146484375, 1.10223388671875, 1.2030029296875, 1.30377197265625, 1.404541015625, 1.50531005859375, 1.6060791015625, 1.70684814453125, 1.8076171875, 1.90838623046875, 2.0091552734375, 2.10992431640625, 2.210693359375, 2.31146240234375, 2.4122314453125, 2.51300048828125, 2.61376953125, 2.71453857421875, 2.8153076171875, 2.91607666015625, 3.016845703125, 3.11761474609375, 3.2183837890625, 3.31915283203125, 3.419921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 15.0, 33.0, 75.0, 386.0, 6521.0, 1039963.0, 1302.0, 167.0, 48.0, 13.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-397.75, -388.11328125, -378.4765625, -368.83984375, -359.203125, -349.56640625, -339.9296875, -330.29296875, -320.65625, -311.01953125, -301.3828125, -291.74609375, -282.109375, -272.47265625, -262.8359375, -253.19921875, -243.5625, -233.92578125, -224.2890625, -214.65234375, -205.015625, -195.37890625, -185.7421875, -176.10546875, -166.46875, -156.83203125, -147.1953125, -137.55859375, -127.921875, -118.28515625, -108.6484375, -99.01171875, -89.375, -79.73828125, -70.1015625, -60.46484375, -50.828125, -41.19140625, -31.5546875, -21.91796875, -12.28125, -2.64453125, 6.9921875, 16.62890625, 26.265625, 35.90234375, 45.5390625, 55.17578125, 64.8125, 74.44921875, 84.0859375, 93.72265625, 103.359375, 112.99609375, 122.6328125, 132.26953125, 141.90625, 151.54296875, 161.1796875, 170.81640625, 180.453125, 190.08984375, 199.7265625, 209.36328125, 219.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 9.0, 15.0, 28.0, 69.0, 152.0, 295.0, 220.0, 77.0, 43.0, 27.0, 14.0, 14.0, 8.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007638931274414062, -0.000738188624382019, -0.0007124841213226318, -0.0006867796182632446, -0.0006610751152038574, -0.0006353706121444702, -0.000609666109085083, -0.0005839616060256958, -0.0005582571029663086, -0.0005325525999069214, -0.0005068480968475342, -0.00048114359378814697, -0.00045543909072875977, -0.00042973458766937256, -0.00040403008460998535, -0.00037832558155059814, -0.00035262107849121094, -0.00032691657543182373, -0.0003012120723724365, -0.0002755075693130493, -0.0002498030662536621, -0.0002240985631942749, -0.0001983940601348877, -0.0001726895570755005, -0.00014698505401611328, -0.00012128055095672607, -9.557604789733887e-05, -6.987154483795166e-05, -4.416704177856445e-05, -1.8462538719177246e-05, 7.241964340209961e-06, 3.294646739959717e-05, 5.8650970458984375e-05, 8.435547351837158e-05, 0.00011005997657775879, 0.000135764479637146, 0.0001614689826965332, 0.0001871734857559204, 0.00021287798881530762, 0.00023858249187469482, 0.00026428699493408203, 0.00028999149799346924, 0.00031569600105285645, 0.00034140050411224365, 0.00036710500717163086, 0.00039280951023101807, 0.0004185140132904053, 0.0004442185163497925, 0.0004699230194091797, 0.0004956275224685669, 0.0005213320255279541, 0.0005470365285873413, 0.0005727410316467285, 0.0005984455347061157, 0.0006241500377655029, 0.0006498545408248901, 0.0006755590438842773, 0.0007012635469436646, 0.0007269680500030518, 0.000752672553062439, 0.0007783770561218262, 0.0008040815591812134, 0.0008297860622406006, 0.0008554905652999878, 0.000881195068359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 1.0, 4.0, 4.0, 10.0, 21.0, 34.0, 59.0, 83.0, 149.0, 240.0, 485.0, 853.0, 1742.0, 3948.0, 11079.0, 78522.0, 915925.0, 23559.0, 6407.0, 2589.0, 1174.0, 691.0, 390.0, 215.0, 134.0, 104.0, 44.0, 31.0, 19.0, 11.0, 10.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-54.90625, -53.5078125, -52.109375, -50.7109375, -49.3125, -47.9140625, -46.515625, -45.1171875, -43.71875, -42.3203125, -40.921875, -39.5234375, -38.125, -36.7265625, -35.328125, -33.9296875, -32.53125, -31.1328125, -29.734375, -28.3359375, -26.9375, -25.5390625, -24.140625, -22.7421875, -21.34375, -19.9453125, -18.546875, -17.1484375, -15.75, -14.3515625, -12.953125, -11.5546875, -10.15625, -8.7578125, -7.359375, -5.9609375, -4.5625, -3.1640625, -1.765625, -0.3671875, 1.03125, 2.4296875, 3.828125, 5.2265625, 6.625, 8.0234375, 9.421875, 10.8203125, 12.21875, 13.6171875, 15.015625, 16.4140625, 17.8125, 19.2109375, 20.609375, 22.0078125, 23.40625, 24.8046875, 26.203125, 27.6015625, 29.0, 30.3984375, 31.796875, 33.1953125, 34.59375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 4.0, 7.0, 13.0, 8.0, 26.0, 54.0, 120.0, 486.0, 143.0, 54.0, 22.0, 10.0, 10.0, 12.0, 2.0, 2.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.875, -18.163818359375, -17.45263671875, -16.741455078125, -16.0302734375, -15.319091796875, -14.60791015625, -13.896728515625, -13.185546875, -12.474365234375, -11.76318359375, -11.052001953125, -10.3408203125, -9.629638671875, -8.91845703125, -8.207275390625, -7.49609375, -6.784912109375, -6.07373046875, -5.362548828125, -4.6513671875, -3.940185546875, -3.22900390625, -2.517822265625, -1.806640625, -1.095458984375, -0.38427734375, 0.326904296875, 1.0380859375, 1.749267578125, 2.46044921875, 3.171630859375, 3.8828125, 4.593994140625, 5.30517578125, 6.016357421875, 6.7275390625, 7.438720703125, 8.14990234375, 8.861083984375, 9.572265625, 10.283447265625, 10.99462890625, 11.705810546875, 12.4169921875, 13.128173828125, 13.83935546875, 14.550537109375, 15.26171875, 15.972900390625, 16.68408203125, 17.395263671875, 18.1064453125, 18.817626953125, 19.52880859375, 20.239990234375, 20.951171875, 21.662353515625, 22.37353515625, 23.084716796875, 23.7958984375, 24.507080078125, 25.21826171875, 25.929443359375, 26.640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 34.0, 288.0, 596.0, 74.0, 13.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.26786804199219, -103.86064147949219, -92.45341491699219, -81.04619598388672, -69.63896942138672, -58.23174285888672, -46.82452392578125, -35.41729736328125, -24.01007080078125, -12.602846145629883, -1.1956214904785156, 10.211601257324219, 21.61882781982422, 33.02605438232422, 44.43327331542969, 55.84049987792969, 67.24772644042969, 78.65495300292969, 90.06217956542969, 101.46939849853516, 112.87662506103516, 124.28385162353516, 135.69107055664062, 147.09829711914062, 158.50552368164062, 169.91275024414062, 181.31997680664062, 192.72720336914062, 204.13442993164062, 215.54165649414062, 226.94886779785156, 238.35609436035156, 249.7633056640625, 261.1705322265625, 272.5777587890625, 283.9849853515625, 295.3922119140625, 306.7994384765625, 318.2066650390625, 329.6138916015625, 341.0211181640625, 352.4283447265625, 363.8355712890625, 375.2427978515625, 386.6500244140625, 398.0572509765625, 409.4644775390625, 420.8717041015625, 432.2789001464844, 443.6861267089844, 455.0933532714844, 466.5005798339844, 477.9078063964844, 489.3150329589844, 500.72222900390625, 512.1294555664062, 523.5366821289062, 534.9439086914062, 546.3511352539062, 557.7583618164062, 569.1655883789062, 580.5728149414062, 591.9800415039062, 603.3872680664062, 614.7944946289062]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 2.0, 8.0, 15.0, 12.0, 18.0, 28.0, 35.0, 40.0, 45.0, 66.0, 50.0, 69.0, 69.0, 57.0, 83.0, 73.0, 52.0, 49.0, 33.0, 43.0, 25.0, 27.0, 23.0, 17.0, 12.0, 10.0, 5.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.27056121826172, -44.96403503417969, -43.657508850097656, -42.35097885131836, -41.04445266723633, -39.7379264831543, -38.431396484375, -37.12487030029297, -35.81834411621094, -34.511817932128906, -33.205291748046875, -31.898761749267578, -30.592235565185547, -29.285709381103516, -27.97918128967285, -26.672653198242188, -25.366127014160156, -24.059600830078125, -22.75307273864746, -21.446544647216797, -20.140018463134766, -18.833492279052734, -17.52696418762207, -16.220436096191406, -14.913909912109375, -13.607382774353027, -12.30085563659668, -10.994328498840332, -9.687801361083984, -8.381274223327637, -7.074747085571289, -5.768219947814941, -4.461692810058594, -3.155165672302246, -1.8486385345458984, -0.5421113967895508, 0.7644157409667969, 2.0709428787231445, 3.377470016479492, 4.68399715423584, 5.9905242919921875, 7.297051429748535, 8.603578567504883, 9.91010570526123, 11.216632843017578, 12.523159980773926, 13.829687118530273, 15.136214256286621, 16.44274139404297, 17.749267578125, 19.055795669555664, 20.362323760986328, 21.66884994506836, 22.97537612915039, 24.281904220581055, 25.58843231201172, 26.89495849609375, 28.20148468017578, 29.508012771606445, 30.81454086303711, 32.12106704711914, 33.42759323120117, 34.73412322998047, 36.0406494140625, 37.34717559814453]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 2.0, 8.0, 0.0, 12.0, 6.0, 0.0, 10.0, 4.0, 13.0, 25.0, 30.0, 12.0, 26.0, 56.0, 243.0, 4181962.0, 11473.0, 198.0, 48.0, 28.0, 24.0, 16.0, 22.0, 12.0, 10.0, 8.0, 6.0, 8.0, 6.0, 0.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-527.5, -504.4609375, -481.421875, -458.3828125, -435.34375, -412.3046875, -389.265625, -366.2265625, -343.1875, -320.1484375, -297.109375, -274.0703125, -251.03125, -227.9921875, -204.953125, -181.9140625, -158.875, -135.8359375, -112.796875, -89.7578125, -66.71875, -43.6796875, -20.640625, 2.3984375, 25.4375, 48.4765625, 71.515625, 94.5546875, 117.59375, 140.6328125, 163.671875, 186.7109375, 209.75, 232.7890625, 255.828125, 278.8671875, 301.90625, 324.9453125, 347.984375, 371.0234375, 394.0625, 417.1015625, 440.140625, 463.1796875, 486.21875, 509.2578125, 532.296875, 555.3359375, 578.375, 601.4140625, 624.453125, 647.4921875, 670.53125, 693.5703125, 716.609375, 739.6484375, 762.6875, 785.7265625, 808.765625, 831.8046875, 854.84375, 877.8828125, 900.921875, 923.9609375, 947.0]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 9.0, 18.0, 26.0, 29.0, 47.0, 66.0, 66.0, 71.0, 102.0, 95.0, 114.0, 88.0, 84.0, 45.0, 41.0, 33.0, 22.0, 11.0, 11.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.482421875, -1.442901611328125, -1.40338134765625, -1.363861083984375, -1.3243408203125, -1.284820556640625, -1.24530029296875, -1.205780029296875, -1.166259765625, -1.126739501953125, -1.08721923828125, -1.047698974609375, -1.0081787109375, -0.968658447265625, -0.92913818359375, -0.889617919921875, -0.85009765625, -0.810577392578125, -0.77105712890625, -0.731536865234375, -0.6920166015625, -0.652496337890625, -0.61297607421875, -0.573455810546875, -0.533935546875, -0.494415283203125, -0.45489501953125, -0.415374755859375, -0.3758544921875, -0.336334228515625, -0.29681396484375, -0.257293701171875, -0.2177734375, -0.178253173828125, -0.13873291015625, -0.099212646484375, -0.0596923828125, -0.020172119140625, 0.01934814453125, 0.058868408203125, 0.098388671875, 0.137908935546875, 0.17742919921875, 0.216949462890625, 0.2564697265625, 0.295989990234375, 0.33551025390625, 0.375030517578125, 0.41455078125, 0.454071044921875, 0.49359130859375, 0.533111572265625, 0.5726318359375, 0.612152099609375, 0.65167236328125, 0.691192626953125, 0.730712890625, 0.770233154296875, 0.80975341796875, 0.849273681640625, 0.8887939453125, 0.928314208984375, 0.96783447265625, 1.007354736328125, 1.046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 94.0, 853.0, 4193204.0, 121.0, 13.0, 4.0], "bins": [-2226.0, -2189.087890625, -2152.17578125, -2115.263671875, -2078.3515625, -2041.439453125, -2004.52734375, -1967.615234375, -1930.703125, -1893.791015625, -1856.87890625, -1819.966796875, -1783.0546875, -1746.142578125, -1709.23046875, -1672.318359375, -1635.40625, -1598.494140625, -1561.58203125, -1524.669921875, -1487.7578125, -1450.845703125, -1413.93359375, -1377.021484375, -1340.109375, -1303.197265625, -1266.28515625, -1229.373046875, -1192.4609375, -1155.548828125, -1118.63671875, -1081.724609375, -1044.8125, -1007.900390625, -970.98828125, -934.076171875, -897.1640625, -860.251953125, -823.33984375, -786.427734375, -749.515625, -712.603515625, -675.69140625, -638.779296875, -601.8671875, -564.955078125, -528.04296875, -491.130859375, -454.21875, -417.306640625, -380.39453125, -343.482421875, -306.5703125, -269.658203125, -232.74609375, -195.833984375, -158.921875, -122.009765625, -85.09765625, -48.185546875, -11.2734375, 25.638671875, 62.55078125, 99.462890625, 136.375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 16.0, 28.0, 44.0, 115.0, 406.0, 3032.0, 296.0, 66.0, 33.0, 19.0, 7.0, 8.0, 3.0, 4.0, 1.0], "bins": [-12.84375, -12.608154296875, -12.37255859375, -12.136962890625, -11.9013671875, -11.665771484375, -11.43017578125, -11.194580078125, -10.958984375, -10.723388671875, -10.48779296875, -10.252197265625, -10.0166015625, -9.781005859375, -9.54541015625, -9.309814453125, -9.07421875, -8.838623046875, -8.60302734375, -8.367431640625, -8.1318359375, -7.896240234375, -7.66064453125, -7.425048828125, -7.189453125, -6.953857421875, -6.71826171875, -6.482666015625, -6.2470703125, -6.011474609375, -5.77587890625, -5.540283203125, -5.3046875, -5.069091796875, -4.83349609375, -4.597900390625, -4.3623046875, -4.126708984375, -3.89111328125, -3.655517578125, -3.419921875, -3.184326171875, -2.94873046875, -2.713134765625, -2.4775390625, -2.241943359375, -2.00634765625, -1.770751953125, -1.53515625, -1.299560546875, -1.06396484375, -0.828369140625, -0.5927734375, -0.357177734375, -0.12158203125, 0.114013671875, 0.349609375, 0.585205078125, 0.82080078125, 1.056396484375, 1.2919921875, 1.527587890625, 1.76318359375, 1.998779296875, 2.234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1013.0, 7.0], "bins": [-5447.3291015625, -5360.4169921875, -5273.5048828125, -5186.5927734375, -5099.6806640625, -5012.7685546875, -4925.8564453125, -4838.9443359375, -4752.0322265625, -4665.1201171875, -4578.2080078125, -4491.2958984375, -4404.3837890625, -4317.4716796875, -4230.5595703125, -4143.6474609375, -4056.73486328125, -3969.82275390625, -3882.91064453125, -3795.99853515625, -3709.08642578125, -3622.174072265625, -3535.261962890625, -3448.349853515625, -3361.437744140625, -3274.525634765625, -3187.613525390625, -3100.701416015625, -3013.7890625, -2926.876953125, -2839.96484375, -2753.052734375, -2666.140869140625, -2579.228759765625, -2492.316650390625, -2405.404541015625, -2318.4921875, -2231.580078125, -2144.66796875, -2057.755859375, -1970.8436279296875, -1883.9315185546875, -1797.019287109375, -1710.107177734375, -1623.195068359375, -1536.282958984375, -1449.370849609375, -1362.4586181640625, -1275.5465087890625, -1188.6343994140625, -1101.72216796875, -1014.81005859375, -927.89794921875, -840.98583984375, -754.0736694335938, -667.1614990234375, -580.2493896484375, -493.3372497558594, -406.42510986328125, -319.5129699707031, -232.600830078125, -145.68869018554688, -58.77655029296875, 28.1356201171875, 115.04772186279297]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 11.0, 37.0, 72.0, 151.0, 214.0, 236.0, 153.0, 74.0, 40.0, 15.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-270.3216552734375, -264.8896179199219, -259.45758056640625, -254.02554321289062, -248.59352111816406, -243.16148376464844, -237.7294464111328, -232.2974090576172, -226.86538696289062, -221.433349609375, -216.00131225585938, -210.56927490234375, -205.1372528076172, -199.70521545410156, -194.27317810058594, -188.8411407470703, -183.4091033935547, -177.97706604003906, -172.54502868652344, -167.11300659179688, -161.68096923828125, -156.24893188476562, -150.81689453125, -145.38485717773438, -139.95281982421875, -134.52078247070312, -129.0887451171875, -123.6567153930664, -118.22468566894531, -112.79264831542969, -107.36061096191406, -101.92857360839844, -96.4965591430664, -91.06452178955078, -85.63249206542969, -80.20045471191406, -74.76841735839844, -69.33638763427734, -63.90435028076172, -58.47231674194336, -53.040283203125, -47.60824966430664, -42.17621612548828, -36.744178771972656, -31.312145233154297, -25.880111694335938, -20.448074340820312, -15.016040802001953, -9.584007263183594, -4.151972770690918, 1.2800617218017578, 6.71209716796875, 12.14413070678711, 17.57616424560547, 23.008201599121094, 28.440235137939453, 33.87226867675781, 39.30430221557617, 44.73633575439453, 50.168373107910156, 55.600406646728516, 61.032440185546875, 66.4644775390625, 71.89651489257812, 77.32854461669922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 8.0, 4.0, 9.0, 12.0, 7.0, 8.0, 12.0, 26.0, 23.0, 28.0, 28.0, 31.0, 44.0, 66.0, 72.0, 156.0, 1075.0, 280996.0, 763930.0, 1490.0, 167.0, 68.0, 51.0, 42.0, 31.0, 21.0, 29.0, 24.0, 16.0, 17.0, 11.0, 10.0, 7.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-214.125, -207.4453125, -200.765625, -194.0859375, -187.40625, -180.7265625, -174.046875, -167.3671875, -160.6875, -154.0078125, -147.328125, -140.6484375, -133.96875, -127.2890625, -120.609375, -113.9296875, -107.25, -100.5703125, -93.890625, -87.2109375, -80.53125, -73.8515625, -67.171875, -60.4921875, -53.8125, -47.1328125, -40.453125, -33.7734375, -27.09375, -20.4140625, -13.734375, -7.0546875, -0.375, 6.3046875, 12.984375, 19.6640625, 26.34375, 33.0234375, 39.703125, 46.3828125, 53.0625, 59.7421875, 66.421875, 73.1015625, 79.78125, 86.4609375, 93.140625, 99.8203125, 106.5, 113.1796875, 119.859375, 126.5390625, 133.21875, 139.8984375, 146.578125, 153.2578125, 159.9375, 166.6171875, 173.296875, 179.9765625, 186.65625, 193.3359375, 200.015625, 206.6953125, 213.375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 30.0, 153.0, 335.0, 304.0, 148.0, 35.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.792236328125, -34.14697265625, -33.501708984375, -32.8564453125, -32.211181640625, -31.56591796875, -30.920654296875, -30.275390625, -29.630126953125, -28.98486328125, -28.339599609375, -27.6943359375, -27.049072265625, -26.40380859375, -25.758544921875, -25.11328125, -24.468017578125, -23.82275390625, -23.177490234375, -22.5322265625, -21.886962890625, -21.24169921875, -20.596435546875, -19.951171875, -19.305908203125, -18.66064453125, -18.015380859375, -17.3701171875, -16.724853515625, -16.07958984375, -15.434326171875, -14.7890625, -14.143798828125, -13.49853515625, -12.853271484375, -12.2080078125, -11.562744140625, -10.91748046875, -10.272216796875, -9.626953125, -8.981689453125, -8.33642578125, -7.691162109375, -7.0458984375, -6.400634765625, -5.75537109375, -5.110107421875, -4.46484375, -3.819580078125, -3.17431640625, -2.529052734375, -1.8837890625, -1.238525390625, -0.59326171875, 0.052001953125, 0.697265625, 1.342529296875, 1.98779296875, 2.633056640625, 3.2783203125, 3.923583984375, 4.56884765625, 5.214111328125, 5.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 6.0, 5.0, 7.0, 13.0, 19.0, 22.0, 17.0, 25.0, 36.0, 47.0, 81.0, 150.0, 354.0, 1151.0, 10549.0, 575117.0, 449389.0, 9652.0, 1152.0, 324.0, 147.0, 73.0, 61.0, 25.0, 22.0, 20.0, 22.0, 14.0, 8.0, 11.0, 3.0, 6.0, 2.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.875, -125.232421875, -120.58984375, -115.947265625, -111.3046875, -106.662109375, -102.01953125, -97.376953125, -92.734375, -88.091796875, -83.44921875, -78.806640625, -74.1640625, -69.521484375, -64.87890625, -60.236328125, -55.59375, -50.951171875, -46.30859375, -41.666015625, -37.0234375, -32.380859375, -27.73828125, -23.095703125, -18.453125, -13.810546875, -9.16796875, -4.525390625, 0.1171875, 4.759765625, 9.40234375, 14.044921875, 18.6875, 23.330078125, 27.97265625, 32.615234375, 37.2578125, 41.900390625, 46.54296875, 51.185546875, 55.828125, 60.470703125, 65.11328125, 69.755859375, 74.3984375, 79.041015625, 83.68359375, 88.326171875, 92.96875, 97.611328125, 102.25390625, 106.896484375, 111.5390625, 116.181640625, 120.82421875, 125.466796875, 130.109375, 134.751953125, 139.39453125, 144.037109375, 148.6796875, 153.322265625, 157.96484375, 162.607421875, 167.25]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 7.0, 10.0, 9.0, 23.0, 20.0, 19.0, 28.0, 29.0, 33.0, 33.0, 43.0, 50.0, 49.0, 54.0, 71.0, 61.0, 80.0, 46.0, 51.0, 39.0, 38.0, 36.0, 26.0, 29.0, 18.0, 11.0, 19.0, 18.0, 5.0, 11.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.46875, -30.302734375, -29.13671875, -27.970703125, -26.8046875, -25.638671875, -24.47265625, -23.306640625, -22.140625, -20.974609375, -19.80859375, -18.642578125, -17.4765625, -16.310546875, -15.14453125, -13.978515625, -12.8125, -11.646484375, -10.48046875, -9.314453125, -8.1484375, -6.982421875, -5.81640625, -4.650390625, -3.484375, -2.318359375, -1.15234375, 0.013671875, 1.1796875, 2.345703125, 3.51171875, 4.677734375, 5.84375, 7.009765625, 8.17578125, 9.341796875, 10.5078125, 11.673828125, 12.83984375, 14.005859375, 15.171875, 16.337890625, 17.50390625, 18.669921875, 19.8359375, 21.001953125, 22.16796875, 23.333984375, 24.5, 25.666015625, 26.83203125, 27.998046875, 29.1640625, 30.330078125, 31.49609375, 32.662109375, 33.828125, 34.994140625, 36.16015625, 37.326171875, 38.4921875, 39.658203125, 40.82421875, 41.990234375, 43.15625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 11.0, 8.0, 22.0, 35.0, 70.0, 142.0, 309.0, 1058.0, 5573.0, 1002753.0, 35118.0, 2471.0, 569.0, 209.0, 95.0, 51.0, 21.0, 7.0, 13.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.75, -200.12109375, -190.4921875, -180.86328125, -171.234375, -161.60546875, -151.9765625, -142.34765625, -132.71875, -123.08984375, -113.4609375, -103.83203125, -94.203125, -84.57421875, -74.9453125, -65.31640625, -55.6875, -46.05859375, -36.4296875, -26.80078125, -17.171875, -7.54296875, 2.0859375, 11.71484375, 21.34375, 30.97265625, 40.6015625, 50.23046875, 59.859375, 69.48828125, 79.1171875, 88.74609375, 98.375, 108.00390625, 117.6328125, 127.26171875, 136.890625, 146.51953125, 156.1484375, 165.77734375, 175.40625, 185.03515625, 194.6640625, 204.29296875, 213.921875, 223.55078125, 233.1796875, 242.80859375, 252.4375, 262.06640625, 271.6953125, 281.32421875, 290.953125, 300.58203125, 310.2109375, 319.83984375, 329.46875, 339.09765625, 348.7265625, 358.35546875, 367.984375, 377.61328125, 387.2421875, 396.87109375, 406.5]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 9.0, 5.0, 19.0, 19.0, 19.0, 33.0, 37.0, 64.0, 73.0, 103.0, 126.0, 137.0, 90.0, 71.0, 52.0, 41.0, 28.0, 19.0, 15.0, 12.0, 9.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00238800048828125, -0.0022989511489868164, -0.002209901809692383, -0.0021208524703979492, -0.0020318031311035156, -0.001942753791809082, -0.0018537044525146484, -0.0017646551132202148, -0.0016756057739257812, -0.0015865564346313477, -0.001497507095336914, -0.0014084577560424805, -0.0013194084167480469, -0.0012303590774536133, -0.0011413097381591797, -0.001052260398864746, -0.0009632110595703125, -0.0008741617202758789, -0.0007851123809814453, -0.0006960630416870117, -0.0006070137023925781, -0.0005179643630981445, -0.00042891502380371094, -0.00033986568450927734, -0.00025081634521484375, -0.00016176700592041016, -7.271766662597656e-05, 1.633167266845703e-05, 0.00010538101196289062, 0.00019443035125732422, 0.0002834796905517578, 0.0003725290298461914, 0.000461578369140625, 0.0005506277084350586, 0.0006396770477294922, 0.0007287263870239258, 0.0008177757263183594, 0.000906825065612793, 0.0009958744049072266, 0.0010849237442016602, 0.0011739730834960938, 0.0012630224227905273, 0.001352071762084961, 0.0014411211013793945, 0.0015301704406738281, 0.0016192197799682617, 0.0017082691192626953, 0.001797318458557129, 0.0018863677978515625, 0.001975417137145996, 0.0020644664764404297, 0.0021535158157348633, 0.002242565155029297, 0.0023316144943237305, 0.002420663833618164, 0.0025097131729125977, 0.0025987625122070312, 0.002687811851501465, 0.0027768611907958984, 0.002865910530090332, 0.0029549598693847656, 0.0030440092086791992, 0.003133058547973633, 0.0032221078872680664, 0.0033111572265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 18.0, 14.0, 35.0, 82.0, 481.0, 4000.0, 1030560.0, 12066.0, 1026.0, 149.0, 43.0, 25.0, 20.0, 4.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-456.5, -443.33984375, -430.1796875, -417.01953125, -403.859375, -390.69921875, -377.5390625, -364.37890625, -351.21875, -338.05859375, -324.8984375, -311.73828125, -298.578125, -285.41796875, -272.2578125, -259.09765625, -245.9375, -232.77734375, -219.6171875, -206.45703125, -193.296875, -180.13671875, -166.9765625, -153.81640625, -140.65625, -127.49609375, -114.3359375, -101.17578125, -88.015625, -74.85546875, -61.6953125, -48.53515625, -35.375, -22.21484375, -9.0546875, 4.10546875, 17.265625, 30.42578125, 43.5859375, 56.74609375, 69.90625, 83.06640625, 96.2265625, 109.38671875, 122.546875, 135.70703125, 148.8671875, 162.02734375, 175.1875, 188.34765625, 201.5078125, 214.66796875, 227.828125, 240.98828125, 254.1484375, 267.30859375, 280.46875, 293.62890625, 306.7890625, 319.94921875, 333.109375, 346.26953125, 359.4296875, 372.58984375, 385.75]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 8.0, 15.0, 42.0, 147.0, 544.0, 149.0, 35.0, 13.0, 11.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-100.8125, -97.888671875, -94.96484375, -92.041015625, -89.1171875, -86.193359375, -83.26953125, -80.345703125, -77.421875, -74.498046875, -71.57421875, -68.650390625, -65.7265625, -62.802734375, -59.87890625, -56.955078125, -54.03125, -51.107421875, -48.18359375, -45.259765625, -42.3359375, -39.412109375, -36.48828125, -33.564453125, -30.640625, -27.716796875, -24.79296875, -21.869140625, -18.9453125, -16.021484375, -13.09765625, -10.173828125, -7.25, -4.326171875, -1.40234375, 1.521484375, 4.4453125, 7.369140625, 10.29296875, 13.216796875, 16.140625, 19.064453125, 21.98828125, 24.912109375, 27.8359375, 30.759765625, 33.68359375, 36.607421875, 39.53125, 42.455078125, 45.37890625, 48.302734375, 51.2265625, 54.150390625, 57.07421875, 59.998046875, 62.921875, 65.845703125, 68.76953125, 71.693359375, 74.6171875, 77.541015625, 80.46484375, 83.388671875, 86.3125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 11.0, 311.0, 610.0, 50.0, 15.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-386.14691162109375, -331.39495849609375, -276.64300537109375, -221.89105224609375, -167.13909912109375, -112.38714599609375, -57.63519287109375, -2.88323974609375, 51.86871337890625, 106.62066650390625, 161.37261962890625, 216.12457275390625, 270.87652587890625, 325.62847900390625, 380.38043212890625, 435.13238525390625, 489.88433837890625, 544.6362915039062, 599.3882446289062, 654.1401977539062, 708.8921508789062, 763.6441040039062, 818.3960571289062, 873.1480102539062, 927.8999633789062, 982.6519165039062, 1037.40380859375, 1092.15576171875, 1146.90771484375, 1201.65966796875, 1256.41162109375, 1311.16357421875, 1365.91552734375, 1420.66748046875, 1475.41943359375, 1530.17138671875, 1584.92333984375, 1639.67529296875, 1694.42724609375, 1749.17919921875, 1803.93115234375, 1858.68310546875, 1913.43505859375, 1968.18701171875, 2022.93896484375, 2077.69091796875, 2132.44287109375, 2187.19482421875, 2241.94677734375, 2296.69873046875, 2351.45068359375, 2406.20263671875, 2460.95458984375, 2515.70654296875, 2570.45849609375, 2625.21044921875, 2679.96240234375, 2734.71435546875, 2789.46630859375, 2844.21826171875, 2898.97021484375, 2953.72216796875, 3008.47412109375, 3063.22607421875, 3117.97802734375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 14.0, 31.0, 31.0, 44.0, 60.0, 98.0, 92.0, 97.0, 100.0, 88.0, 94.0, 73.0, 58.0, 47.0, 34.0, 14.0, 12.0, 10.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-522.893798828125, -507.7615661621094, -492.6293640136719, -477.49713134765625, -462.36492919921875, -447.2326965332031, -432.1004638671875, -416.96826171875, -401.8360595703125, -386.7038269042969, -371.5716247558594, -356.43939208984375, -341.30718994140625, -326.1749572753906, -311.042724609375, -295.9105224609375, -280.7782897949219, -265.64605712890625, -250.51385498046875, -235.38162231445312, -220.24942016601562, -205.1171875, -189.98497009277344, -174.85275268554688, -159.7205352783203, -144.58831787109375, -129.4561004638672, -114.3238754272461, -99.19165802001953, -84.05944061279297, -68.92721557617188, -53.79499816894531, -38.662811279296875, -23.53059196472168, -8.398372650146484, 6.733848571777344, 21.866065979003906, 36.99828338623047, 52.13050842285156, 67.26272583007812, 82.39494323730469, 97.52716064453125, 112.65937805175781, 127.7916030883789, 142.923828125, 158.0560302734375, 173.18826293945312, 188.3204803466797, 203.45269775390625, 218.5849151611328, 233.71713256835938, 248.849365234375, 263.9815673828125, 279.1138000488281, 294.24603271484375, 309.37823486328125, 324.51043701171875, 339.6426696777344, 354.7748718261719, 369.9071044921875, 385.039306640625, 400.1715393066406, 415.30377197265625, 430.43597412109375, 445.5682067871094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 11.0, 40.0, 108.0, 527.0, 4815.0, 4187837.0, 713.0, 184.0, 35.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-1503.0, -1475.30078125, -1447.6015625, -1419.90234375, -1392.203125, -1364.50390625, -1336.8046875, -1309.10546875, -1281.40625, -1253.70703125, -1226.0078125, -1198.30859375, -1170.609375, -1142.91015625, -1115.2109375, -1087.51171875, -1059.8125, -1032.11328125, -1004.4140625, -976.71484375, -949.015625, -921.31640625, -893.6171875, -865.91796875, -838.21875, -810.51953125, -782.8203125, -755.12109375, -727.421875, -699.72265625, -672.0234375, -644.32421875, -616.625, -588.92578125, -561.2265625, -533.52734375, -505.828125, -478.12890625, -450.4296875, -422.73046875, -395.03125, -367.33203125, -339.6328125, -311.93359375, -284.234375, -256.53515625, -228.8359375, -201.13671875, -173.4375, -145.73828125, -118.0390625, -90.33984375, -62.640625, -34.94140625, -7.2421875, 20.45703125, 48.15625, 75.85546875, 103.5546875, 131.25390625, 158.953125, 186.65234375, 214.3515625, 242.05078125, 269.75]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 13.0, 24.0, 119.0, 235.0, 253.0, 208.0, 109.0, 38.0, 14.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.5, -36.79803466796875, -36.0960693359375, -35.39410400390625, -34.692138671875, -33.99017333984375, -33.2882080078125, -32.58624267578125, -31.88427734375, -31.18231201171875, -30.4803466796875, -29.77838134765625, -29.076416015625, -28.37445068359375, -27.6724853515625, -26.97052001953125, -26.2685546875, -25.56658935546875, -24.8646240234375, -24.16265869140625, -23.460693359375, -22.75872802734375, -22.0567626953125, -21.35479736328125, -20.65283203125, -19.95086669921875, -19.2489013671875, -18.54693603515625, -17.844970703125, -17.14300537109375, -16.4410400390625, -15.73907470703125, -15.037109375, -14.33514404296875, -13.6331787109375, -12.93121337890625, -12.229248046875, -11.52728271484375, -10.8253173828125, -10.12335205078125, -9.42138671875, -8.71942138671875, -8.0174560546875, -7.31549072265625, -6.613525390625, -5.91156005859375, -5.2095947265625, -4.50762939453125, -3.8056640625, -3.10369873046875, -2.4017333984375, -1.69976806640625, -0.997802734375, -0.29583740234375, 0.4061279296875, 1.10809326171875, 1.81005859375, 2.51202392578125, 3.2139892578125, 3.91595458984375, 4.617919921875, 5.31988525390625, 6.0218505859375, 6.72381591796875, 7.42578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 17.0, 91.0, 218.0, 380.0, 1836.0, 4191208.0, 284.0, 162.0, 68.0, 14.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3990.0, -3910.484375, -3830.96875, -3751.453125, -3671.9375, -3592.421875, -3512.90625, -3433.390625, -3353.875, -3274.359375, -3194.84375, -3115.328125, -3035.8125, -2956.296875, -2876.78125, -2797.265625, -2717.75, -2638.234375, -2558.71875, -2479.203125, -2399.6875, -2320.171875, -2240.65625, -2161.140625, -2081.625, -2002.109375, -1922.59375, -1843.078125, -1763.5625, -1684.046875, -1604.53125, -1525.015625, -1445.5, -1365.984375, -1286.46875, -1206.953125, -1127.4375, -1047.921875, -968.40625, -888.890625, -809.375, -729.859375, -650.34375, -570.828125, -491.3125, -411.796875, -332.28125, -252.765625, -173.25, -93.734375, -14.21875, 65.296875, 144.8125, 224.328125, 303.84375, 383.359375, 462.875, 542.390625, 621.90625, 701.421875, 780.9375, 860.453125, 939.96875, 1019.484375, 1099.0]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 20.0, 146.0, 3836.0, 74.0, 9.0, 3.0, 2.0], "bins": [-268.5, -263.98583984375, -259.4716796875, -254.95751953125, -250.443359375, -245.92919921875, -241.4150390625, -236.90087890625, -232.38671875, -227.87255859375, -223.3583984375, -218.84423828125, -214.330078125, -209.81591796875, -205.3017578125, -200.78759765625, -196.2734375, -191.75927734375, -187.2451171875, -182.73095703125, -178.216796875, -173.70263671875, -169.1884765625, -164.67431640625, -160.16015625, -155.64599609375, -151.1318359375, -146.61767578125, -142.103515625, -137.58935546875, -133.0751953125, -128.56103515625, -124.046875, -119.53271484375, -115.0185546875, -110.50439453125, -105.990234375, -101.47607421875, -96.9619140625, -92.44775390625, -87.93359375, -83.41943359375, -78.9052734375, -74.39111328125, -69.876953125, -65.36279296875, -60.8486328125, -56.33447265625, -51.8203125, -47.30615234375, -42.7919921875, -38.27783203125, -33.763671875, -29.24951171875, -24.7353515625, -20.22119140625, -15.70703125, -11.19287109375, -6.6787109375, -2.16455078125, 2.349609375, 6.86376953125, 11.3779296875, 15.89208984375, 20.40625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 92.0, 863.0, 44.0, 4.0, 3.0], "bins": [-4584.515625, -4508.68115234375, -4432.84716796875, -4357.0126953125, -4281.1787109375, -4205.34423828125, -4129.509765625, -4053.67578125, -3977.841552734375, -3902.00732421875, -3826.173095703125, -3750.3388671875, -3674.50439453125, -3598.670166015625, -3522.8359375, -3447.001708984375, -3371.16748046875, -3295.333251953125, -3219.4990234375, -3143.66455078125, -3067.830322265625, -2991.99609375, -2916.161865234375, -2840.32763671875, -2764.4931640625, -2688.658935546875, -2612.82470703125, -2536.990234375, -2461.156005859375, -2385.32177734375, -2309.487548828125, -2233.6533203125, -2157.81884765625, -2081.984619140625, -2006.1502685546875, -1930.3160400390625, -1854.4818115234375, -1778.6474609375, -1702.813232421875, -1626.97900390625, -1551.144775390625, -1475.310546875, -1399.4761962890625, -1323.6419677734375, -1247.8077392578125, -1171.973388671875, -1096.13916015625, -1020.304931640625, -944.4706420898438, -868.6363525390625, -792.8021240234375, -716.9678344726562, -641.133544921875, -565.29931640625, -489.46502685546875, -413.63079833984375, -337.7965087890625, -261.9622497558594, -186.1279754638672, -110.293701171875, -34.459442138671875, 41.37481689453125, 117.2091064453125, 193.0433349609375, 268.87762451171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 16.0, 31.0, 57.0, 96.0, 153.0, 176.0, 164.0, 121.0, 85.0, 53.0, 26.0, 12.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-705.514892578125, -679.2584838867188, -653.0021362304688, -626.7457275390625, -600.4893188476562, -574.2329711914062, -547.9765625, -521.72021484375, -495.46380615234375, -469.2074279785156, -442.9510192871094, -416.69464111328125, -390.4382629394531, -364.181884765625, -337.92547607421875, -311.6690979003906, -285.4126892089844, -259.15631103515625, -232.89991760253906, -206.64352416992188, -180.38714599609375, -154.13075256347656, -127.87435913085938, -101.61798095703125, -75.36158752441406, -49.105201721191406, -22.848812103271484, 3.4075775146484375, 29.663963317871094, 55.92034912109375, 82.17674255371094, 108.43312072753906, 134.68951416015625, 160.94590759277344, 187.20228576660156, 213.45867919921875, 239.71505737304688, 265.971435546875, 292.22784423828125, 318.4842224121094, 344.7406005859375, 370.9969787597656, 397.2533874511719, 423.509765625, 449.7661437988281, 476.02252197265625, 502.2789306640625, 528.5352783203125, 554.791748046875, 581.0481567382812, 607.3045043945312, 633.5609130859375, 659.8173217773438, 686.0736694335938, 712.330078125, 738.58642578125, 764.8428344726562, 791.0992431640625, 817.3555908203125, 843.6119995117188, 869.868408203125, 896.124755859375, 922.3811645507812, 948.6375732421875, 974.8939208984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 10.0, 12.0, 16.0, 9.0, 22.0, 35.0, 46.0, 67.0, 97.0, 205.0, 457.0, 1229.0, 5117.0, 62071.0, 911937.0, 59836.0, 5098.0, 1314.0, 453.0, 195.0, 107.0, 61.0, 42.0, 41.0, 23.0, 16.0, 12.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-296.0, -286.6015625, -277.203125, -267.8046875, -258.40625, -249.0078125, -239.609375, -230.2109375, -220.8125, -211.4140625, -202.015625, -192.6171875, -183.21875, -173.8203125, -164.421875, -155.0234375, -145.625, -136.2265625, -126.828125, -117.4296875, -108.03125, -98.6328125, -89.234375, -79.8359375, -70.4375, -61.0390625, -51.640625, -42.2421875, -32.84375, -23.4453125, -14.046875, -4.6484375, 4.75, 14.1484375, 23.546875, 32.9453125, 42.34375, 51.7421875, 61.140625, 70.5390625, 79.9375, 89.3359375, 98.734375, 108.1328125, 117.53125, 126.9296875, 136.328125, 145.7265625, 155.125, 164.5234375, 173.921875, 183.3203125, 192.71875, 202.1171875, 211.515625, 220.9140625, 230.3125, 239.7109375, 249.109375, 258.5078125, 267.90625, 277.3046875, 286.703125, 296.1015625, 305.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 21.0, 48.0, 67.0, 100.0, 132.0, 171.0, 150.0, 114.0, 85.0, 55.0, 29.0, 13.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -50.194091796875, -49.04443359375, -47.894775390625, -46.7451171875, -45.595458984375, -44.44580078125, -43.296142578125, -42.146484375, -40.996826171875, -39.84716796875, -38.697509765625, -37.5478515625, -36.398193359375, -35.24853515625, -34.098876953125, -32.94921875, -31.799560546875, -30.64990234375, -29.500244140625, -28.3505859375, -27.200927734375, -26.05126953125, -24.901611328125, -23.751953125, -22.602294921875, -21.45263671875, -20.302978515625, -19.1533203125, -18.003662109375, -16.85400390625, -15.704345703125, -14.5546875, -13.405029296875, -12.25537109375, -11.105712890625, -9.9560546875, -8.806396484375, -7.65673828125, -6.507080078125, -5.357421875, -4.207763671875, -3.05810546875, -1.908447265625, -0.7587890625, 0.390869140625, 1.54052734375, 2.690185546875, 3.83984375, 4.989501953125, 6.13916015625, 7.288818359375, 8.4384765625, 9.588134765625, 10.73779296875, 11.887451171875, 13.037109375, 14.186767578125, 15.33642578125, 16.486083984375, 17.6357421875, 18.785400390625, 19.93505859375, 21.084716796875, 22.234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 12.0, 10.0, 19.0, 22.0, 29.0, 40.0, 82.0, 154.0, 314.0, 996.0, 5738.0, 220476.0, 807275.0, 11144.0, 1349.0, 415.0, 183.0, 85.0, 52.0, 44.0, 25.0, 18.0, 10.0, 10.0, 6.0, 2.0, 6.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.5, -296.072265625, -287.64453125, -279.216796875, -270.7890625, -262.361328125, -253.93359375, -245.505859375, -237.078125, -228.650390625, -220.22265625, -211.794921875, -203.3671875, -194.939453125, -186.51171875, -178.083984375, -169.65625, -161.228515625, -152.80078125, -144.373046875, -135.9453125, -127.517578125, -119.08984375, -110.662109375, -102.234375, -93.806640625, -85.37890625, -76.951171875, -68.5234375, -60.095703125, -51.66796875, -43.240234375, -34.8125, -26.384765625, -17.95703125, -9.529296875, -1.1015625, 7.326171875, 15.75390625, 24.181640625, 32.609375, 41.037109375, 49.46484375, 57.892578125, 66.3203125, 74.748046875, 83.17578125, 91.603515625, 100.03125, 108.458984375, 116.88671875, 125.314453125, 133.7421875, 142.169921875, 150.59765625, 159.025390625, 167.453125, 175.880859375, 184.30859375, 192.736328125, 201.1640625, 209.591796875, 218.01953125, 226.447265625, 234.875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 7.0, 9.0, 13.0, 18.0, 26.0, 25.0, 37.0, 36.0, 49.0, 64.0, 65.0, 67.0, 86.0, 67.0, 66.0, 64.0, 46.0, 38.0, 38.0, 38.0, 35.0, 20.0, 14.0, 11.0, 10.0, 6.0, 5.0, 4.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-90.625, -88.171875, -85.71875, -83.265625, -80.8125, -78.359375, -75.90625, -73.453125, -71.0, -68.546875, -66.09375, -63.640625, -61.1875, -58.734375, -56.28125, -53.828125, -51.375, -48.921875, -46.46875, -44.015625, -41.5625, -39.109375, -36.65625, -34.203125, -31.75, -29.296875, -26.84375, -24.390625, -21.9375, -19.484375, -17.03125, -14.578125, -12.125, -9.671875, -7.21875, -4.765625, -2.3125, 0.140625, 2.59375, 5.046875, 7.5, 9.953125, 12.40625, 14.859375, 17.3125, 19.765625, 22.21875, 24.671875, 27.125, 29.578125, 32.03125, 34.484375, 36.9375, 39.390625, 41.84375, 44.296875, 46.75, 49.203125, 51.65625, 54.109375, 56.5625, 59.015625, 61.46875, 63.921875, 66.375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 14.0, 18.0, 28.0, 49.0, 73.0, 125.0, 268.0, 640.0, 2181.0, 14580.0, 808907.0, 211367.0, 7702.0, 1522.0, 525.0, 225.0, 102.0, 72.0, 36.0, 25.0, 18.0, 15.0, 11.0, 7.0, 11.0, 1.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-156.0, -151.9853515625, -147.970703125, -143.9560546875, -139.94140625, -135.9267578125, -131.912109375, -127.8974609375, -123.8828125, -119.8681640625, -115.853515625, -111.8388671875, -107.82421875, -103.8095703125, -99.794921875, -95.7802734375, -91.765625, -87.7509765625, -83.736328125, -79.7216796875, -75.70703125, -71.6923828125, -67.677734375, -63.6630859375, -59.6484375, -55.6337890625, -51.619140625, -47.6044921875, -43.58984375, -39.5751953125, -35.560546875, -31.5458984375, -27.53125, -23.5166015625, -19.501953125, -15.4873046875, -11.47265625, -7.4580078125, -3.443359375, 0.5712890625, 4.5859375, 8.6005859375, 12.615234375, 16.6298828125, 20.64453125, 24.6591796875, 28.673828125, 32.6884765625, 36.703125, 40.7177734375, 44.732421875, 48.7470703125, 52.76171875, 56.7763671875, 60.791015625, 64.8056640625, 68.8203125, 72.8349609375, 76.849609375, 80.8642578125, 84.87890625, 88.8935546875, 92.908203125, 96.9228515625, 100.9375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 6.0, 7.0, 4.0, 7.0, 20.0, 14.0, 17.0, 27.0, 58.0, 61.0, 90.0, 111.0, 124.0, 119.0, 91.0, 62.0, 47.0, 42.0, 20.0, 25.0, 14.0, 11.0, 8.0, 4.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038967132568359375, -0.003754168748855591, -0.003611624240875244, -0.0034690797328948975, -0.0033265352249145508, -0.003183990716934204, -0.0030414462089538574, -0.0028989017009735107, -0.002756357192993164, -0.0026138126850128174, -0.0024712681770324707, -0.002328723669052124, -0.0021861791610717773, -0.0020436346530914307, -0.001901090145111084, -0.0017585456371307373, -0.0016160011291503906, -0.001473456621170044, -0.0013309121131896973, -0.0011883676052093506, -0.001045823097229004, -0.0009032785892486572, -0.0007607340812683105, -0.0006181895732879639, -0.0004756450653076172, -0.0003331005573272705, -0.00019055604934692383, -4.801154136657715e-05, 9.453296661376953e-05, 0.0002370774745941162, 0.0003796219825744629, 0.0005221664905548096, 0.0006647109985351562, 0.0008072555065155029, 0.0009498000144958496, 0.0010923445224761963, 0.001234889030456543, 0.0013774335384368896, 0.0015199780464172363, 0.001662522554397583, 0.0018050670623779297, 0.0019476115703582764, 0.002090156078338623, 0.0022327005863189697, 0.0023752450942993164, 0.002517789602279663, 0.0026603341102600098, 0.0028028786182403564, 0.002945423126220703, 0.00308796763420105, 0.0032305121421813965, 0.003373056650161743, 0.00351560115814209, 0.0036581456661224365, 0.003800690174102783, 0.00394323468208313, 0.0040857791900634766, 0.004228323698043823, 0.00437086820602417, 0.004513412714004517, 0.004655957221984863, 0.00479850172996521, 0.004941046237945557, 0.005083590745925903, 0.00522613525390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 10.0, 10.0, 18.0, 32.0, 55.0, 80.0, 181.0, 437.0, 1897.0, 20198.0, 955979.0, 65342.0, 3193.0, 618.0, 207.0, 114.0, 42.0, 38.0, 26.0, 19.0, 12.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.0, -120.2021484375, -116.404296875, -112.6064453125, -108.80859375, -105.0107421875, -101.212890625, -97.4150390625, -93.6171875, -89.8193359375, -86.021484375, -82.2236328125, -78.42578125, -74.6279296875, -70.830078125, -67.0322265625, -63.234375, -59.4365234375, -55.638671875, -51.8408203125, -48.04296875, -44.2451171875, -40.447265625, -36.6494140625, -32.8515625, -29.0537109375, -25.255859375, -21.4580078125, -17.66015625, -13.8623046875, -10.064453125, -6.2666015625, -2.46875, 1.3291015625, 5.126953125, 8.9248046875, 12.72265625, 16.5205078125, 20.318359375, 24.1162109375, 27.9140625, 31.7119140625, 35.509765625, 39.3076171875, 43.10546875, 46.9033203125, 50.701171875, 54.4990234375, 58.296875, 62.0947265625, 65.892578125, 69.6904296875, 73.48828125, 77.2861328125, 81.083984375, 84.8818359375, 88.6796875, 92.4775390625, 96.275390625, 100.0732421875, 103.87109375, 107.6689453125, 111.466796875, 115.2646484375, 119.0625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 3.0, 5.0, 11.0, 15.0, 17.0, 29.0, 27.0, 65.0, 88.0, 104.0, 113.0, 151.0, 118.0, 69.0, 51.0, 34.0, 17.0, 18.0, 15.0, 11.0, 7.0, 8.0, 6.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.66748046875, -35.5537109375, -34.43994140625, -33.326171875, -32.21240234375, -31.0986328125, -29.98486328125, -28.87109375, -27.75732421875, -26.6435546875, -25.52978515625, -24.416015625, -23.30224609375, -22.1884765625, -21.07470703125, -19.9609375, -18.84716796875, -17.7333984375, -16.61962890625, -15.505859375, -14.39208984375, -13.2783203125, -12.16455078125, -11.05078125, -9.93701171875, -8.8232421875, -7.70947265625, -6.595703125, -5.48193359375, -4.3681640625, -3.25439453125, -2.140625, -1.02685546875, 0.0869140625, 1.20068359375, 2.314453125, 3.42822265625, 4.5419921875, 5.65576171875, 6.76953125, 7.88330078125, 8.9970703125, 10.11083984375, 11.224609375, 12.33837890625, 13.4521484375, 14.56591796875, 15.6796875, 16.79345703125, 17.9072265625, 19.02099609375, 20.134765625, 21.24853515625, 22.3623046875, 23.47607421875, 24.58984375, 25.70361328125, 26.8173828125, 27.93115234375, 29.044921875, 30.15869140625, 31.2724609375, 32.38623046875, 33.5]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 10.0, 42.0, 511.0, 386.0, 39.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-359.887451171875, -297.334716796875, -234.781982421875, -172.22923278808594, -109.67649841308594, -47.123748779296875, 15.428985595703125, 77.98171997070312, 140.53445434570312, 203.08718872070312, 265.6399230957031, 328.19268798828125, 390.74542236328125, 453.29815673828125, 515.8508911132812, 578.4036254882812, 640.9563598632812, 703.5090942382812, 766.0618286132812, 828.6145629882812, 891.1672973632812, 953.7200927734375, 1016.2728271484375, 1078.8255615234375, 1141.3782958984375, 1203.9310302734375, 1266.4837646484375, 1329.0364990234375, 1391.5892333984375, 1454.1419677734375, 1516.6947021484375, 1579.2474365234375, 1641.8001708984375, 1704.3529052734375, 1766.9056396484375, 1829.4583740234375, 1892.0111083984375, 1954.5638427734375, 2017.1165771484375, 2079.66943359375, 2142.22216796875, 2204.77490234375, 2267.32763671875, 2329.88037109375, 2392.43310546875, 2454.98583984375, 2517.53857421875, 2580.09130859375, 2642.64404296875, 2705.19677734375, 2767.74951171875, 2830.30224609375, 2892.85498046875, 2955.40771484375, 3017.96044921875, 3080.51318359375, 3143.06591796875, 3205.61865234375, 3268.17138671875, 3330.72412109375, 3393.27685546875, 3455.82958984375, 3518.38232421875, 3580.93505859375, 3643.48779296875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 0.0, 7.0, 7.0, 10.0, 14.0, 18.0, 25.0, 33.0, 49.0, 60.0, 72.0, 65.0, 71.0, 68.0, 63.0, 68.0, 70.0, 63.0, 48.0, 45.0, 35.0, 33.0, 29.0, 9.0, 14.0, 10.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-674.919921875, -657.9329833984375, -640.946044921875, -623.9590454101562, -606.9721069335938, -589.9851684570312, -572.9981689453125, -556.01123046875, -539.0242919921875, -522.037353515625, -505.0503845214844, -488.06341552734375, -471.07647705078125, -454.08953857421875, -437.1025695800781, -420.1156005859375, -403.128662109375, -386.1417236328125, -369.1547546386719, -352.16778564453125, -335.18084716796875, -318.19390869140625, -301.2069396972656, -284.219970703125, -267.2330322265625, -250.24607849121094, -233.25912475585938, -216.2721710205078, -199.28521728515625, -182.2982635498047, -165.31130981445312, -148.32435607910156, -131.33746337890625, -114.35050964355469, -97.36355590820312, -80.37660217285156, -63.3896484375, -46.40269470214844, -29.415740966796875, -12.428787231445312, 4.55816650390625, 21.545120239257812, 38.532073974609375, 55.51902770996094, 72.5059814453125, 89.49293518066406, 106.47988891601562, 123.46684265136719, 140.45379638671875, 157.4407501220703, 174.42770385742188, 191.41465759277344, 208.401611328125, 225.38856506347656, 242.37551879882812, 259.36248779296875, 276.34942626953125, 293.33636474609375, 310.3233337402344, 327.310302734375, 344.2972412109375, 361.2841796875, 378.2711486816406, 395.25811767578125, 412.24505615234375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 27.0, 51.0, 98.0, 226.0, 620.0, 6402.0, 4177150.0, 9194.0, 302.0, 104.0, 55.0, 20.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0], "bins": [-1128.0, -1106.537109375, -1085.07421875, -1063.611328125, -1042.1484375, -1020.685546875, -999.22265625, -977.759765625, -956.296875, -934.833984375, -913.37109375, -891.908203125, -870.4453125, -848.982421875, -827.51953125, -806.056640625, -784.59375, -763.130859375, -741.66796875, -720.205078125, -698.7421875, -677.279296875, -655.81640625, -634.353515625, -612.890625, -591.427734375, -569.96484375, -548.501953125, -527.0390625, -505.576171875, -484.11328125, -462.650390625, -441.1875, -419.724609375, -398.26171875, -376.798828125, -355.3359375, -333.873046875, -312.41015625, -290.947265625, -269.484375, -248.021484375, -226.55859375, -205.095703125, -183.6328125, -162.169921875, -140.70703125, -119.244140625, -97.78125, -76.318359375, -54.85546875, -33.392578125, -11.9296875, 9.533203125, 30.99609375, 52.458984375, 73.921875, 95.384765625, 116.84765625, 138.310546875, 159.7734375, 181.236328125, 202.69921875, 224.162109375, 245.625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 11.0, 21.0, 24.0, 67.0, 85.0, 101.0, 127.0, 146.0, 158.0, 87.0, 72.0, 58.0, 22.0, 10.0, 12.0, 1.0, 5.0, 2.0, 3.0], "bins": [-52.875, -51.8634033203125, -50.851806640625, -49.8402099609375, -48.82861328125, -47.8170166015625, -46.805419921875, -45.7938232421875, -44.7822265625, -43.7706298828125, -42.759033203125, -41.7474365234375, -40.73583984375, -39.7242431640625, -38.712646484375, -37.7010498046875, -36.689453125, -35.6778564453125, -34.666259765625, -33.6546630859375, -32.64306640625, -31.6314697265625, -30.619873046875, -29.6082763671875, -28.5966796875, -27.5850830078125, -26.573486328125, -25.5618896484375, -24.55029296875, -23.5386962890625, -22.527099609375, -21.5155029296875, -20.50390625, -19.4923095703125, -18.480712890625, -17.4691162109375, -16.45751953125, -15.4459228515625, -14.434326171875, -13.4227294921875, -12.4111328125, -11.3995361328125, -10.387939453125, -9.3763427734375, -8.36474609375, -7.3531494140625, -6.341552734375, -5.3299560546875, -4.318359375, -3.3067626953125, -2.295166015625, -1.2835693359375, -0.27197265625, 0.7396240234375, 1.751220703125, 2.7628173828125, 3.7744140625, 4.7860107421875, 5.797607421875, 6.8092041015625, 7.82080078125, 8.8323974609375, 9.843994140625, 10.8555908203125, 11.8671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 11.0, 33.0, 96.0, 421.0, 4309.0, 4188626.0, 650.0, 102.0, 21.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2888.0, -2831.6875, -2775.375, -2719.0625, -2662.75, -2606.4375, -2550.125, -2493.8125, -2437.5, -2381.1875, -2324.875, -2268.5625, -2212.25, -2155.9375, -2099.625, -2043.3125, -1987.0, -1930.6875, -1874.375, -1818.0625, -1761.75, -1705.4375, -1649.125, -1592.8125, -1536.5, -1480.1875, -1423.875, -1367.5625, -1311.25, -1254.9375, -1198.625, -1142.3125, -1086.0, -1029.6875, -973.375, -917.0625, -860.75, -804.4375, -748.125, -691.8125, -635.5, -579.1875, -522.875, -466.5625, -410.25, -353.9375, -297.625, -241.3125, -185.0, -128.6875, -72.375, -16.0625, 40.25, 96.5625, 152.875, 209.1875, 265.5, 321.8125, 378.125, 434.4375, 490.75, 547.0625, 603.375, 659.6875, 716.0]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 17.0, 57.0, 204.0, 3387.0, 343.0, 51.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.5, -181.91162109375, -178.3232421875, -174.73486328125, -171.146484375, -167.55810546875, -163.9697265625, -160.38134765625, -156.79296875, -153.20458984375, -149.6162109375, -146.02783203125, -142.439453125, -138.85107421875, -135.2626953125, -131.67431640625, -128.0859375, -124.49755859375, -120.9091796875, -117.32080078125, -113.732421875, -110.14404296875, -106.5556640625, -102.96728515625, -99.37890625, -95.79052734375, -92.2021484375, -88.61376953125, -85.025390625, -81.43701171875, -77.8486328125, -74.26025390625, -70.671875, -67.08349609375, -63.4951171875, -59.90673828125, -56.318359375, -52.72998046875, -49.1416015625, -45.55322265625, -41.96484375, -38.37646484375, -34.7880859375, -31.19970703125, -27.611328125, -24.02294921875, -20.4345703125, -16.84619140625, -13.2578125, -9.66943359375, -6.0810546875, -2.49267578125, 1.095703125, 4.68408203125, 8.2724609375, 11.86083984375, 15.44921875, 19.03759765625, 22.6259765625, 26.21435546875, 29.802734375, 33.39111328125, 36.9794921875, 40.56787109375, 44.15625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 20.0, 261.0, 690.0, 25.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1611.473388671875, -1559.8580322265625, -1508.2427978515625, -1456.62744140625, -1405.0120849609375, -1353.396728515625, -1301.781494140625, -1250.1661376953125, -1198.55078125, -1146.9354248046875, -1095.3201904296875, -1043.704833984375, -992.0894775390625, -940.4741821289062, -888.85888671875, -837.2435302734375, -785.6282958984375, -734.0130004882812, -682.3976440429688, -630.7823486328125, -579.1669921875, -527.5516967773438, -475.9364013671875, -424.3210754394531, -372.70574951171875, -321.0904235839844, -269.47509765625, -217.85980224609375, -166.24447631835938, -114.629150390625, -63.01385498046875, -11.398529052734375, 40.2166748046875, 91.83199310302734, 143.4473114013672, 195.0626220703125, 246.67794799804688, 298.29327392578125, 349.9085693359375, 401.5238952636719, 453.13922119140625, 504.7545471191406, 556.369873046875, 607.9851684570312, 659.6004638671875, 711.2158203125, 762.8311157226562, 814.4464111328125, 866.061767578125, 917.6770629882812, 969.2924194335938, 1020.90771484375, 1072.5230712890625, 1124.138427734375, 1175.753662109375, 1227.3690185546875, 1278.984375, 1330.5997314453125, 1382.2149658203125, 1433.830322265625, 1485.4456787109375, 1537.06103515625, 1588.67626953125, 1640.2916259765625, 1691.9068603515625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 18.0, 28.0, 41.0, 64.0, 86.0, 102.0, 115.0, 111.0, 117.0, 104.0, 72.0, 47.0, 33.0, 32.0, 8.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-518.6447143554688, -504.4065246582031, -490.1683349609375, -475.9301452636719, -461.69195556640625, -447.4537658691406, -433.215576171875, -418.9773864746094, -404.73919677734375, -390.5010070800781, -376.2628173828125, -362.0246276855469, -347.78643798828125, -333.5482482910156, -319.31005859375, -305.0718688964844, -290.83367919921875, -276.5954895019531, -262.3572998046875, -248.11911010742188, -233.88092041015625, -219.64273071289062, -205.404541015625, -191.16635131835938, -176.92816162109375, -162.68997192382812, -148.4517822265625, -134.21359252929688, -119.97540283203125, -105.73721313476562, -91.4990234375, -77.26083374023438, -63.02264404296875, -48.784454345703125, -34.5462646484375, -20.308074951171875, -6.06988525390625, 8.168304443359375, 22.406494140625, 36.644683837890625, 50.88287353515625, 65.12106323242188, 79.3592529296875, 93.59744262695312, 107.83563232421875, 122.07382202148438, 136.31201171875, 150.55020141601562, 164.78839111328125, 179.02658081054688, 193.2647705078125, 207.50296020507812, 221.74114990234375, 235.97933959960938, 250.217529296875, 264.4557189941406, 278.69390869140625, 292.9320983886719, 307.1702880859375, 321.4084777832031, 335.64666748046875, 349.8848571777344, 364.123046875, 378.3612365722656, 392.59942626953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 7.0, 13.0, 10.0, 15.0, 15.0, 30.0, 29.0, 43.0, 60.0, 74.0, 116.0, 151.0, 296.0, 514.0, 1127.0, 3427.0, 14292.0, 92097.0, 748962.0, 158497.0, 21057.0, 4701.0, 1398.0, 636.0, 320.0, 191.0, 123.0, 92.0, 69.0, 38.0, 24.0, 39.0, 19.0, 15.0, 11.0, 9.0, 10.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.75, -147.412109375, -142.07421875, -136.736328125, -131.3984375, -126.060546875, -120.72265625, -115.384765625, -110.046875, -104.708984375, -99.37109375, -94.033203125, -88.6953125, -83.357421875, -78.01953125, -72.681640625, -67.34375, -62.005859375, -56.66796875, -51.330078125, -45.9921875, -40.654296875, -35.31640625, -29.978515625, -24.640625, -19.302734375, -13.96484375, -8.626953125, -3.2890625, 2.048828125, 7.38671875, 12.724609375, 18.0625, 23.400390625, 28.73828125, 34.076171875, 39.4140625, 44.751953125, 50.08984375, 55.427734375, 60.765625, 66.103515625, 71.44140625, 76.779296875, 82.1171875, 87.455078125, 92.79296875, 98.130859375, 103.46875, 108.806640625, 114.14453125, 119.482421875, 124.8203125, 130.158203125, 135.49609375, 140.833984375, 146.171875, 151.509765625, 156.84765625, 162.185546875, 167.5234375, 172.861328125, 178.19921875, 183.537109375, 188.875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 14.0, 25.0, 27.0, 47.0, 55.0, 103.0, 94.0, 127.0, 115.0, 127.0, 80.0, 65.0, 57.0, 33.0, 11.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.59375, -51.39599609375, -50.1982421875, -49.00048828125, -47.802734375, -46.60498046875, -45.4072265625, -44.20947265625, -43.01171875, -41.81396484375, -40.6162109375, -39.41845703125, -38.220703125, -37.02294921875, -35.8251953125, -34.62744140625, -33.4296875, -32.23193359375, -31.0341796875, -29.83642578125, -28.638671875, -27.44091796875, -26.2431640625, -25.04541015625, -23.84765625, -22.64990234375, -21.4521484375, -20.25439453125, -19.056640625, -17.85888671875, -16.6611328125, -15.46337890625, -14.265625, -13.06787109375, -11.8701171875, -10.67236328125, -9.474609375, -8.27685546875, -7.0791015625, -5.88134765625, -4.68359375, -3.48583984375, -2.2880859375, -1.09033203125, 0.107421875, 1.30517578125, 2.5029296875, 3.70068359375, 4.8984375, 6.09619140625, 7.2939453125, 8.49169921875, 9.689453125, 10.88720703125, 12.0849609375, 13.28271484375, 14.48046875, 15.67822265625, 16.8759765625, 18.07373046875, 19.271484375, 20.46923828125, 21.6669921875, 22.86474609375, 24.0625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 15.0, 16.0, 21.0, 25.0, 33.0, 62.0, 85.0, 155.0, 234.0, 479.0, 1108.0, 3509.0, 20793.0, 444114.0, 547965.0, 23783.0, 3789.0, 1144.0, 500.0, 253.0, 158.0, 99.0, 61.0, 40.0, 30.0, 20.0, 14.0, 11.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.0, -162.970703125, -156.94140625, -150.912109375, -144.8828125, -138.853515625, -132.82421875, -126.794921875, -120.765625, -114.736328125, -108.70703125, -102.677734375, -96.6484375, -90.619140625, -84.58984375, -78.560546875, -72.53125, -66.501953125, -60.47265625, -54.443359375, -48.4140625, -42.384765625, -36.35546875, -30.326171875, -24.296875, -18.267578125, -12.23828125, -6.208984375, -0.1796875, 5.849609375, 11.87890625, 17.908203125, 23.9375, 29.966796875, 35.99609375, 42.025390625, 48.0546875, 54.083984375, 60.11328125, 66.142578125, 72.171875, 78.201171875, 84.23046875, 90.259765625, 96.2890625, 102.318359375, 108.34765625, 114.376953125, 120.40625, 126.435546875, 132.46484375, 138.494140625, 144.5234375, 150.552734375, 156.58203125, 162.611328125, 168.640625, 174.669921875, 180.69921875, 186.728515625, 192.7578125, 198.787109375, 204.81640625, 210.845703125, 216.875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 1.0, 10.0, 15.0, 12.0, 13.0, 17.0, 25.0, 24.0, 31.0, 46.0, 49.0, 46.0, 67.0, 65.0, 67.0, 58.0, 56.0, 73.0, 42.0, 40.0, 49.0, 36.0, 34.0, 31.0, 24.0, 12.0, 18.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.0, -80.056640625, -77.11328125, -74.169921875, -71.2265625, -68.283203125, -65.33984375, -62.396484375, -59.453125, -56.509765625, -53.56640625, -50.623046875, -47.6796875, -44.736328125, -41.79296875, -38.849609375, -35.90625, -32.962890625, -30.01953125, -27.076171875, -24.1328125, -21.189453125, -18.24609375, -15.302734375, -12.359375, -9.416015625, -6.47265625, -3.529296875, -0.5859375, 2.357421875, 5.30078125, 8.244140625, 11.1875, 14.130859375, 17.07421875, 20.017578125, 22.9609375, 25.904296875, 28.84765625, 31.791015625, 34.734375, 37.677734375, 40.62109375, 43.564453125, 46.5078125, 49.451171875, 52.39453125, 55.337890625, 58.28125, 61.224609375, 64.16796875, 67.111328125, 70.0546875, 72.998046875, 75.94140625, 78.884765625, 81.828125, 84.771484375, 87.71484375, 90.658203125, 93.6015625, 96.544921875, 99.48828125, 102.431640625, 105.375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 21.0, 26.0, 42.0, 79.0, 192.0, 460.0, 1541.0, 8290.0, 137134.0, 864191.0, 31381.0, 3687.0, 897.0, 306.0, 137.0, 59.0, 41.0, 20.0, 12.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.5, -97.201171875, -94.90234375, -92.603515625, -90.3046875, -88.005859375, -85.70703125, -83.408203125, -81.109375, -78.810546875, -76.51171875, -74.212890625, -71.9140625, -69.615234375, -67.31640625, -65.017578125, -62.71875, -60.419921875, -58.12109375, -55.822265625, -53.5234375, -51.224609375, -48.92578125, -46.626953125, -44.328125, -42.029296875, -39.73046875, -37.431640625, -35.1328125, -32.833984375, -30.53515625, -28.236328125, -25.9375, -23.638671875, -21.33984375, -19.041015625, -16.7421875, -14.443359375, -12.14453125, -9.845703125, -7.546875, -5.248046875, -2.94921875, -0.650390625, 1.6484375, 3.947265625, 6.24609375, 8.544921875, 10.84375, 13.142578125, 15.44140625, 17.740234375, 20.0390625, 22.337890625, 24.63671875, 26.935546875, 29.234375, 31.533203125, 33.83203125, 36.130859375, 38.4296875, 40.728515625, 43.02734375, 45.326171875, 47.625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 10.0, 13.0, 9.0, 19.0, 27.0, 27.0, 41.0, 58.0, 55.0, 85.0, 76.0, 92.0, 86.0, 83.0, 62.0, 56.0, 40.0, 46.0, 25.0, 14.0, 14.0, 17.0, 9.0, 7.0, 7.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003284454345703125, -0.0031896233558654785, -0.003094792366027832, -0.0029999613761901855, -0.002905130386352539, -0.0028102993965148926, -0.002715468406677246, -0.0026206374168395996, -0.002525806427001953, -0.0024309754371643066, -0.00233614444732666, -0.0022413134574890137, -0.002146482467651367, -0.0020516514778137207, -0.0019568204879760742, -0.0018619894981384277, -0.0017671585083007812, -0.0016723275184631348, -0.0015774965286254883, -0.0014826655387878418, -0.0013878345489501953, -0.0012930035591125488, -0.0011981725692749023, -0.0011033415794372559, -0.0010085105895996094, -0.0009136795997619629, -0.0008188486099243164, -0.0007240176200866699, -0.0006291866302490234, -0.000534355640411377, -0.00043952465057373047, -0.000344693660736084, -0.0002498626708984375, -0.00015503168106079102, -6.020069122314453e-05, 3.463029861450195e-05, 0.00012946128845214844, 0.00022429227828979492, 0.0003191232681274414, 0.0004139542579650879, 0.0005087852478027344, 0.0006036162376403809, 0.0006984472274780273, 0.0007932782173156738, 0.0008881092071533203, 0.0009829401969909668, 0.0010777711868286133, 0.0011726021766662598, 0.0012674331665039062, 0.0013622641563415527, 0.0014570951461791992, 0.0015519261360168457, 0.0016467571258544922, 0.0017415881156921387, 0.0018364191055297852, 0.0019312500953674316, 0.002026081085205078, 0.0021209120750427246, 0.002215743064880371, 0.0023105740547180176, 0.002405405044555664, 0.0025002360343933105, 0.002595067024230957, 0.0026898980140686035, 0.00278472900390625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 12.0, 10.0, 7.0, 8.0, 21.0, 22.0, 41.0, 54.0, 80.0, 128.0, 242.0, 525.0, 1347.0, 4320.0, 22936.0, 410232.0, 572126.0, 28658.0, 5022.0, 1470.0, 603.0, 275.0, 134.0, 79.0, 41.0, 50.0, 29.0, 17.0, 12.0, 11.0, 6.0, 2.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.8349609375, -44.201171875, -42.5673828125, -40.93359375, -39.2998046875, -37.666015625, -36.0322265625, -34.3984375, -32.7646484375, -31.130859375, -29.4970703125, -27.86328125, -26.2294921875, -24.595703125, -22.9619140625, -21.328125, -19.6943359375, -18.060546875, -16.4267578125, -14.79296875, -13.1591796875, -11.525390625, -9.8916015625, -8.2578125, -6.6240234375, -4.990234375, -3.3564453125, -1.72265625, -0.0888671875, 1.544921875, 3.1787109375, 4.8125, 6.4462890625, 8.080078125, 9.7138671875, 11.34765625, 12.9814453125, 14.615234375, 16.2490234375, 17.8828125, 19.5166015625, 21.150390625, 22.7841796875, 24.41796875, 26.0517578125, 27.685546875, 29.3193359375, 30.953125, 32.5869140625, 34.220703125, 35.8544921875, 37.48828125, 39.1220703125, 40.755859375, 42.3896484375, 44.0234375, 45.6572265625, 47.291015625, 48.9248046875, 50.55859375, 52.1923828125, 53.826171875, 55.4599609375, 57.09375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 9.0, 14.0, 11.0, 11.0, 16.0, 19.0, 25.0, 47.0, 61.0, 69.0, 92.0, 108.0, 103.0, 94.0, 77.0, 56.0, 41.0, 25.0, 26.0, 17.0, 13.0, 17.0, 8.0, 3.0, 6.0, 2.0, 3.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.015625, -23.2109375, -22.40625, -21.6015625, -20.796875, -19.9921875, -19.1875, -18.3828125, -17.578125, -16.7734375, -15.96875, -15.1640625, -14.359375, -13.5546875, -12.75, -11.9453125, -11.140625, -10.3359375, -9.53125, -8.7265625, -7.921875, -7.1171875, -6.3125, -5.5078125, -4.703125, -3.8984375, -3.09375, -2.2890625, -1.484375, -0.6796875, 0.125, 0.9296875, 1.734375, 2.5390625, 3.34375, 4.1484375, 4.953125, 5.7578125, 6.5625, 7.3671875, 8.171875, 8.9765625, 9.78125, 10.5859375, 11.390625, 12.1953125, 13.0, 13.8046875, 14.609375, 15.4140625, 16.21875, 17.0234375, 17.828125, 18.6328125, 19.4375, 20.2421875, 21.046875, 21.8515625, 22.65625, 23.4609375, 24.265625, 25.0703125, 25.875, 26.6796875, 27.484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 10.0, 12.0, 77.0, 240.0, 437.0, 142.0, 53.0, 19.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-880.3253173828125, -842.2881469726562, -804.2509765625, -766.2138061523438, -728.1766357421875, -690.1395263671875, -652.1023559570312, -614.065185546875, -576.0280151367188, -537.9908447265625, -499.95367431640625, -461.9165344238281, -423.8793640136719, -385.8421936035156, -347.8050537109375, -309.76788330078125, -271.730712890625, -233.69354248046875, -195.65638732910156, -157.61923217773438, -119.58206176757812, -81.54489135742188, -43.50773620605469, -5.4705810546875, 32.56658935546875, 70.60375213623047, 108.64091491699219, 146.67807006835938, 184.71524047851562, 222.75241088867188, 260.78955078125, 298.82672119140625, 336.86376953125, 374.90093994140625, 412.9381103515625, 450.9752502441406, 489.0124206542969, 527.049560546875, 565.0867309570312, 603.1239013671875, 641.1610717773438, 679.1982421875, 717.2354125976562, 755.2725830078125, 793.3096923828125, 831.346923828125, 869.384033203125, 907.4212036132812, 945.4583740234375, 983.4955444335938, 1021.53271484375, 1059.56982421875, 1097.6070556640625, 1135.6441650390625, 1173.681396484375, 1211.718505859375, 1249.755615234375, 1287.792724609375, 1325.8299560546875, 1363.8670654296875, 1401.904296875, 1439.94140625, 1477.9786376953125, 1516.0157470703125, 1554.052978515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 24.0, 11.0, 24.0, 32.0, 56.0, 65.0, 44.0, 71.0, 66.0, 72.0, 64.0, 79.0, 76.0, 62.0, 52.0, 45.0, 33.0, 24.0, 16.0, 16.0, 18.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-536.2186279296875, -516.4986572265625, -496.7786560058594, -477.05865478515625, -457.33868408203125, -437.61871337890625, -417.8987121582031, -398.1787109375, -378.458740234375, -358.73876953125, -339.0187683105469, -319.29876708984375, -299.57879638671875, -279.85882568359375, -260.1388244628906, -240.41883850097656, -220.6988525390625, -200.97886657714844, -181.25888061523438, -161.5388946533203, -141.81890869140625, -122.09892272949219, -102.37893676757812, -82.65895080566406, -62.93896484375, -43.21897888183594, -23.498992919921875, -3.7790069580078125, 15.94097900390625, 35.66096496582031, 55.380950927734375, 75.10093688964844, 94.82098388671875, 114.54096984863281, 134.26095581054688, 153.98094177246094, 173.700927734375, 193.42091369628906, 213.14089965820312, 232.8608856201172, 252.58087158203125, 272.30084228515625, 292.0208435058594, 311.7408447265625, 331.4608154296875, 351.1807861328125, 370.9007873535156, 390.62078857421875, 410.34075927734375, 430.06072998046875, 449.7807312011719, 469.500732421875, 489.220703125, 508.940673828125, 528.66064453125, 548.3806762695312, 568.1006469726562, 587.8206176757812, 607.5406494140625, 627.2606201171875, 646.9805908203125, 666.7005615234375, 686.4205322265625, 706.1405639648438, 725.8605346679688]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 9.0, 12.0, 12.0, 34.0, 54.0, 93.0, 188.0, 418.0, 1088.0, 5166.0, 292746.0, 3885330.0, 7530.0, 1027.0, 317.0, 129.0, 58.0, 28.0, 11.0, 11.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-507.0, -495.7578125, -484.515625, -473.2734375, -462.03125, -450.7890625, -439.546875, -428.3046875, -417.0625, -405.8203125, -394.578125, -383.3359375, -372.09375, -360.8515625, -349.609375, -338.3671875, -327.125, -315.8828125, -304.640625, -293.3984375, -282.15625, -270.9140625, -259.671875, -248.4296875, -237.1875, -225.9453125, -214.703125, -203.4609375, -192.21875, -180.9765625, -169.734375, -158.4921875, -147.25, -136.0078125, -124.765625, -113.5234375, -102.28125, -91.0390625, -79.796875, -68.5546875, -57.3125, -46.0703125, -34.828125, -23.5859375, -12.34375, -1.1015625, 10.140625, 21.3828125, 32.625, 43.8671875, 55.109375, 66.3515625, 77.59375, 88.8359375, 100.078125, 111.3203125, 122.5625, 133.8046875, 145.046875, 156.2890625, 167.53125, 178.7734375, 190.015625, 201.2578125, 212.5]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 7.0, 22.0, 35.0, 53.0, 60.0, 98.0, 104.0, 120.0, 109.0, 115.0, 78.0, 62.0, 57.0, 37.0, 20.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.375, -50.1787109375, -48.982421875, -47.7861328125, -46.58984375, -45.3935546875, -44.197265625, -43.0009765625, -41.8046875, -40.6083984375, -39.412109375, -38.2158203125, -37.01953125, -35.8232421875, -34.626953125, -33.4306640625, -32.234375, -31.0380859375, -29.841796875, -28.6455078125, -27.44921875, -26.2529296875, -25.056640625, -23.8603515625, -22.6640625, -21.4677734375, -20.271484375, -19.0751953125, -17.87890625, -16.6826171875, -15.486328125, -14.2900390625, -13.09375, -11.8974609375, -10.701171875, -9.5048828125, -8.30859375, -7.1123046875, -5.916015625, -4.7197265625, -3.5234375, -2.3271484375, -1.130859375, 0.0654296875, 1.26171875, 2.4580078125, 3.654296875, 4.8505859375, 6.046875, 7.2431640625, 8.439453125, 9.6357421875, 10.83203125, 12.0283203125, 13.224609375, 14.4208984375, 15.6171875, 16.8134765625, 18.009765625, 19.2060546875, 20.40234375, 21.5986328125, 22.794921875, 23.9912109375, 25.1875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 12.0, 39.0, 65.0, 156.0, 1046.0, 4192110.0, 500.0, 143.0, 95.0, 46.0, 40.0, 17.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-876.0, -815.09375, -754.1875, -693.28125, -632.375, -571.46875, -510.5625, -449.65625, -388.75, -327.84375, -266.9375, -206.03125, -145.125, -84.21875, -23.3125, 37.59375, 98.5, 159.40625, 220.3125, 281.21875, 342.125, 403.03125, 463.9375, 524.84375, 585.75, 646.65625, 707.5625, 768.46875, 829.375, 890.28125, 951.1875, 1012.09375, 1073.0, 1133.90625, 1194.8125, 1255.71875, 1316.625, 1377.53125, 1438.4375, 1499.34375, 1560.25, 1621.15625, 1682.0625, 1742.96875, 1803.875, 1864.78125, 1925.6875, 1986.59375, 2047.5, 2108.40625, 2169.3125, 2230.21875, 2291.125, 2352.03125, 2412.9375, 2473.84375, 2534.75, 2595.65625, 2656.5625, 2717.46875, 2778.375, 2839.28125, 2900.1875, 2961.09375, 3022.0]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 28.0, 571.0, 3431.0, 50.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.625, -89.275390625, -81.92578125, -74.576171875, -67.2265625, -59.876953125, -52.52734375, -45.177734375, -37.828125, -30.478515625, -23.12890625, -15.779296875, -8.4296875, -1.080078125, 6.26953125, 13.619140625, 20.96875, 28.318359375, 35.66796875, 43.017578125, 50.3671875, 57.716796875, 65.06640625, 72.416015625, 79.765625, 87.115234375, 94.46484375, 101.814453125, 109.1640625, 116.513671875, 123.86328125, 131.212890625, 138.5625, 145.912109375, 153.26171875, 160.611328125, 167.9609375, 175.310546875, 182.66015625, 190.009765625, 197.359375, 204.708984375, 212.05859375, 219.408203125, 226.7578125, 234.107421875, 241.45703125, 248.806640625, 256.15625, 263.505859375, 270.85546875, 278.205078125, 285.5546875, 292.904296875, 300.25390625, 307.603515625, 314.953125, 322.302734375, 329.65234375, 337.001953125, 344.3515625, 351.701171875, 359.05078125, 366.400390625, 373.75]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 916.0, 80.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3067.76220703125, -2971.279296875, -2874.796142578125, -2778.313232421875, -2681.830078125, -2585.34716796875, -2488.8642578125, -2392.381103515625, -2295.89794921875, -2199.4150390625, -2102.931884765625, -2006.448974609375, -1909.9658203125, -1813.48291015625, -1716.9998779296875, -1620.516845703125, -1524.033935546875, -1427.5509033203125, -1331.06787109375, -1234.5849609375, -1138.101806640625, -1041.618896484375, -945.1358642578125, -848.65283203125, -752.1697998046875, -655.686767578125, -559.2037353515625, -462.72076416015625, -366.23773193359375, -269.75469970703125, -173.271728515625, -76.7886962890625, 19.6943359375, 116.17735290527344, 212.66036987304688, 309.14337158203125, 405.62640380859375, 502.10943603515625, 598.5924072265625, 695.075439453125, 791.5584716796875, 888.04150390625, 984.5245361328125, 1081.007568359375, 1177.490478515625, 1273.9736328125, 1370.45654296875, 1466.9395751953125, 1563.422607421875, 1659.9056396484375, 1756.388671875, 1852.87158203125, 1949.354736328125, 2045.837646484375, 2142.32080078125, 2238.8037109375, 2335.28662109375, 2431.76953125, 2528.252685546875, 2624.735595703125, 2721.21875, 2817.70166015625, 2914.1845703125, 3010.667724609375, 3107.15087890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 12.0, 36.0, 62.0, 109.0, 157.0, 200.0, 187.0, 110.0, 73.0, 37.0, 13.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-675.1411743164062, -657.6409301757812, -640.1406860351562, -622.6404418945312, -605.1402587890625, -587.6400146484375, -570.1397705078125, -552.6395263671875, -535.1392822265625, -517.6390380859375, -500.1387939453125, -482.6385803222656, -465.1383361816406, -447.6380920410156, -430.13787841796875, -412.63763427734375, -395.13739013671875, -377.63714599609375, -360.13690185546875, -342.6366882324219, -325.1364440917969, -307.6361999511719, -290.135986328125, -272.6357421875, -255.135498046875, -237.63525390625, -220.13502502441406, -202.63479614257812, -185.13455200195312, -167.63430786132812, -150.1340789794922, -132.63385009765625, -115.1336669921875, -97.63343048095703, -80.13319396972656, -62.632957458496094, -45.132720947265625, -27.632484436035156, -10.132247924804688, 7.367988586425781, 24.86822509765625, 42.36846160888672, 59.86869812011719, 77.36893463134766, 94.86917114257812, 112.3694076538086, 129.86964416503906, 147.369873046875, 164.8701171875, 182.370361328125, 199.87059020996094, 217.37081909179688, 234.87106323242188, 252.37130737304688, 269.87152099609375, 287.37176513671875, 304.87200927734375, 322.37225341796875, 339.87249755859375, 357.3727111816406, 374.8729553222656, 392.3731994628906, 409.8734130859375, 427.3736572265625, 444.8739013671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 11.0, 5.0, 19.0, 25.0, 28.0, 45.0, 58.0, 93.0, 182.0, 333.0, 693.0, 1778.0, 5225.0, 20928.0, 127102.0, 695084.0, 162376.0, 24945.0, 6070.0, 1913.0, 738.0, 364.0, 193.0, 107.0, 62.0, 41.0, 37.0, 21.0, 14.0, 11.0, 8.0, 3.0, 8.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.625, -113.8974609375, -110.169921875, -106.4423828125, -102.71484375, -98.9873046875, -95.259765625, -91.5322265625, -87.8046875, -84.0771484375, -80.349609375, -76.6220703125, -72.89453125, -69.1669921875, -65.439453125, -61.7119140625, -57.984375, -54.2568359375, -50.529296875, -46.8017578125, -43.07421875, -39.3466796875, -35.619140625, -31.8916015625, -28.1640625, -24.4365234375, -20.708984375, -16.9814453125, -13.25390625, -9.5263671875, -5.798828125, -2.0712890625, 1.65625, 5.3837890625, 9.111328125, 12.8388671875, 16.56640625, 20.2939453125, 24.021484375, 27.7490234375, 31.4765625, 35.2041015625, 38.931640625, 42.6591796875, 46.38671875, 50.1142578125, 53.841796875, 57.5693359375, 61.296875, 65.0244140625, 68.751953125, 72.4794921875, 76.20703125, 79.9345703125, 83.662109375, 87.3896484375, 91.1171875, 94.8447265625, 98.572265625, 102.2998046875, 106.02734375, 109.7548828125, 113.482421875, 117.2099609375, 120.9375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 17.0, 19.0, 23.0, 30.0, 45.0, 50.0, 62.0, 66.0, 74.0, 111.0, 90.0, 67.0, 78.0, 62.0, 53.0, 42.0, 37.0, 14.0, 21.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.1875, -32.394287109375, -31.60107421875, -30.807861328125, -30.0146484375, -29.221435546875, -28.42822265625, -27.635009765625, -26.841796875, -26.048583984375, -25.25537109375, -24.462158203125, -23.6689453125, -22.875732421875, -22.08251953125, -21.289306640625, -20.49609375, -19.702880859375, -18.90966796875, -18.116455078125, -17.3232421875, -16.530029296875, -15.73681640625, -14.943603515625, -14.150390625, -13.357177734375, -12.56396484375, -11.770751953125, -10.9775390625, -10.184326171875, -9.39111328125, -8.597900390625, -7.8046875, -7.011474609375, -6.21826171875, -5.425048828125, -4.6318359375, -3.838623046875, -3.04541015625, -2.252197265625, -1.458984375, -0.665771484375, 0.12744140625, 0.920654296875, 1.7138671875, 2.507080078125, 3.30029296875, 4.093505859375, 4.88671875, 5.679931640625, 6.47314453125, 7.266357421875, 8.0595703125, 8.852783203125, 9.64599609375, 10.439208984375, 11.232421875, 12.025634765625, 12.81884765625, 13.612060546875, 14.4052734375, 15.198486328125, 15.99169921875, 16.784912109375, 17.578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 8.0, 15.0, 17.0, 33.0, 43.0, 42.0, 68.0, 118.0, 172.0, 290.0, 520.0, 914.0, 2220.0, 7923.0, 60765.0, 803143.0, 153020.0, 13374.0, 3075.0, 1202.0, 580.0, 371.0, 205.0, 120.0, 80.0, 78.0, 35.0, 32.0, 22.0, 13.0, 9.0, 5.0, 5.0, 8.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-175.625, -170.833984375, -166.04296875, -161.251953125, -156.4609375, -151.669921875, -146.87890625, -142.087890625, -137.296875, -132.505859375, -127.71484375, -122.923828125, -118.1328125, -113.341796875, -108.55078125, -103.759765625, -98.96875, -94.177734375, -89.38671875, -84.595703125, -79.8046875, -75.013671875, -70.22265625, -65.431640625, -60.640625, -55.849609375, -51.05859375, -46.267578125, -41.4765625, -36.685546875, -31.89453125, -27.103515625, -22.3125, -17.521484375, -12.73046875, -7.939453125, -3.1484375, 1.642578125, 6.43359375, 11.224609375, 16.015625, 20.806640625, 25.59765625, 30.388671875, 35.1796875, 39.970703125, 44.76171875, 49.552734375, 54.34375, 59.134765625, 63.92578125, 68.716796875, 73.5078125, 78.298828125, 83.08984375, 87.880859375, 92.671875, 97.462890625, 102.25390625, 107.044921875, 111.8359375, 116.626953125, 121.41796875, 126.208984375, 131.0]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 12.0, 13.0, 23.0, 25.0, 32.0, 42.0, 37.0, 50.0, 58.0, 71.0, 52.0, 57.0, 59.0, 67.0, 52.0, 57.0, 48.0, 50.0, 39.0, 27.0, 18.0, 22.0, 8.0, 9.0, 15.0, 9.0, 8.0, 5.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-108.625, -105.75, -102.875, -100.0, -97.125, -94.25, -91.375, -88.5, -85.625, -82.75, -79.875, -77.0, -74.125, -71.25, -68.375, -65.5, -62.625, -59.75, -56.875, -54.0, -51.125, -48.25, -45.375, -42.5, -39.625, -36.75, -33.875, -31.0, -28.125, -25.25, -22.375, -19.5, -16.625, -13.75, -10.875, -8.0, -5.125, -2.25, 0.625, 3.5, 6.375, 9.25, 12.125, 15.0, 17.875, 20.75, 23.625, 26.5, 29.375, 32.25, 35.125, 38.0, 40.875, 43.75, 46.625, 49.5, 52.375, 55.25, 58.125, 61.0, 63.875, 66.75, 69.625, 72.5, 75.375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 10.0, 15.0, 37.0, 35.0, 79.0, 162.0, 345.0, 1393.0, 11240.0, 904149.0, 125313.0, 4411.0, 782.0, 272.0, 121.0, 70.0, 41.0, 31.0, 15.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-115.875, -111.853515625, -107.83203125, -103.810546875, -99.7890625, -95.767578125, -91.74609375, -87.724609375, -83.703125, -79.681640625, -75.66015625, -71.638671875, -67.6171875, -63.595703125, -59.57421875, -55.552734375, -51.53125, -47.509765625, -43.48828125, -39.466796875, -35.4453125, -31.423828125, -27.40234375, -23.380859375, -19.359375, -15.337890625, -11.31640625, -7.294921875, -3.2734375, 0.748046875, 4.76953125, 8.791015625, 12.8125, 16.833984375, 20.85546875, 24.876953125, 28.8984375, 32.919921875, 36.94140625, 40.962890625, 44.984375, 49.005859375, 53.02734375, 57.048828125, 61.0703125, 65.091796875, 69.11328125, 73.134765625, 77.15625, 81.177734375, 85.19921875, 89.220703125, 93.2421875, 97.263671875, 101.28515625, 105.306640625, 109.328125, 113.349609375, 117.37109375, 121.392578125, 125.4140625, 129.435546875, 133.45703125, 137.478515625, 141.5]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 7.0, 11.0, 11.0, 14.0, 31.0, 40.0, 42.0, 66.0, 110.0, 103.0, 108.0, 121.0, 88.0, 59.0, 54.0, 33.0, 26.0, 19.0, 9.0, 12.0, 9.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00470733642578125, -0.004578739404678345, -0.0044501423835754395, -0.004321545362472534, -0.004192948341369629, -0.004064351320266724, -0.003935754299163818, -0.003807157278060913, -0.003678560256958008, -0.0035499632358551025, -0.0034213662147521973, -0.003292769193649292, -0.0031641721725463867, -0.0030355751514434814, -0.002906978130340576, -0.002778381109237671, -0.0026497840881347656, -0.0025211870670318604, -0.002392590045928955, -0.00226399302482605, -0.0021353960037231445, -0.0020067989826202393, -0.001878201961517334, -0.0017496049404144287, -0.0016210079193115234, -0.0014924108982086182, -0.0013638138771057129, -0.0012352168560028076, -0.0011066198348999023, -0.000978022813796997, -0.0008494257926940918, -0.0007208287715911865, -0.0005922317504882812, -0.000463634729385376, -0.0003350377082824707, -0.00020644068717956543, -7.784366607666016e-05, 5.075335502624512e-05, 0.0001793503761291504, 0.00030794739723205566, 0.00043654441833496094, 0.0005651414394378662, 0.0006937384605407715, 0.0008223354816436768, 0.000950932502746582, 0.0010795295238494873, 0.0012081265449523926, 0.0013367235660552979, 0.0014653205871582031, 0.0015939176082611084, 0.0017225146293640137, 0.001851111650466919, 0.0019797086715698242, 0.0021083056926727295, 0.0022369027137756348, 0.00236549973487854, 0.0024940967559814453, 0.0026226937770843506, 0.002751290798187256, 0.002879887819290161, 0.0030084848403930664, 0.0031370818614959717, 0.003265678882598877, 0.0033942759037017822, 0.0035228729248046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 11.0, 15.0, 18.0, 31.0, 63.0, 99.0, 227.0, 538.0, 1982.0, 16702.0, 952542.0, 71099.0, 3816.0, 831.0, 263.0, 115.0, 63.0, 53.0, 25.0, 15.0, 14.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-107.9375, -105.0732421875, -102.208984375, -99.3447265625, -96.48046875, -93.6162109375, -90.751953125, -87.8876953125, -85.0234375, -82.1591796875, -79.294921875, -76.4306640625, -73.56640625, -70.7021484375, -67.837890625, -64.9736328125, -62.109375, -59.2451171875, -56.380859375, -53.5166015625, -50.65234375, -47.7880859375, -44.923828125, -42.0595703125, -39.1953125, -36.3310546875, -33.466796875, -30.6025390625, -27.73828125, -24.8740234375, -22.009765625, -19.1455078125, -16.28125, -13.4169921875, -10.552734375, -7.6884765625, -4.82421875, -1.9599609375, 0.904296875, 3.7685546875, 6.6328125, 9.4970703125, 12.361328125, 15.2255859375, 18.08984375, 20.9541015625, 23.818359375, 26.6826171875, 29.546875, 32.4111328125, 35.275390625, 38.1396484375, 41.00390625, 43.8681640625, 46.732421875, 49.5966796875, 52.4609375, 55.3251953125, 58.189453125, 61.0537109375, 63.91796875, 66.7822265625, 69.646484375, 72.5107421875, 75.375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 8.0, 4.0, 20.0, 26.0, 53.0, 94.0, 149.0, 215.0, 170.0, 128.0, 54.0, 33.0, 7.0, 10.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-69.25, -67.54443359375, -65.8388671875, -64.13330078125, -62.427734375, -60.72216796875, -59.0166015625, -57.31103515625, -55.60546875, -53.89990234375, -52.1943359375, -50.48876953125, -48.783203125, -47.07763671875, -45.3720703125, -43.66650390625, -41.9609375, -40.25537109375, -38.5498046875, -36.84423828125, -35.138671875, -33.43310546875, -31.7275390625, -30.02197265625, -28.31640625, -26.61083984375, -24.9052734375, -23.19970703125, -21.494140625, -19.78857421875, -18.0830078125, -16.37744140625, -14.671875, -12.96630859375, -11.2607421875, -9.55517578125, -7.849609375, -6.14404296875, -4.4384765625, -2.73291015625, -1.02734375, 0.67822265625, 2.3837890625, 4.08935546875, 5.794921875, 7.50048828125, 9.2060546875, 10.91162109375, 12.6171875, 14.32275390625, 16.0283203125, 17.73388671875, 19.439453125, 21.14501953125, 22.8505859375, 24.55615234375, 26.26171875, 27.96728515625, 29.6728515625, 31.37841796875, 33.083984375, 34.78955078125, 36.4951171875, 38.20068359375, 39.90625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 30.0, 103.0, 322.0, 361.0, 116.0, 39.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1742.66015625, -1704.87646484375, -1667.0927734375, -1629.30908203125, -1591.525390625, -1553.74169921875, -1515.9580078125, -1478.17431640625, -1440.390625, -1402.60693359375, -1364.8232421875, -1327.03955078125, -1289.255859375, -1251.47216796875, -1213.6884765625, -1175.90478515625, -1138.12109375, -1100.33740234375, -1062.5537109375, -1024.77001953125, -986.986328125, -949.20263671875, -911.4189453125, -873.63525390625, -835.8515625, -798.06787109375, -760.2841796875, -722.50048828125, -684.716796875, -646.93310546875, -609.1494140625, -571.36572265625, -533.5820922851562, -495.79840087890625, -458.01470947265625, -420.23101806640625, -382.44732666015625, -344.66363525390625, -306.87994384765625, -269.09625244140625, -231.31256103515625, -193.52886962890625, -155.74517822265625, -117.96148681640625, -80.17779541015625, -42.39410400390625, -4.61041259765625, 33.17327880859375, 70.95697021484375, 108.74066162109375, 146.52435302734375, 184.30804443359375, 222.09173583984375, 259.87542724609375, 297.65911865234375, 335.44281005859375, 373.22650146484375, 411.01019287109375, 448.79388427734375, 486.57757568359375, 524.3612670898438, 562.1449584960938, 599.9286499023438, 637.7123413085938, 675.4960327148438]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 2.0, 9.0, 5.0, 8.0, 15.0, 11.0, 21.0, 34.0, 36.0, 30.0, 32.0, 51.0, 53.0, 54.0, 53.0, 53.0, 54.0, 50.0, 60.0, 56.0, 46.0, 44.0, 45.0, 39.0, 36.0, 26.0, 18.0, 13.0, 11.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.62591552734375, -417.2890930175781, -401.9522705078125, -386.61541748046875, -371.2785949707031, -355.9417724609375, -340.6049499511719, -325.26812744140625, -309.9312744140625, -294.5944519042969, -279.25762939453125, -263.9207763671875, -248.58395385742188, -233.24713134765625, -217.91030883789062, -202.573486328125, -187.23666381835938, -171.89984130859375, -156.56300354003906, -141.22618103027344, -125.88935089111328, -110.55252075195312, -95.2156982421875, -79.87886810302734, -64.54203796386719, -49.20520782470703, -33.86838150024414, -18.53155517578125, -3.1947250366210938, 12.142105102539062, 27.478927612304688, 42.815757751464844, 58.152587890625, 73.48941802978516, 88.82624816894531, 104.16307067871094, 119.4999008178711, 134.83673095703125, 150.17355346679688, 165.5103759765625, 180.8472137451172, 196.1840362548828, 211.5208740234375, 226.85769653320312, 242.19451904296875, 257.5313720703125, 272.8681640625, 288.20501708984375, 303.5418395996094, 318.878662109375, 334.2154846191406, 349.55230712890625, 364.88916015625, 380.2259826660156, 395.56280517578125, 410.8996276855469, 426.2364501953125, 441.5732727050781, 456.91009521484375, 472.2469482421875, 487.5837707519531, 502.92059326171875, 518.2574462890625, 533.59423828125, 548.9310913085938]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 12.0, 13.0, 23.0, 33.0, 53.0, 92.0, 143.0, 232.0, 437.0, 1019.0, 2925.0, 11564.0, 103484.0, 3975721.0, 84603.0, 10036.0, 2437.0, 756.0, 335.0, 162.0, 68.0, 60.0, 21.0, 22.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0], "bins": [-283.0, -276.9091796875, -270.818359375, -264.7275390625, -258.63671875, -252.5458984375, -246.455078125, -240.3642578125, -234.2734375, -228.1826171875, -222.091796875, -216.0009765625, -209.91015625, -203.8193359375, -197.728515625, -191.6376953125, -185.546875, -179.4560546875, -173.365234375, -167.2744140625, -161.18359375, -155.0927734375, -149.001953125, -142.9111328125, -136.8203125, -130.7294921875, -124.638671875, -118.5478515625, -112.45703125, -106.3662109375, -100.275390625, -94.1845703125, -88.09375, -82.0029296875, -75.912109375, -69.8212890625, -63.73046875, -57.6396484375, -51.548828125, -45.4580078125, -39.3671875, -33.2763671875, -27.185546875, -21.0947265625, -15.00390625, -8.9130859375, -2.822265625, 3.2685546875, 9.359375, 15.4501953125, 21.541015625, 27.6318359375, 33.72265625, 39.8134765625, 45.904296875, 51.9951171875, 58.0859375, 64.1767578125, 70.267578125, 76.3583984375, 82.44921875, 88.5400390625, 94.630859375, 100.7216796875, 106.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 10.0, 14.0, 29.0, 21.0, 25.0, 31.0, 54.0, 68.0, 68.0, 61.0, 75.0, 75.0, 80.0, 65.0, 70.0, 48.0, 34.0, 43.0, 38.0, 25.0, 15.0, 14.0, 13.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.765625, -30.053955078125, -29.34228515625, -28.630615234375, -27.9189453125, -27.207275390625, -26.49560546875, -25.783935546875, -25.072265625, -24.360595703125, -23.64892578125, -22.937255859375, -22.2255859375, -21.513916015625, -20.80224609375, -20.090576171875, -19.37890625, -18.667236328125, -17.95556640625, -17.243896484375, -16.5322265625, -15.820556640625, -15.10888671875, -14.397216796875, -13.685546875, -12.973876953125, -12.26220703125, -11.550537109375, -10.8388671875, -10.127197265625, -9.41552734375, -8.703857421875, -7.9921875, -7.280517578125, -6.56884765625, -5.857177734375, -5.1455078125, -4.433837890625, -3.72216796875, -3.010498046875, -2.298828125, -1.587158203125, -0.87548828125, -0.163818359375, 0.5478515625, 1.259521484375, 1.97119140625, 2.682861328125, 3.39453125, 4.106201171875, 4.81787109375, 5.529541015625, 6.2412109375, 6.952880859375, 7.66455078125, 8.376220703125, 9.087890625, 9.799560546875, 10.51123046875, 11.222900390625, 11.9345703125, 12.646240234375, 13.35791015625, 14.069580078125, 14.78125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 5.0, 10.0, 15.0, 26.0, 32.0, 49.0, 108.0, 214.0, 480.0, 1248.0, 3867.0, 17764.0, 1024281.0, 3115028.0, 23092.0, 5132.0, 1681.0, 615.0, 268.0, 133.0, 69.0, 51.0, 26.0, 28.0, 11.0, 9.0, 6.0, 6.0, 9.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.375, -152.921875, -147.46875, -142.015625, -136.5625, -131.109375, -125.65625, -120.203125, -114.75, -109.296875, -103.84375, -98.390625, -92.9375, -87.484375, -82.03125, -76.578125, -71.125, -65.671875, -60.21875, -54.765625, -49.3125, -43.859375, -38.40625, -32.953125, -27.5, -22.046875, -16.59375, -11.140625, -5.6875, -0.234375, 5.21875, 10.671875, 16.125, 21.578125, 27.03125, 32.484375, 37.9375, 43.390625, 48.84375, 54.296875, 59.75, 65.203125, 70.65625, 76.109375, 81.5625, 87.015625, 92.46875, 97.921875, 103.375, 108.828125, 114.28125, 119.734375, 125.1875, 130.640625, 136.09375, 141.546875, 147.0, 152.453125, 157.90625, 163.359375, 168.8125, 174.265625, 179.71875, 185.171875, 190.625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 13.0, 11.0, 16.0, 35.0, 57.0, 113.0, 258.0, 1047.0, 1866.0, 336.0, 122.0, 61.0, 32.0, 23.0, 16.0, 9.0, 2.0, 9.0, 6.0, 2.0, 5.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.9375, -45.326171875, -43.71484375, -42.103515625, -40.4921875, -38.880859375, -37.26953125, -35.658203125, -34.046875, -32.435546875, -30.82421875, -29.212890625, -27.6015625, -25.990234375, -24.37890625, -22.767578125, -21.15625, -19.544921875, -17.93359375, -16.322265625, -14.7109375, -13.099609375, -11.48828125, -9.876953125, -8.265625, -6.654296875, -5.04296875, -3.431640625, -1.8203125, -0.208984375, 1.40234375, 3.013671875, 4.625, 6.236328125, 7.84765625, 9.458984375, 11.0703125, 12.681640625, 14.29296875, 15.904296875, 17.515625, 19.126953125, 20.73828125, 22.349609375, 23.9609375, 25.572265625, 27.18359375, 28.794921875, 30.40625, 32.017578125, 33.62890625, 35.240234375, 36.8515625, 38.462890625, 40.07421875, 41.685546875, 43.296875, 44.908203125, 46.51953125, 48.130859375, 49.7421875, 51.353515625, 52.96484375, 54.576171875, 56.1875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 35.0, 95.0, 393.0, 331.0, 89.0, 26.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-287.711181640625, -269.74853515625, -251.78590393066406, -233.82327270507812, -215.86062622070312, -197.89797973632812, -179.9353485107422, -161.97271728515625, -144.01007080078125, -126.04743194580078, -108.08479309082031, -90.12215423583984, -72.15951538085938, -54.196876525878906, -36.23423767089844, -18.27159881591797, -0.3089599609375, 17.65367889404297, 35.61631774902344, 53.578956604003906, 71.54159545898438, 89.50423431396484, 107.46687316894531, 125.42951202392578, 143.39215087890625, 161.35479736328125, 179.3174285888672, 197.28005981445312, 215.24270629882812, 233.20535278320312, 251.16798400878906, 269.130615234375, 287.09326171875, 305.055908203125, 323.0185546875, 340.9811706542969, 358.9438171386719, 376.9064636230469, 394.86907958984375, 412.83172607421875, 430.79437255859375, 448.75701904296875, 466.71966552734375, 484.6822814941406, 502.6449279785156, 520.6075439453125, 538.5701904296875, 556.5328369140625, 574.4954833984375, 592.4581298828125, 610.4207763671875, 628.3834228515625, 646.3460693359375, 664.3086547851562, 682.2713012695312, 700.2339477539062, 718.1965942382812, 736.1592407226562, 754.1218872070312, 772.0845336914062, 790.047119140625, 808.009765625, 825.972412109375, 843.93505859375, 861.897705078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 17.0, 20.0, 29.0, 31.0, 36.0, 43.0, 52.0, 56.0, 64.0, 69.0, 56.0, 64.0, 67.0, 49.0, 53.0, 54.0, 43.0, 41.0, 35.0, 28.0, 18.0, 17.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-206.3984375, -200.08758544921875, -193.77671813964844, -187.4658660888672, -181.15499877929688, -174.84414672851562, -168.53329467773438, -162.22242736816406, -155.91156005859375, -149.6007080078125, -143.2898406982422, -136.97898864746094, -130.66812133789062, -124.35726928710938, -118.0464096069336, -111.73554992675781, -105.42469787597656, -99.11383819580078, -92.802978515625, -86.49212646484375, -80.18125915527344, -73.87040710449219, -67.5595474243164, -61.248687744140625, -54.937828063964844, -48.62696838378906, -42.31610870361328, -36.005252838134766, -29.694393157958984, -23.383533477783203, -17.072677612304688, -10.761817932128906, -4.4509429931640625, 1.8599157333374023, 8.170774459838867, 14.481632232666016, 20.792491912841797, 27.103351593017578, 33.414207458496094, 39.725067138671875, 46.035926818847656, 52.34678649902344, 58.65764617919922, 64.968505859375, 71.27935791015625, 77.59022521972656, 83.90107727050781, 90.2119369506836, 96.52279663085938, 102.83365631103516, 109.14451599121094, 115.45536804199219, 121.7662353515625, 128.07708740234375, 134.387939453125, 140.6988067626953, 147.00967407226562, 153.32052612304688, 159.6313934326172, 165.94224548339844, 172.25311279296875, 178.56396484375, 184.87481689453125, 191.18568420410156, 197.4965362548828]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 6.0, 8.0, 4.0, 12.0, 11.0, 28.0, 23.0, 38.0, 61.0, 89.0, 138.0, 227.0, 393.0, 681.0, 1519.0, 3670.0, 9988.0, 32014.0, 139868.0, 559678.0, 230433.0, 47241.0, 13596.0, 4846.0, 1989.0, 823.0, 476.0, 252.0, 151.0, 92.0, 54.0, 48.0, 29.0, 18.0, 13.0, 14.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.0625, -70.51171875, -67.9609375, -65.41015625, -62.859375, -60.30859375, -57.7578125, -55.20703125, -52.65625, -50.10546875, -47.5546875, -45.00390625, -42.453125, -39.90234375, -37.3515625, -34.80078125, -32.25, -29.69921875, -27.1484375, -24.59765625, -22.046875, -19.49609375, -16.9453125, -14.39453125, -11.84375, -9.29296875, -6.7421875, -4.19140625, -1.640625, 0.91015625, 3.4609375, 6.01171875, 8.5625, 11.11328125, 13.6640625, 16.21484375, 18.765625, 21.31640625, 23.8671875, 26.41796875, 28.96875, 31.51953125, 34.0703125, 36.62109375, 39.171875, 41.72265625, 44.2734375, 46.82421875, 49.375, 51.92578125, 54.4765625, 57.02734375, 59.578125, 62.12890625, 64.6796875, 67.23046875, 69.78125, 72.33203125, 74.8828125, 77.43359375, 79.984375, 82.53515625, 85.0859375, 87.63671875, 90.1875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 12.0, 11.0, 28.0, 20.0, 42.0, 44.0, 52.0, 53.0, 71.0, 66.0, 73.0, 68.0, 78.0, 63.0, 50.0, 59.0, 43.0, 48.0, 22.0, 28.0, 15.0, 10.0, 11.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.88720703125, -21.2431640625, -20.59912109375, -19.955078125, -19.31103515625, -18.6669921875, -18.02294921875, -17.37890625, -16.73486328125, -16.0908203125, -15.44677734375, -14.802734375, -14.15869140625, -13.5146484375, -12.87060546875, -12.2265625, -11.58251953125, -10.9384765625, -10.29443359375, -9.650390625, -9.00634765625, -8.3623046875, -7.71826171875, -7.07421875, -6.43017578125, -5.7861328125, -5.14208984375, -4.498046875, -3.85400390625, -3.2099609375, -2.56591796875, -1.921875, -1.27783203125, -0.6337890625, 0.01025390625, 0.654296875, 1.29833984375, 1.9423828125, 2.58642578125, 3.23046875, 3.87451171875, 4.5185546875, 5.16259765625, 5.806640625, 6.45068359375, 7.0947265625, 7.73876953125, 8.3828125, 9.02685546875, 9.6708984375, 10.31494140625, 10.958984375, 11.60302734375, 12.2470703125, 12.89111328125, 13.53515625, 14.17919921875, 14.8232421875, 15.46728515625, 16.111328125, 16.75537109375, 17.3994140625, 18.04345703125, 18.6875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 8.0, 20.0, 16.0, 25.0, 46.0, 70.0, 100.0, 130.0, 186.0, 288.0, 460.0, 755.0, 1437.0, 3342.0, 10557.0, 46638.0, 309824.0, 559661.0, 88247.0, 17452.0, 4836.0, 1871.0, 951.0, 563.0, 340.0, 232.0, 139.0, 106.0, 90.0, 41.0, 34.0, 20.0, 12.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.1875, -78.583984375, -75.98046875, -73.376953125, -70.7734375, -68.169921875, -65.56640625, -62.962890625, -60.359375, -57.755859375, -55.15234375, -52.548828125, -49.9453125, -47.341796875, -44.73828125, -42.134765625, -39.53125, -36.927734375, -34.32421875, -31.720703125, -29.1171875, -26.513671875, -23.91015625, -21.306640625, -18.703125, -16.099609375, -13.49609375, -10.892578125, -8.2890625, -5.685546875, -3.08203125, -0.478515625, 2.125, 4.728515625, 7.33203125, 9.935546875, 12.5390625, 15.142578125, 17.74609375, 20.349609375, 22.953125, 25.556640625, 28.16015625, 30.763671875, 33.3671875, 35.970703125, 38.57421875, 41.177734375, 43.78125, 46.384765625, 48.98828125, 51.591796875, 54.1953125, 56.798828125, 59.40234375, 62.005859375, 64.609375, 67.212890625, 69.81640625, 72.419921875, 75.0234375, 77.626953125, 80.23046875, 82.833984375, 85.4375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 10.0, 7.0, 9.0, 19.0, 23.0, 16.0, 22.0, 26.0, 37.0, 52.0, 36.0, 39.0, 40.0, 53.0, 51.0, 52.0, 48.0, 41.0, 51.0, 43.0, 38.0, 37.0, 46.0, 22.0, 33.0, 23.0, 15.0, 16.0, 17.0, 21.0, 14.0, 11.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-77.3125, -75.224609375, -73.13671875, -71.048828125, -68.9609375, -66.873046875, -64.78515625, -62.697265625, -60.609375, -58.521484375, -56.43359375, -54.345703125, -52.2578125, -50.169921875, -48.08203125, -45.994140625, -43.90625, -41.818359375, -39.73046875, -37.642578125, -35.5546875, -33.466796875, -31.37890625, -29.291015625, -27.203125, -25.115234375, -23.02734375, -20.939453125, -18.8515625, -16.763671875, -14.67578125, -12.587890625, -10.5, -8.412109375, -6.32421875, -4.236328125, -2.1484375, -0.060546875, 2.02734375, 4.115234375, 6.203125, 8.291015625, 10.37890625, 12.466796875, 14.5546875, 16.642578125, 18.73046875, 20.818359375, 22.90625, 24.994140625, 27.08203125, 29.169921875, 31.2578125, 33.345703125, 35.43359375, 37.521484375, 39.609375, 41.697265625, 43.78515625, 45.873046875, 47.9609375, 50.048828125, 52.13671875, 54.224609375, 56.3125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 6.0, 16.0, 17.0, 28.0, 37.0, 61.0, 96.0, 154.0, 261.0, 453.0, 874.0, 2055.0, 6008.0, 28296.0, 966604.0, 32755.0, 6543.0, 2188.0, 909.0, 472.0, 274.0, 163.0, 93.0, 63.0, 30.0, 19.0, 14.0, 12.0, 12.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-151.875, -147.4765625, -143.078125, -138.6796875, -134.28125, -129.8828125, -125.484375, -121.0859375, -116.6875, -112.2890625, -107.890625, -103.4921875, -99.09375, -94.6953125, -90.296875, -85.8984375, -81.5, -77.1015625, -72.703125, -68.3046875, -63.90625, -59.5078125, -55.109375, -50.7109375, -46.3125, -41.9140625, -37.515625, -33.1171875, -28.71875, -24.3203125, -19.921875, -15.5234375, -11.125, -6.7265625, -2.328125, 2.0703125, 6.46875, 10.8671875, 15.265625, 19.6640625, 24.0625, 28.4609375, 32.859375, 37.2578125, 41.65625, 46.0546875, 50.453125, 54.8515625, 59.25, 63.6484375, 68.046875, 72.4453125, 76.84375, 81.2421875, 85.640625, 90.0390625, 94.4375, 98.8359375, 103.234375, 107.6328125, 112.03125, 116.4296875, 120.828125, 125.2265625, 129.625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 19.0, 21.0, 36.0, 68.0, 91.0, 115.0, 123.0, 126.0, 143.0, 85.0, 53.0, 45.0, 16.0, 13.0, 3.0, 7.0, 3.0, 2.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00388336181640625, -0.0037270188331604004, -0.0035706758499145508, -0.003414332866668701, -0.0032579898834228516, -0.003101646900177002, -0.0029453039169311523, -0.0027889609336853027, -0.002632617950439453, -0.0024762749671936035, -0.002319931983947754, -0.0021635890007019043, -0.0020072460174560547, -0.001850903034210205, -0.0016945600509643555, -0.0015382170677185059, -0.0013818740844726562, -0.0012255311012268066, -0.001069188117980957, -0.0009128451347351074, -0.0007565021514892578, -0.0006001591682434082, -0.0004438161849975586, -0.000287473201751709, -0.00013113021850585938, 2.5212764739990234e-05, 0.00018155574798583984, 0.00033789873123168945, 0.0004942417144775391, 0.0006505846977233887, 0.0008069276809692383, 0.0009632706642150879, 0.0011196136474609375, 0.0012759566307067871, 0.0014322996139526367, 0.0015886425971984863, 0.001744985580444336, 0.0019013285636901855, 0.002057671546936035, 0.0022140145301818848, 0.0023703575134277344, 0.002526700496673584, 0.0026830434799194336, 0.002839386463165283, 0.002995729446411133, 0.0031520724296569824, 0.003308415412902832, 0.0034647583961486816, 0.0036211013793945312, 0.003777444362640381, 0.0039337873458862305, 0.00409013032913208, 0.00424647331237793, 0.004402816295623779, 0.004559159278869629, 0.0047155022621154785, 0.004871845245361328, 0.005028188228607178, 0.005184531211853027, 0.005340874195098877, 0.0054972171783447266, 0.005653560161590576, 0.005809903144836426, 0.005966246128082275, 0.006122589111328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 13.0, 24.0, 29.0, 32.0, 40.0, 64.0, 80.0, 131.0, 257.0, 418.0, 633.0, 1130.0, 2305.0, 5462.0, 23879.0, 946851.0, 53178.0, 7676.0, 2793.0, 1378.0, 817.0, 479.0, 271.0, 170.0, 112.0, 77.0, 56.0, 34.0, 29.0, 20.0, 15.0, 12.0, 10.0, 7.0, 4.0, 1.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-118.0625, -114.4462890625, -110.830078125, -107.2138671875, -103.59765625, -99.9814453125, -96.365234375, -92.7490234375, -89.1328125, -85.5166015625, -81.900390625, -78.2841796875, -74.66796875, -71.0517578125, -67.435546875, -63.8193359375, -60.203125, -56.5869140625, -52.970703125, -49.3544921875, -45.73828125, -42.1220703125, -38.505859375, -34.8896484375, -31.2734375, -27.6572265625, -24.041015625, -20.4248046875, -16.80859375, -13.1923828125, -9.576171875, -5.9599609375, -2.34375, 1.2724609375, 4.888671875, 8.5048828125, 12.12109375, 15.7373046875, 19.353515625, 22.9697265625, 26.5859375, 30.2021484375, 33.818359375, 37.4345703125, 41.05078125, 44.6669921875, 48.283203125, 51.8994140625, 55.515625, 59.1318359375, 62.748046875, 66.3642578125, 69.98046875, 73.5966796875, 77.212890625, 80.8291015625, 84.4453125, 88.0615234375, 91.677734375, 95.2939453125, 98.91015625, 102.5263671875, 106.142578125, 109.7587890625, 113.375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 4.0, 11.0, 13.0, 14.0, 28.0, 97.0, 222.0, 305.0, 163.0, 44.0, 24.0, 13.0, 10.0, 6.0, 1.0, 5.0, 4.0, 2.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.625, -68.365234375, -66.10546875, -63.845703125, -61.5859375, -59.326171875, -57.06640625, -54.806640625, -52.546875, -50.287109375, -48.02734375, -45.767578125, -43.5078125, -41.248046875, -38.98828125, -36.728515625, -34.46875, -32.208984375, -29.94921875, -27.689453125, -25.4296875, -23.169921875, -20.91015625, -18.650390625, -16.390625, -14.130859375, -11.87109375, -9.611328125, -7.3515625, -5.091796875, -2.83203125, -0.572265625, 1.6875, 3.947265625, 6.20703125, 8.466796875, 10.7265625, 12.986328125, 15.24609375, 17.505859375, 19.765625, 22.025390625, 24.28515625, 26.544921875, 28.8046875, 31.064453125, 33.32421875, 35.583984375, 37.84375, 40.103515625, 42.36328125, 44.623046875, 46.8828125, 49.142578125, 51.40234375, 53.662109375, 55.921875, 58.181640625, 60.44140625, 62.701171875, 64.9609375, 67.220703125, 69.48046875, 71.740234375, 74.0]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 13.0, 15.0, 46.0, 140.0, 372.0, 297.0, 90.0, 22.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1907.246826171875, -1863.828125, -1820.4093017578125, -1776.9906005859375, -1733.57177734375, -1690.153076171875, -1646.7342529296875, -1603.3155517578125, -1559.896728515625, -1516.47802734375, -1473.0592041015625, -1429.6405029296875, -1386.2216796875, -1342.802978515625, -1299.3841552734375, -1255.9654541015625, -1212.546630859375, -1169.1279296875, -1125.7091064453125, -1082.2904052734375, -1038.87158203125, -995.4528198242188, -952.0340576171875, -908.6153564453125, -865.1966552734375, -821.7778930664062, -778.359130859375, -734.9403686523438, -691.5216064453125, -648.1028442382812, -604.68408203125, -561.265380859375, -517.8465576171875, -474.42779541015625, -431.009033203125, -387.59027099609375, -344.1715087890625, -300.75274658203125, -257.3340148925781, -213.91525268554688, -170.49649047851562, -127.07772827148438, -83.65897369384766, -40.24021911621094, 3.1785430908203125, 46.59730529785156, 90.01605224609375, 133.434814453125, 176.85357666015625, 220.2723388671875, 263.69110107421875, 307.10986328125, 350.52862548828125, 393.9473876953125, 437.3661193847656, 480.7848815917969, 524.20361328125, 567.6223754882812, 611.0411376953125, 654.4598999023438, 697.878662109375, 741.2974243164062, 784.7161865234375, 828.1348876953125, 871.5537109375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 9.0, 10.0, 8.0, 14.0, 14.0, 21.0, 24.0, 21.0, 23.0, 32.0, 32.0, 39.0, 47.0, 46.0, 45.0, 36.0, 37.0, 40.0, 39.0, 36.0, 40.0, 34.0, 33.0, 32.0, 39.0, 29.0, 17.0, 24.0, 31.0, 15.0, 22.0, 10.0, 16.0, 14.0, 18.0, 11.0, 4.0, 6.0, 2.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-368.9228515625, -357.8231506347656, -346.72344970703125, -335.623779296875, -324.5240783691406, -313.42437744140625, -302.3246765136719, -291.2249755859375, -280.1252746582031, -269.02557373046875, -257.9258728027344, -246.82618713378906, -235.7264862060547, -224.62680053710938, -213.527099609375, -202.42739868164062, -191.3277130126953, -180.22801208496094, -169.12832641601562, -158.02862548828125, -146.92892456054688, -135.8292236328125, -124.72953796386719, -113.62983703613281, -102.53014373779297, -91.43045043945312, -80.33074951171875, -69.2310562133789, -58.1313591003418, -47.03166198730469, -35.931968688964844, -24.83226776123047, -13.732574462890625, -2.632878303527832, 8.466817855834961, 19.566513061523438, 30.666210174560547, 41.765907287597656, 52.8656005859375, 63.965301513671875, 75.06499481201172, 86.16468811035156, 97.26438903808594, 108.36408233642578, 119.46377563476562, 130.5634765625, 141.66317749023438, 152.76287841796875, 163.86256408691406, 174.96226501464844, 186.06195068359375, 197.16165161132812, 208.2613525390625, 219.36105346679688, 230.4607391357422, 241.56044006347656, 252.66012573242188, 263.75982666015625, 274.8595275878906, 285.959228515625, 297.05889892578125, 308.1585998535156, 319.25830078125, 330.3580017089844, 341.45770263671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 7.0, 10.0, 6.0, 10.0, 14.0, 32.0, 36.0, 70.0, 80.0, 153.0, 277.0, 505.0, 1012.0, 2111.0, 5377.0, 16846.0, 84617.0, 3696800.0, 338117.0, 34194.0, 8634.0, 2821.0, 1221.0, 602.0, 291.0, 168.0, 105.0, 52.0, 44.0, 16.0, 17.0, 12.0, 6.0, 7.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.0625, -76.572265625, -74.08203125, -71.591796875, -69.1015625, -66.611328125, -64.12109375, -61.630859375, -59.140625, -56.650390625, -54.16015625, -51.669921875, -49.1796875, -46.689453125, -44.19921875, -41.708984375, -39.21875, -36.728515625, -34.23828125, -31.748046875, -29.2578125, -26.767578125, -24.27734375, -21.787109375, -19.296875, -16.806640625, -14.31640625, -11.826171875, -9.3359375, -6.845703125, -4.35546875, -1.865234375, 0.625, 3.115234375, 5.60546875, 8.095703125, 10.5859375, 13.076171875, 15.56640625, 18.056640625, 20.546875, 23.037109375, 25.52734375, 28.017578125, 30.5078125, 32.998046875, 35.48828125, 37.978515625, 40.46875, 42.958984375, 45.44921875, 47.939453125, 50.4296875, 52.919921875, 55.41015625, 57.900390625, 60.390625, 62.880859375, 65.37109375, 67.861328125, 70.3515625, 72.841796875, 75.33203125, 77.822265625, 80.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 8.0, 11.0, 12.0, 14.0, 10.0, 17.0, 22.0, 31.0, 19.0, 42.0, 45.0, 41.0, 35.0, 59.0, 69.0, 63.0, 52.0, 52.0, 52.0, 52.0, 49.0, 36.0, 39.0, 27.0, 32.0, 23.0, 21.0, 21.0, 11.0, 12.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.7265625, -17.1875, -16.6484375, -16.109375, -15.5703125, -15.03125, -14.4921875, -13.953125, -13.4140625, -12.875, -12.3359375, -11.796875, -11.2578125, -10.71875, -10.1796875, -9.640625, -9.1015625, -8.5625, -8.0234375, -7.484375, -6.9453125, -6.40625, -5.8671875, -5.328125, -4.7890625, -4.25, -3.7109375, -3.171875, -2.6328125, -2.09375, -1.5546875, -1.015625, -0.4765625, 0.0625, 0.6015625, 1.140625, 1.6796875, 2.21875, 2.7578125, 3.296875, 3.8359375, 4.375, 4.9140625, 5.453125, 5.9921875, 6.53125, 7.0703125, 7.609375, 8.1484375, 8.6875, 9.2265625, 9.765625, 10.3046875, 10.84375, 11.3828125, 11.921875, 12.4609375, 13.0, 13.5390625, 14.078125, 14.6171875, 15.15625, 15.6953125, 16.234375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 15.0, 13.0, 25.0, 14.0, 33.0, 40.0, 60.0, 82.0, 112.0, 218.0, 360.0, 944.0, 3032.0, 15410.0, 227492.0, 3865131.0, 68951.0, 8683.0, 2006.0, 729.0, 382.0, 192.0, 109.0, 83.0, 49.0, 35.0, 26.0, 14.0, 11.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.375, -90.294921875, -87.21484375, -84.134765625, -81.0546875, -77.974609375, -74.89453125, -71.814453125, -68.734375, -65.654296875, -62.57421875, -59.494140625, -56.4140625, -53.333984375, -50.25390625, -47.173828125, -44.09375, -41.013671875, -37.93359375, -34.853515625, -31.7734375, -28.693359375, -25.61328125, -22.533203125, -19.453125, -16.373046875, -13.29296875, -10.212890625, -7.1328125, -4.052734375, -0.97265625, 2.107421875, 5.1875, 8.267578125, 11.34765625, 14.427734375, 17.5078125, 20.587890625, 23.66796875, 26.748046875, 29.828125, 32.908203125, 35.98828125, 39.068359375, 42.1484375, 45.228515625, 48.30859375, 51.388671875, 54.46875, 57.548828125, 60.62890625, 63.708984375, 66.7890625, 69.869140625, 72.94921875, 76.029296875, 79.109375, 82.189453125, 85.26953125, 88.349609375, 91.4296875, 94.509765625, 97.58984375, 100.669921875, 103.75]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 4.0, 16.0, 24.0, 54.0, 97.0, 247.0, 2065.0, 1042.0, 259.0, 109.0, 60.0, 26.0, 22.0, 14.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.15625, -36.91943359375, -35.6826171875, -34.44580078125, -33.208984375, -31.97216796875, -30.7353515625, -29.49853515625, -28.26171875, -27.02490234375, -25.7880859375, -24.55126953125, -23.314453125, -22.07763671875, -20.8408203125, -19.60400390625, -18.3671875, -17.13037109375, -15.8935546875, -14.65673828125, -13.419921875, -12.18310546875, -10.9462890625, -9.70947265625, -8.47265625, -7.23583984375, -5.9990234375, -4.76220703125, -3.525390625, -2.28857421875, -1.0517578125, 0.18505859375, 1.421875, 2.65869140625, 3.8955078125, 5.13232421875, 6.369140625, 7.60595703125, 8.8427734375, 10.07958984375, 11.31640625, 12.55322265625, 13.7900390625, 15.02685546875, 16.263671875, 17.50048828125, 18.7373046875, 19.97412109375, 21.2109375, 22.44775390625, 23.6845703125, 24.92138671875, 26.158203125, 27.39501953125, 28.6318359375, 29.86865234375, 31.10546875, 32.34228515625, 33.5791015625, 34.81591796875, 36.052734375, 37.28955078125, 38.5263671875, 39.76318359375, 41.0]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 44.0, 409.0, 417.0, 89.0, 22.0, 12.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-444.410400390625, -425.7106018066406, -407.01080322265625, -388.31097412109375, -369.6111755371094, -350.911376953125, -332.2115478515625, -313.5117492675781, -294.81195068359375, -276.1121520996094, -257.412353515625, -238.7125244140625, -220.01272583007812, -201.31292724609375, -182.6131134033203, -163.91329956054688, -145.2135009765625, -126.5136947631836, -107.81388854980469, -89.11408233642578, -70.41427612304688, -51.71446990966797, -33.01466369628906, -14.314849853515625, 4.38494873046875, 23.084754943847656, 41.78456115722656, 60.48436737060547, 79.18417358398438, 97.88397979736328, 116.58378601074219, 135.28359985351562, 153.98333740234375, 172.68313598632812, 191.38294982910156, 210.082763671875, 228.78256225585938, 247.48236083984375, 266.18218994140625, 284.8819885253906, 303.581787109375, 322.2815856933594, 340.98138427734375, 359.68121337890625, 378.3810119628906, 397.080810546875, 415.7806396484375, 434.4804382324219, 453.18023681640625, 471.8800354003906, 490.579833984375, 509.2796630859375, 527.9794921875, 546.6792602539062, 565.3790893554688, 584.078857421875, 602.7786865234375, 621.478515625, 640.1782836914062, 658.8781127929688, 677.577880859375, 696.2777099609375, 714.9775390625, 733.6773681640625, 752.3771362304688]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 7.0, 8.0, 9.0, 9.0, 7.0, 17.0, 19.0, 18.0, 23.0, 28.0, 23.0, 30.0, 36.0, 43.0, 35.0, 34.0, 46.0, 41.0, 29.0, 34.0, 37.0, 45.0, 33.0, 30.0, 35.0, 44.0, 34.0, 30.0, 23.0, 30.0, 22.0, 28.0, 18.0, 12.0, 19.0, 13.0, 12.0, 12.0, 6.0, 3.0, 5.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-87.89079284667969, -85.0030288696289, -82.11527252197266, -79.22750854492188, -76.33975219726562, -73.45198822021484, -70.56422424316406, -67.67646789550781, -64.78870391845703, -61.900943756103516, -59.01318359375, -56.12541961669922, -53.2376594543457, -50.34989929199219, -47.462135314941406, -44.57437515258789, -41.686614990234375, -38.79885482788086, -35.911094665527344, -33.02333068847656, -30.135570526123047, -27.24781036376953, -24.360048294067383, -21.472286224365234, -18.58452606201172, -15.696764945983887, -12.809003829956055, -9.921242713928223, -7.033481597900391, -4.145720481872559, -1.2579593658447266, 1.6298027038574219, 4.5175628662109375, 7.4053239822387695, 10.293085098266602, 13.180846214294434, 16.068607330322266, 18.95636749267578, 21.84412956237793, 24.731891632080078, 27.619651794433594, 30.50741195678711, 33.395172119140625, 36.282936096191406, 39.17069625854492, 42.05845642089844, 44.94622039794922, 47.833980560302734, 50.72174072265625, 53.609500885009766, 56.49726104736328, 59.38502502441406, 62.27278518676758, 65.1605453491211, 68.04830932617188, 70.93606567382812, 73.8238296508789, 76.71159362792969, 79.59934997558594, 82.48711395263672, 85.3748779296875, 88.26263427734375, 91.15039825439453, 94.03816223144531, 96.92591857910156]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 20.0, 20.0, 25.0, 35.0, 43.0, 74.0, 124.0, 176.0, 247.0, 439.0, 800.0, 1387.0, 2576.0, 4884.0, 10446.0, 23478.0, 58832.0, 169852.0, 396982.0, 240063.0, 80841.0, 30687.0, 13051.0, 6118.0, 3154.0, 1710.0, 900.0, 556.0, 350.0, 229.0, 132.0, 99.0, 48.0, 38.0, 29.0, 20.0, 15.0, 14.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.0625, -55.201171875, -53.33984375, -51.478515625, -49.6171875, -47.755859375, -45.89453125, -44.033203125, -42.171875, -40.310546875, -38.44921875, -36.587890625, -34.7265625, -32.865234375, -31.00390625, -29.142578125, -27.28125, -25.419921875, -23.55859375, -21.697265625, -19.8359375, -17.974609375, -16.11328125, -14.251953125, -12.390625, -10.529296875, -8.66796875, -6.806640625, -4.9453125, -3.083984375, -1.22265625, 0.638671875, 2.5, 4.361328125, 6.22265625, 8.083984375, 9.9453125, 11.806640625, 13.66796875, 15.529296875, 17.390625, 19.251953125, 21.11328125, 22.974609375, 24.8359375, 26.697265625, 28.55859375, 30.419921875, 32.28125, 34.142578125, 36.00390625, 37.865234375, 39.7265625, 41.587890625, 43.44921875, 45.310546875, 47.171875, 49.033203125, 50.89453125, 52.755859375, 54.6171875, 56.478515625, 58.33984375, 60.201171875, 62.0625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 8.0, 16.0, 13.0, 21.0, 28.0, 26.0, 27.0, 38.0, 45.0, 47.0, 56.0, 71.0, 64.0, 61.0, 60.0, 52.0, 40.0, 53.0, 46.0, 39.0, 35.0, 28.0, 31.0, 21.0, 15.0, 11.0, 11.0, 5.0, 2.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.421875, -18.8712158203125, -18.320556640625, -17.7698974609375, -17.21923828125, -16.6685791015625, -16.117919921875, -15.5672607421875, -15.0166015625, -14.4659423828125, -13.915283203125, -13.3646240234375, -12.81396484375, -12.2633056640625, -11.712646484375, -11.1619873046875, -10.611328125, -10.0606689453125, -9.510009765625, -8.9593505859375, -8.40869140625, -7.8580322265625, -7.307373046875, -6.7567138671875, -6.2060546875, -5.6553955078125, -5.104736328125, -4.5540771484375, -4.00341796875, -3.4527587890625, -2.902099609375, -2.3514404296875, -1.80078125, -1.2501220703125, -0.699462890625, -0.1488037109375, 0.40185546875, 0.9525146484375, 1.503173828125, 2.0538330078125, 2.6044921875, 3.1551513671875, 3.705810546875, 4.2564697265625, 4.80712890625, 5.3577880859375, 5.908447265625, 6.4591064453125, 7.009765625, 7.5604248046875, 8.111083984375, 8.6617431640625, 9.21240234375, 9.7630615234375, 10.313720703125, 10.8643798828125, 11.4150390625, 11.9656982421875, 12.516357421875, 13.0670166015625, 13.61767578125, 14.1683349609375, 14.718994140625, 15.2696533203125, 15.8203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 9.0, 10.0, 13.0, 19.0, 26.0, 31.0, 49.0, 70.0, 101.0, 117.0, 131.0, 200.0, 288.0, 442.0, 634.0, 1163.0, 2550.0, 7259.0, 30900.0, 214365.0, 637868.0, 122042.0, 19998.0, 5224.0, 2059.0, 987.0, 595.0, 375.0, 268.0, 220.0, 131.0, 84.0, 74.0, 54.0, 48.0, 45.0, 19.0, 17.0, 12.0, 10.0, 8.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-102.25, -99.185546875, -96.12109375, -93.056640625, -89.9921875, -86.927734375, -83.86328125, -80.798828125, -77.734375, -74.669921875, -71.60546875, -68.541015625, -65.4765625, -62.412109375, -59.34765625, -56.283203125, -53.21875, -50.154296875, -47.08984375, -44.025390625, -40.9609375, -37.896484375, -34.83203125, -31.767578125, -28.703125, -25.638671875, -22.57421875, -19.509765625, -16.4453125, -13.380859375, -10.31640625, -7.251953125, -4.1875, -1.123046875, 1.94140625, 5.005859375, 8.0703125, 11.134765625, 14.19921875, 17.263671875, 20.328125, 23.392578125, 26.45703125, 29.521484375, 32.5859375, 35.650390625, 38.71484375, 41.779296875, 44.84375, 47.908203125, 50.97265625, 54.037109375, 57.1015625, 60.166015625, 63.23046875, 66.294921875, 69.359375, 72.423828125, 75.48828125, 78.552734375, 81.6171875, 84.681640625, 87.74609375, 90.810546875, 93.875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 13.0, 7.0, 17.0, 13.0, 29.0, 32.0, 28.0, 35.0, 45.0, 28.0, 32.0, 34.0, 44.0, 56.0, 40.0, 48.0, 54.0, 39.0, 34.0, 39.0, 46.0, 27.0, 35.0, 24.0, 33.0, 22.0, 18.0, 23.0, 15.0, 14.0, 11.0, 9.0, 7.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-71.0625, -69.005859375, -66.94921875, -64.892578125, -62.8359375, -60.779296875, -58.72265625, -56.666015625, -54.609375, -52.552734375, -50.49609375, -48.439453125, -46.3828125, -44.326171875, -42.26953125, -40.212890625, -38.15625, -36.099609375, -34.04296875, -31.986328125, -29.9296875, -27.873046875, -25.81640625, -23.759765625, -21.703125, -19.646484375, -17.58984375, -15.533203125, -13.4765625, -11.419921875, -9.36328125, -7.306640625, -5.25, -3.193359375, -1.13671875, 0.919921875, 2.9765625, 5.033203125, 7.08984375, 9.146484375, 11.203125, 13.259765625, 15.31640625, 17.373046875, 19.4296875, 21.486328125, 23.54296875, 25.599609375, 27.65625, 29.712890625, 31.76953125, 33.826171875, 35.8828125, 37.939453125, 39.99609375, 42.052734375, 44.109375, 46.166015625, 48.22265625, 50.279296875, 52.3359375, 54.392578125, 56.44921875, 58.505859375, 60.5625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 2.0, 3.0, 8.0, 6.0, 16.0, 14.0, 21.0, 28.0, 43.0, 66.0, 97.0, 149.0, 251.0, 532.0, 1030.0, 2347.0, 6248.0, 19604.0, 117735.0, 797957.0, 77617.0, 15470.0, 5274.0, 2047.0, 849.0, 463.0, 244.0, 137.0, 101.0, 71.0, 39.0, 27.0, 12.0, 13.0, 9.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-73.75, -71.66748046875, -69.5849609375, -67.50244140625, -65.419921875, -63.33740234375, -61.2548828125, -59.17236328125, -57.08984375, -55.00732421875, -52.9248046875, -50.84228515625, -48.759765625, -46.67724609375, -44.5947265625, -42.51220703125, -40.4296875, -38.34716796875, -36.2646484375, -34.18212890625, -32.099609375, -30.01708984375, -27.9345703125, -25.85205078125, -23.76953125, -21.68701171875, -19.6044921875, -17.52197265625, -15.439453125, -13.35693359375, -11.2744140625, -9.19189453125, -7.109375, -5.02685546875, -2.9443359375, -0.86181640625, 1.220703125, 3.30322265625, 5.3857421875, 7.46826171875, 9.55078125, 11.63330078125, 13.7158203125, 15.79833984375, 17.880859375, 19.96337890625, 22.0458984375, 24.12841796875, 26.2109375, 28.29345703125, 30.3759765625, 32.45849609375, 34.541015625, 36.62353515625, 38.7060546875, 40.78857421875, 42.87109375, 44.95361328125, 47.0361328125, 49.11865234375, 51.201171875, 53.28369140625, 55.3662109375, 57.44873046875, 59.53125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 6.0, 9.0, 10.0, 8.0, 13.0, 25.0, 46.0, 52.0, 56.0, 62.0, 101.0, 105.0, 108.0, 91.0, 59.0, 56.0, 35.0, 45.0, 22.0, 10.0, 15.0, 8.0, 9.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.004180908203125, -0.004057109355926514, -0.003933310508728027, -0.003809511661529541, -0.0036857128143310547, -0.0035619139671325684, -0.003438115119934082, -0.0033143162727355957, -0.0031905174255371094, -0.003066718578338623, -0.0029429197311401367, -0.0028191208839416504, -0.002695322036743164, -0.0025715231895446777, -0.0024477243423461914, -0.002323925495147705, -0.0022001266479492188, -0.0020763278007507324, -0.001952528953552246, -0.0018287301063537598, -0.0017049312591552734, -0.0015811324119567871, -0.0014573335647583008, -0.0013335347175598145, -0.0012097358703613281, -0.0010859370231628418, -0.0009621381759643555, -0.0008383393287658691, -0.0007145404815673828, -0.0005907416343688965, -0.00046694278717041016, -0.00034314393997192383, -0.0002193450927734375, -9.554624557495117e-05, 2.8252601623535156e-05, 0.00015205144882202148, 0.0002758502960205078, 0.00039964914321899414, 0.0005234479904174805, 0.0006472468376159668, 0.0007710456848144531, 0.0008948445320129395, 0.0010186433792114258, 0.0011424422264099121, 0.0012662410736083984, 0.0013900399208068848, 0.001513838768005371, 0.0016376376152038574, 0.0017614364624023438, 0.00188523530960083, 0.0020090341567993164, 0.0021328330039978027, 0.002256631851196289, 0.0023804306983947754, 0.0025042295455932617, 0.002628028392791748, 0.0027518272399902344, 0.0028756260871887207, 0.002999424934387207, 0.0031232237815856934, 0.0032470226287841797, 0.003370821475982666, 0.0034946203231811523, 0.0036184191703796387, 0.003742218017578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 10.0, 7.0, 11.0, 21.0, 22.0, 44.0, 65.0, 114.0, 180.0, 450.0, 1263.0, 5866.0, 69209.0, 935269.0, 30582.0, 3771.0, 929.0, 336.0, 139.0, 102.0, 64.0, 29.0, 15.0, 17.0, 15.0, 6.0, 9.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.5625, -121.9091796875, -118.255859375, -114.6025390625, -110.94921875, -107.2958984375, -103.642578125, -99.9892578125, -96.3359375, -92.6826171875, -89.029296875, -85.3759765625, -81.72265625, -78.0693359375, -74.416015625, -70.7626953125, -67.109375, -63.4560546875, -59.802734375, -56.1494140625, -52.49609375, -48.8427734375, -45.189453125, -41.5361328125, -37.8828125, -34.2294921875, -30.576171875, -26.9228515625, -23.26953125, -19.6162109375, -15.962890625, -12.3095703125, -8.65625, -5.0029296875, -1.349609375, 2.3037109375, 5.95703125, 9.6103515625, 13.263671875, 16.9169921875, 20.5703125, 24.2236328125, 27.876953125, 31.5302734375, 35.18359375, 38.8369140625, 42.490234375, 46.1435546875, 49.796875, 53.4501953125, 57.103515625, 60.7568359375, 64.41015625, 68.0634765625, 71.716796875, 75.3701171875, 79.0234375, 82.6767578125, 86.330078125, 89.9833984375, 93.63671875, 97.2900390625, 100.943359375, 104.5966796875, 108.25]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 6.0, 15.0, 14.0, 26.0, 32.0, 79.0, 121.0, 201.0, 177.0, 122.0, 79.0, 27.0, 18.0, 15.0, 12.0, 12.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.0, -70.10009765625, -68.2001953125, -66.30029296875, -64.400390625, -62.50048828125, -60.6005859375, -58.70068359375, -56.80078125, -54.90087890625, -53.0009765625, -51.10107421875, -49.201171875, -47.30126953125, -45.4013671875, -43.50146484375, -41.6015625, -39.70166015625, -37.8017578125, -35.90185546875, -34.001953125, -32.10205078125, -30.2021484375, -28.30224609375, -26.40234375, -24.50244140625, -22.6025390625, -20.70263671875, -18.802734375, -16.90283203125, -15.0029296875, -13.10302734375, -11.203125, -9.30322265625, -7.4033203125, -5.50341796875, -3.603515625, -1.70361328125, 0.1962890625, 2.09619140625, 3.99609375, 5.89599609375, 7.7958984375, 9.69580078125, 11.595703125, 13.49560546875, 15.3955078125, 17.29541015625, 19.1953125, 21.09521484375, 22.9951171875, 24.89501953125, 26.794921875, 28.69482421875, 30.5947265625, 32.49462890625, 34.39453125, 36.29443359375, 38.1943359375, 40.09423828125, 41.994140625, 43.89404296875, 45.7939453125, 47.69384765625, 49.59375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 25.0, 118.0, 611.0, 225.0, 14.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3334.91552734375, -3246.25830078125, -3157.60107421875, -3068.94384765625, -2980.28662109375, -2891.62939453125, -2802.97216796875, -2714.31494140625, -2625.65771484375, -2537.00048828125, -2448.34326171875, -2359.68603515625, -2271.02880859375, -2182.37158203125, -2093.71435546875, -2005.0572509765625, -1916.400146484375, -1827.742919921875, -1739.085693359375, -1650.428466796875, -1561.771240234375, -1473.114013671875, -1384.4569091796875, -1295.7996826171875, -1207.1424560546875, -1118.4852294921875, -1029.8280029296875, -941.1708374023438, -852.5136108398438, -763.8563842773438, -675.19921875, -586.5419921875, -497.884521484375, -409.227294921875, -320.5700988769531, -231.91290283203125, -143.25567626953125, -54.59844970703125, 34.0587158203125, 122.7159423828125, 211.3731689453125, 300.0303955078125, 388.6875915527344, 477.34478759765625, 566.0020141601562, 654.6592407226562, 743.31640625, 831.9736328125, 920.630859375, 1009.2880859375, 1097.9453125, 1186.6025390625, 1275.259765625, 1363.9169921875, 1452.5740966796875, 1541.2313232421875, 1629.8885498046875, 1718.5457763671875, 1807.2030029296875, 1895.860107421875, 1984.517333984375, 2073.174560546875, 2161.831787109375, 2250.489013671875, 2339.146240234375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 3.0, 5.0, 9.0, 11.0, 20.0, 20.0, 13.0, 22.0, 18.0, 18.0, 30.0, 46.0, 37.0, 38.0, 61.0, 39.0, 52.0, 44.0, 51.0, 38.0, 41.0, 36.0, 45.0, 36.0, 41.0, 37.0, 31.0, 23.0, 20.0, 15.0, 18.0, 17.0, 18.0, 8.0, 6.0, 5.0, 10.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.515380859375, -387.03643798828125, -373.5575256347656, -360.0785827636719, -346.5996398925781, -333.1207275390625, -319.64178466796875, -306.162841796875, -292.68389892578125, -279.2049560546875, -265.7260437011719, -252.24710083007812, -238.76815795898438, -225.2892303466797, -211.810302734375, -198.33135986328125, -184.85243225097656, -171.37350463867188, -157.89456176757812, -144.41563415527344, -130.9366912841797, -117.457763671875, -103.97882843017578, -90.49989318847656, -77.02095794677734, -63.542022705078125, -50.063087463378906, -36.58415603637695, -23.105220794677734, -9.626289367675781, 3.8526458740234375, 17.331581115722656, 30.810516357421875, 44.289451599121094, 57.76838684082031, 71.247314453125, 84.72625732421875, 98.20518493652344, 111.68412017822266, 125.16305541992188, 138.64199829101562, 152.1209259033203, 165.59986877441406, 179.07879638671875, 192.5577392578125, 206.0366668701172, 219.51559448242188, 232.99453735351562, 246.4734649658203, 259.952392578125, 273.43133544921875, 286.9102783203125, 300.3891906738281, 313.8681335449219, 327.3470764160156, 340.82598876953125, 354.304931640625, 367.78387451171875, 381.2627868652344, 394.7417297363281, 408.2206726074219, 421.6995849609375, 435.17852783203125, 448.657470703125, 462.13641357421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 13.0, 20.0, 43.0, 88.0, 141.0, 315.0, 638.0, 1769.0, 4570.0, 17028.0, 142159.0, 3902585.0, 104270.0, 14497.0, 3800.0, 1278.0, 524.0, 245.0, 134.0, 62.0, 37.0, 20.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.375, -95.6171875, -91.859375, -88.1015625, -84.34375, -80.5859375, -76.828125, -73.0703125, -69.3125, -65.5546875, -61.796875, -58.0390625, -54.28125, -50.5234375, -46.765625, -43.0078125, -39.25, -35.4921875, -31.734375, -27.9765625, -24.21875, -20.4609375, -16.703125, -12.9453125, -9.1875, -5.4296875, -1.671875, 2.0859375, 5.84375, 9.6015625, 13.359375, 17.1171875, 20.875, 24.6328125, 28.390625, 32.1484375, 35.90625, 39.6640625, 43.421875, 47.1796875, 50.9375, 54.6953125, 58.453125, 62.2109375, 65.96875, 69.7265625, 73.484375, 77.2421875, 81.0, 84.7578125, 88.515625, 92.2734375, 96.03125, 99.7890625, 103.546875, 107.3046875, 111.0625, 114.8203125, 118.578125, 122.3359375, 126.09375, 129.8515625, 133.609375, 137.3671875, 141.125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 11.0, 6.0, 8.0, 19.0, 18.0, 23.0, 21.0, 16.0, 24.0, 30.0, 42.0, 36.0, 36.0, 47.0, 39.0, 61.0, 46.0, 47.0, 48.0, 30.0, 49.0, 41.0, 28.0, 34.0, 29.0, 24.0, 38.0, 26.0, 15.0, 21.0, 22.0, 11.0, 8.0, 10.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.3046875, -14.7930908203125, -14.281494140625, -13.7698974609375, -13.25830078125, -12.7467041015625, -12.235107421875, -11.7235107421875, -11.2119140625, -10.7003173828125, -10.188720703125, -9.6771240234375, -9.16552734375, -8.6539306640625, -8.142333984375, -7.6307373046875, -7.119140625, -6.6075439453125, -6.095947265625, -5.5843505859375, -5.07275390625, -4.5611572265625, -4.049560546875, -3.5379638671875, -3.0263671875, -2.5147705078125, -2.003173828125, -1.4915771484375, -0.97998046875, -0.4683837890625, 0.043212890625, 0.5548095703125, 1.06640625, 1.5780029296875, 2.089599609375, 2.6011962890625, 3.11279296875, 3.6243896484375, 4.135986328125, 4.6475830078125, 5.1591796875, 5.6707763671875, 6.182373046875, 6.6939697265625, 7.20556640625, 7.7171630859375, 8.228759765625, 8.7403564453125, 9.251953125, 9.7635498046875, 10.275146484375, 10.7867431640625, 11.29833984375, 11.8099365234375, 12.321533203125, 12.8331298828125, 13.3447265625, 13.8563232421875, 14.367919921875, 14.8795166015625, 15.39111328125, 15.9027099609375, 16.414306640625, 16.9259033203125, 17.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 22.0, 21.0, 44.0, 72.0, 150.0, 298.0, 709.0, 1803.0, 5177.0, 22977.0, 381794.0, 3703236.0, 63205.0, 9682.0, 2994.0, 1121.0, 482.0, 216.0, 115.0, 57.0, 26.0, 20.0, 12.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.4375, -90.2412109375, -87.044921875, -83.8486328125, -80.65234375, -77.4560546875, -74.259765625, -71.0634765625, -67.8671875, -64.6708984375, -61.474609375, -58.2783203125, -55.08203125, -51.8857421875, -48.689453125, -45.4931640625, -42.296875, -39.1005859375, -35.904296875, -32.7080078125, -29.51171875, -26.3154296875, -23.119140625, -19.9228515625, -16.7265625, -13.5302734375, -10.333984375, -7.1376953125, -3.94140625, -0.7451171875, 2.451171875, 5.6474609375, 8.84375, 12.0400390625, 15.236328125, 18.4326171875, 21.62890625, 24.8251953125, 28.021484375, 31.2177734375, 34.4140625, 37.6103515625, 40.806640625, 44.0029296875, 47.19921875, 50.3955078125, 53.591796875, 56.7880859375, 59.984375, 63.1806640625, 66.376953125, 69.5732421875, 72.76953125, 75.9658203125, 79.162109375, 82.3583984375, 85.5546875, 88.7509765625, 91.947265625, 95.1435546875, 98.33984375, 101.5361328125, 104.732421875, 107.9287109375, 111.125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 16.0, 20.0, 31.0, 60.0, 94.0, 156.0, 445.0, 1958.0, 727.0, 229.0, 128.0, 63.0, 39.0, 22.0, 11.0, 12.0, 8.0, 7.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -27.879150390625, -26.64892578125, -25.418701171875, -24.1884765625, -22.958251953125, -21.72802734375, -20.497802734375, -19.267578125, -18.037353515625, -16.80712890625, -15.576904296875, -14.3466796875, -13.116455078125, -11.88623046875, -10.656005859375, -9.42578125, -8.195556640625, -6.96533203125, -5.735107421875, -4.5048828125, -3.274658203125, -2.04443359375, -0.814208984375, 0.416015625, 1.646240234375, 2.87646484375, 4.106689453125, 5.3369140625, 6.567138671875, 7.79736328125, 9.027587890625, 10.2578125, 11.488037109375, 12.71826171875, 13.948486328125, 15.1787109375, 16.408935546875, 17.63916015625, 18.869384765625, 20.099609375, 21.329833984375, 22.56005859375, 23.790283203125, 25.0205078125, 26.250732421875, 27.48095703125, 28.711181640625, 29.94140625, 31.171630859375, 32.40185546875, 33.632080078125, 34.8623046875, 36.092529296875, 37.32275390625, 38.552978515625, 39.783203125, 41.013427734375, 42.24365234375, 43.473876953125, 44.7041015625, 45.934326171875, 47.16455078125, 48.394775390625, 49.625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 35.0, 139.0, 306.0, 290.0, 142.0, 37.0, 19.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-218.39405822753906, -206.19766235351562, -194.0012664794922, -181.80487060546875, -169.60845947265625, -157.41207885742188, -145.21566772460938, -133.01927185058594, -120.8228759765625, -108.62648010253906, -96.43008422851562, -84.23368072509766, -72.03728485107422, -59.84088897705078, -47.64448547363281, -35.448089599609375, -23.251693725585938, -11.055295944213867, 1.1411018371582031, 13.337501525878906, 25.533897399902344, 37.73029327392578, 49.92669677734375, 62.12309265136719, 74.31948852539062, 86.51588439941406, 98.7122802734375, 110.90868377685547, 123.1050796508789, 135.30148315429688, 147.4978790283203, 159.69427490234375, 171.89068603515625, 184.0870819091797, 196.28347778320312, 208.47988891601562, 220.67626953125, 232.8726806640625, 245.06907653808594, 257.2654724121094, 269.46185302734375, 281.65826416015625, 293.8546447753906, 306.0510559082031, 318.2474365234375, 330.44384765625, 342.6402587890625, 354.8366394042969, 367.0330505371094, 379.2294616699219, 391.42584228515625, 403.62225341796875, 415.8186340332031, 428.0150451660156, 440.21142578125, 452.4078369140625, 464.604248046875, 476.8006591796875, 488.9970397949219, 501.1934509277344, 513.3898315429688, 525.5862426757812, 537.7826538085938, 549.97900390625, 562.1754150390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 5.0, 6.0, 12.0, 16.0, 20.0, 31.0, 21.0, 29.0, 50.0, 54.0, 55.0, 49.0, 51.0, 59.0, 47.0, 65.0, 62.0, 55.0, 43.0, 56.0, 35.0, 33.0, 27.0, 25.0, 18.0, 16.0, 15.0, 11.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.82026672363281, -110.4427719116211, -106.06526947021484, -101.68777465820312, -97.31027221679688, -92.93277740478516, -88.55528259277344, -84.17778015136719, -79.80028533935547, -75.42279052734375, -71.0452880859375, -66.66779327392578, -62.2902946472168, -57.91279602050781, -53.535301208496094, -49.15780258178711, -44.780303955078125, -40.40280532836914, -36.025306701660156, -31.647811889648438, -27.270313262939453, -22.89281463623047, -18.515317916870117, -14.137821197509766, -9.760322570800781, -5.382824897766113, -1.0053272247314453, 3.3721704483032227, 7.749668121337891, 12.127166748046875, 16.504663467407227, 20.882160186767578, 25.259658813476562, 29.637157440185547, 34.01465606689453, 38.39215087890625, 42.769649505615234, 47.14714813232422, 51.52464294433594, 55.90214157104492, 60.279640197753906, 64.65713500976562, 69.03463745117188, 73.4121322631836, 77.78962707519531, 82.16712951660156, 86.54462432861328, 90.922119140625, 95.29962158203125, 99.67711639404297, 104.05461883544922, 108.43211364746094, 112.80961608886719, 117.1871109008789, 121.56460571289062, 125.94210815429688, 130.31961059570312, 134.69711303710938, 139.07460021972656, 143.4521026611328, 147.82960510253906, 152.20709228515625, 156.5845947265625, 160.96209716796875, 165.33958435058594]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 9.0, 9.0, 14.0, 16.0, 20.0, 33.0, 59.0, 84.0, 120.0, 172.0, 277.0, 462.0, 726.0, 1386.0, 2513.0, 5551.0, 13148.0, 35223.0, 124288.0, 517001.0, 250837.0, 60333.0, 20012.0, 8162.0, 3735.0, 1841.0, 934.0, 546.0, 333.0, 228.0, 160.0, 103.0, 64.0, 46.0, 32.0, 21.0, 16.0, 6.0, 4.0, 10.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-87.5, -84.98046875, -82.4609375, -79.94140625, -77.421875, -74.90234375, -72.3828125, -69.86328125, -67.34375, -64.82421875, -62.3046875, -59.78515625, -57.265625, -54.74609375, -52.2265625, -49.70703125, -47.1875, -44.66796875, -42.1484375, -39.62890625, -37.109375, -34.58984375, -32.0703125, -29.55078125, -27.03125, -24.51171875, -21.9921875, -19.47265625, -16.953125, -14.43359375, -11.9140625, -9.39453125, -6.875, -4.35546875, -1.8359375, 0.68359375, 3.203125, 5.72265625, 8.2421875, 10.76171875, 13.28125, 15.80078125, 18.3203125, 20.83984375, 23.359375, 25.87890625, 28.3984375, 30.91796875, 33.4375, 35.95703125, 38.4765625, 40.99609375, 43.515625, 46.03515625, 48.5546875, 51.07421875, 53.59375, 56.11328125, 58.6328125, 61.15234375, 63.671875, 66.19140625, 68.7109375, 71.23046875, 73.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 8.0, 7.0, 12.0, 16.0, 27.0, 19.0, 24.0, 35.0, 39.0, 43.0, 44.0, 43.0, 63.0, 58.0, 55.0, 55.0, 64.0, 45.0, 42.0, 56.0, 36.0, 36.0, 35.0, 16.0, 26.0, 18.0, 21.0, 15.0, 14.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.298583984375, -16.67529296875, -16.052001953125, -15.4287109375, -14.805419921875, -14.18212890625, -13.558837890625, -12.935546875, -12.312255859375, -11.68896484375, -11.065673828125, -10.4423828125, -9.819091796875, -9.19580078125, -8.572509765625, -7.94921875, -7.325927734375, -6.70263671875, -6.079345703125, -5.4560546875, -4.832763671875, -4.20947265625, -3.586181640625, -2.962890625, -2.339599609375, -1.71630859375, -1.093017578125, -0.4697265625, 0.153564453125, 0.77685546875, 1.400146484375, 2.0234375, 2.646728515625, 3.27001953125, 3.893310546875, 4.5166015625, 5.139892578125, 5.76318359375, 6.386474609375, 7.009765625, 7.633056640625, 8.25634765625, 8.879638671875, 9.5029296875, 10.126220703125, 10.74951171875, 11.372802734375, 11.99609375, 12.619384765625, 13.24267578125, 13.865966796875, 14.4892578125, 15.112548828125, 15.73583984375, 16.359130859375, 16.982421875, 17.605712890625, 18.22900390625, 18.852294921875, 19.4755859375, 20.098876953125, 20.72216796875, 21.345458984375, 21.96875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 7.0, 5.0, 16.0, 19.0, 27.0, 36.0, 44.0, 57.0, 66.0, 100.0, 160.0, 255.0, 306.0, 495.0, 846.0, 1757.0, 4828.0, 22183.0, 200866.0, 729007.0, 70161.0, 10992.0, 3056.0, 1237.0, 647.0, 404.0, 276.0, 184.0, 142.0, 100.0, 68.0, 56.0, 35.0, 32.0, 21.0, 18.0, 15.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-148.0, -143.68359375, -139.3671875, -135.05078125, -130.734375, -126.41796875, -122.1015625, -117.78515625, -113.46875, -109.15234375, -104.8359375, -100.51953125, -96.203125, -91.88671875, -87.5703125, -83.25390625, -78.9375, -74.62109375, -70.3046875, -65.98828125, -61.671875, -57.35546875, -53.0390625, -48.72265625, -44.40625, -40.08984375, -35.7734375, -31.45703125, -27.140625, -22.82421875, -18.5078125, -14.19140625, -9.875, -5.55859375, -1.2421875, 3.07421875, 7.390625, 11.70703125, 16.0234375, 20.33984375, 24.65625, 28.97265625, 33.2890625, 37.60546875, 41.921875, 46.23828125, 50.5546875, 54.87109375, 59.1875, 63.50390625, 67.8203125, 72.13671875, 76.453125, 80.76953125, 85.0859375, 89.40234375, 93.71875, 98.03515625, 102.3515625, 106.66796875, 110.984375, 115.30078125, 119.6171875, 123.93359375, 128.25]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 8.0, 7.0, 9.0, 14.0, 9.0, 24.0, 17.0, 40.0, 31.0, 48.0, 45.0, 49.0, 61.0, 59.0, 43.0, 47.0, 49.0, 61.0, 43.0, 59.0, 42.0, 48.0, 29.0, 33.0, 29.0, 15.0, 20.0, 11.0, 18.0, 4.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-97.5, -94.572265625, -91.64453125, -88.716796875, -85.7890625, -82.861328125, -79.93359375, -77.005859375, -74.078125, -71.150390625, -68.22265625, -65.294921875, -62.3671875, -59.439453125, -56.51171875, -53.583984375, -50.65625, -47.728515625, -44.80078125, -41.873046875, -38.9453125, -36.017578125, -33.08984375, -30.162109375, -27.234375, -24.306640625, -21.37890625, -18.451171875, -15.5234375, -12.595703125, -9.66796875, -6.740234375, -3.8125, -0.884765625, 2.04296875, 4.970703125, 7.8984375, 10.826171875, 13.75390625, 16.681640625, 19.609375, 22.537109375, 25.46484375, 28.392578125, 31.3203125, 34.248046875, 37.17578125, 40.103515625, 43.03125, 45.958984375, 48.88671875, 51.814453125, 54.7421875, 57.669921875, 60.59765625, 63.525390625, 66.453125, 69.380859375, 72.30859375, 75.236328125, 78.1640625, 81.091796875, 84.01953125, 86.947265625, 89.875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 9.0, 10.0, 27.0, 32.0, 77.0, 142.0, 434.0, 1718.0, 19466.0, 1002752.0, 21312.0, 1793.0, 457.0, 156.0, 70.0, 36.0, 16.0, 15.0, 14.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.375, -221.330078125, -213.28515625, -205.240234375, -197.1953125, -189.150390625, -181.10546875, -173.060546875, -165.015625, -156.970703125, -148.92578125, -140.880859375, -132.8359375, -124.791015625, -116.74609375, -108.701171875, -100.65625, -92.611328125, -84.56640625, -76.521484375, -68.4765625, -60.431640625, -52.38671875, -44.341796875, -36.296875, -28.251953125, -20.20703125, -12.162109375, -4.1171875, 3.927734375, 11.97265625, 20.017578125, 28.0625, 36.107421875, 44.15234375, 52.197265625, 60.2421875, 68.287109375, 76.33203125, 84.376953125, 92.421875, 100.466796875, 108.51171875, 116.556640625, 124.6015625, 132.646484375, 140.69140625, 148.736328125, 156.78125, 164.826171875, 172.87109375, 180.916015625, 188.9609375, 197.005859375, 205.05078125, 213.095703125, 221.140625, 229.185546875, 237.23046875, 245.275390625, 253.3203125, 261.365234375, 269.41015625, 277.455078125, 285.5]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 29.0, 33.0, 126.0, 298.0, 297.0, 115.0, 46.0, 19.0, 6.0, 3.0, 7.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00786590576171875, -0.007452130317687988, -0.0070383548736572266, -0.006624579429626465, -0.006210803985595703, -0.005797028541564941, -0.00538325309753418, -0.004969477653503418, -0.004555702209472656, -0.0041419267654418945, -0.003728151321411133, -0.003314375877380371, -0.0029006004333496094, -0.0024868249893188477, -0.002073049545288086, -0.0016592741012573242, -0.0012454986572265625, -0.0008317232131958008, -0.00041794776916503906, -4.172325134277344e-06, 0.0004096031188964844, 0.0008233785629272461, 0.0012371540069580078, 0.0016509294509887695, 0.0020647048950195312, 0.002478480339050293, 0.0028922557830810547, 0.0033060312271118164, 0.003719806671142578, 0.00413358211517334, 0.0045473575592041016, 0.004961133003234863, 0.005374908447265625, 0.005788683891296387, 0.0062024593353271484, 0.00661623477935791, 0.007030010223388672, 0.007443785667419434, 0.007857561111450195, 0.008271336555480957, 0.008685111999511719, 0.00909888744354248, 0.009512662887573242, 0.009926438331604004, 0.010340213775634766, 0.010753989219665527, 0.011167764663696289, 0.01158154010772705, 0.011995315551757812, 0.012409090995788574, 0.012822866439819336, 0.013236641883850098, 0.01365041732788086, 0.014064192771911621, 0.014477968215942383, 0.014891743659973145, 0.015305519104003906, 0.015719294548034668, 0.01613306999206543, 0.01654684543609619, 0.016960620880126953, 0.017374396324157715, 0.017788171768188477, 0.01820194721221924, 0.01861572265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 6.0, 10.0, 19.0, 25.0, 58.0, 94.0, 248.0, 607.0, 2597.0, 63546.0, 971140.0, 8379.0, 1105.0, 366.0, 175.0, 68.0, 40.0, 21.0, 13.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-200.75, -193.642578125, -186.53515625, -179.427734375, -172.3203125, -165.212890625, -158.10546875, -150.998046875, -143.890625, -136.783203125, -129.67578125, -122.568359375, -115.4609375, -108.353515625, -101.24609375, -94.138671875, -87.03125, -79.923828125, -72.81640625, -65.708984375, -58.6015625, -51.494140625, -44.38671875, -37.279296875, -30.171875, -23.064453125, -15.95703125, -8.849609375, -1.7421875, 5.365234375, 12.47265625, 19.580078125, 26.6875, 33.794921875, 40.90234375, 48.009765625, 55.1171875, 62.224609375, 69.33203125, 76.439453125, 83.546875, 90.654296875, 97.76171875, 104.869140625, 111.9765625, 119.083984375, 126.19140625, 133.298828125, 140.40625, 147.513671875, 154.62109375, 161.728515625, 168.8359375, 175.943359375, 183.05078125, 190.158203125, 197.265625, 204.373046875, 211.48046875, 218.587890625, 225.6953125, 232.802734375, 239.91015625, 247.017578125, 254.125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 9.0, 13.0, 29.0, 49.0, 125.0, 295.0, 261.0, 108.0, 47.0, 27.0, 16.0, 12.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.6875, -104.1416015625, -99.595703125, -95.0498046875, -90.50390625, -85.9580078125, -81.412109375, -76.8662109375, -72.3203125, -67.7744140625, -63.228515625, -58.6826171875, -54.13671875, -49.5908203125, -45.044921875, -40.4990234375, -35.953125, -31.4072265625, -26.861328125, -22.3154296875, -17.76953125, -13.2236328125, -8.677734375, -4.1318359375, 0.4140625, 4.9599609375, 9.505859375, 14.0517578125, 18.59765625, 23.1435546875, 27.689453125, 32.2353515625, 36.78125, 41.3271484375, 45.873046875, 50.4189453125, 54.96484375, 59.5107421875, 64.056640625, 68.6025390625, 73.1484375, 77.6943359375, 82.240234375, 86.7861328125, 91.33203125, 95.8779296875, 100.423828125, 104.9697265625, 109.515625, 114.0615234375, 118.607421875, 123.1533203125, 127.69921875, 132.2451171875, 136.791015625, 141.3369140625, 145.8828125, 150.4287109375, 154.974609375, 159.5205078125, 164.06640625, 168.6123046875, 173.158203125, 177.7041015625, 182.25]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 14.0, 32.0, 110.0, 319.0, 321.0, 133.0, 41.0, 16.0, 10.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2501.990234375, -2452.849853515625, -2403.709228515625, -2354.56884765625, -2305.42822265625, -2256.287841796875, -2207.1474609375, -2158.0068359375, -2108.866455078125, -2059.72607421875, -2010.58544921875, -1961.445068359375, -1912.3045654296875, -1863.1640625, -1814.023681640625, -1764.8831787109375, -1715.74267578125, -1666.6021728515625, -1617.461669921875, -1568.3212890625, -1519.1807861328125, -1470.040283203125, -1420.89990234375, -1371.7593994140625, -1322.618896484375, -1273.4783935546875, -1224.337890625, -1175.197509765625, -1126.0570068359375, -1076.91650390625, -1027.776123046875, -978.6356201171875, -929.4950561523438, -880.3546142578125, -831.214111328125, -782.0736083984375, -732.9331665039062, -683.792724609375, -634.6522216796875, -585.51171875, -536.3712768554688, -487.2308044433594, -438.09033203125, -388.9498596191406, -339.80938720703125, -290.6689147949219, -241.5284423828125, -192.38796997070312, -143.24749755859375, -94.10702514648438, -44.966552734375, 4.173919677734375, 53.31439208984375, 102.45486450195312, 151.5953369140625, 200.73580932617188, 249.87628173828125, 299.0167541503906, 348.1572265625, 397.2976989746094, 446.43817138671875, 495.5786437988281, 544.7191162109375, 593.859619140625, 643.0000610351562]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 8.0, 6.0, 13.0, 12.0, 15.0, 19.0, 23.0, 24.0, 26.0, 21.0, 29.0, 33.0, 27.0, 29.0, 53.0, 42.0, 49.0, 39.0, 44.0, 50.0, 37.0, 34.0, 37.0, 43.0, 35.0, 33.0, 23.0, 25.0, 23.0, 17.0, 30.0, 18.0, 11.0, 8.0, 10.0, 11.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-404.33477783203125, -391.48724365234375, -378.63970947265625, -365.79217529296875, -352.94464111328125, -340.09710693359375, -327.24957275390625, -314.4020080566406, -301.5544738769531, -288.7069396972656, -275.8594055175781, -263.0118713378906, -250.16432189941406, -237.31678771972656, -224.46925354003906, -211.6217041015625, -198.77418518066406, -185.92665100097656, -173.07911682128906, -160.2315673828125, -147.384033203125, -134.5364990234375, -121.68896484375, -108.84142303466797, -95.99388885498047, -83.14635467529297, -70.29881286621094, -57.45127868652344, -44.60374069213867, -31.756202697753906, -18.908668518066406, -6.061126708984375, 6.786407470703125, 19.63394546508789, 32.481483459472656, 45.329017639160156, 58.17655563354492, 71.02409362792969, 83.87162780761719, 96.71916961669922, 109.56670379638672, 122.41423797607422, 135.26177978515625, 148.10931396484375, 160.95684814453125, 173.80438232421875, 186.65191650390625, 199.4994659423828, 212.3470001220703, 225.1945343017578, 238.0420684814453, 250.88961791992188, 263.7371520996094, 276.5846862792969, 289.4322204589844, 302.2797546386719, 315.1272888183594, 327.9748229980469, 340.8223571777344, 353.6698913574219, 366.5174255371094, 379.364990234375, 392.2125244140625, 405.06005859375, 417.9075927734375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 14.0, 15.0, 19.0, 21.0, 47.0, 81.0, 155.0, 309.0, 652.0, 1675.0, 4283.0, 13808.0, 76324.0, 3837052.0, 225060.0, 24582.0, 6431.0, 2094.0, 828.0, 392.0, 194.0, 101.0, 60.0, 32.0, 22.0, 6.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5625, -87.0380859375, -83.513671875, -79.9892578125, -76.46484375, -72.9404296875, -69.416015625, -65.8916015625, -62.3671875, -58.8427734375, -55.318359375, -51.7939453125, -48.26953125, -44.7451171875, -41.220703125, -37.6962890625, -34.171875, -30.6474609375, -27.123046875, -23.5986328125, -20.07421875, -16.5498046875, -13.025390625, -9.5009765625, -5.9765625, -2.4521484375, 1.072265625, 4.5966796875, 8.12109375, 11.6455078125, 15.169921875, 18.6943359375, 22.21875, 25.7431640625, 29.267578125, 32.7919921875, 36.31640625, 39.8408203125, 43.365234375, 46.8896484375, 50.4140625, 53.9384765625, 57.462890625, 60.9873046875, 64.51171875, 68.0361328125, 71.560546875, 75.0849609375, 78.609375, 82.1337890625, 85.658203125, 89.1826171875, 92.70703125, 96.2314453125, 99.755859375, 103.2802734375, 106.8046875, 110.3291015625, 113.853515625, 117.3779296875, 120.90234375, 124.4267578125, 127.951171875, 131.4755859375, 135.0]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 2.0, 5.0, 9.0, 14.0, 20.0, 17.0, 20.0, 21.0, 27.0, 32.0, 30.0, 27.0, 47.0, 59.0, 53.0, 45.0, 58.0, 67.0, 49.0, 54.0, 50.0, 48.0, 42.0, 32.0, 33.0, 30.0, 30.0, 13.0, 9.0, 13.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.402099609375, -18.72607421875, -18.050048828125, -17.3740234375, -16.697998046875, -16.02197265625, -15.345947265625, -14.669921875, -13.993896484375, -13.31787109375, -12.641845703125, -11.9658203125, -11.289794921875, -10.61376953125, -9.937744140625, -9.26171875, -8.585693359375, -7.90966796875, -7.233642578125, -6.5576171875, -5.881591796875, -5.20556640625, -4.529541015625, -3.853515625, -3.177490234375, -2.50146484375, -1.825439453125, -1.1494140625, -0.473388671875, 0.20263671875, 0.878662109375, 1.5546875, 2.230712890625, 2.90673828125, 3.582763671875, 4.2587890625, 4.934814453125, 5.61083984375, 6.286865234375, 6.962890625, 7.638916015625, 8.31494140625, 8.990966796875, 9.6669921875, 10.343017578125, 11.01904296875, 11.695068359375, 12.37109375, 13.047119140625, 13.72314453125, 14.399169921875, 15.0751953125, 15.751220703125, 16.42724609375, 17.103271484375, 17.779296875, 18.455322265625, 19.13134765625, 19.807373046875, 20.4833984375, 21.159423828125, 21.83544921875, 22.511474609375, 23.1875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 5.0, 11.0, 11.0, 17.0, 14.0, 30.0, 43.0, 76.0, 118.0, 249.0, 551.0, 1095.0, 2579.0, 6931.0, 23805.0, 147234.0, 3745458.0, 222596.0, 29558.0, 8156.0, 3059.0, 1297.0, 638.0, 320.0, 172.0, 94.0, 55.0, 34.0, 26.0, 14.0, 15.0, 6.0, 3.0, 7.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-76.3125, -73.732421875, -71.15234375, -68.572265625, -65.9921875, -63.412109375, -60.83203125, -58.251953125, -55.671875, -53.091796875, -50.51171875, -47.931640625, -45.3515625, -42.771484375, -40.19140625, -37.611328125, -35.03125, -32.451171875, -29.87109375, -27.291015625, -24.7109375, -22.130859375, -19.55078125, -16.970703125, -14.390625, -11.810546875, -9.23046875, -6.650390625, -4.0703125, -1.490234375, 1.08984375, 3.669921875, 6.25, 8.830078125, 11.41015625, 13.990234375, 16.5703125, 19.150390625, 21.73046875, 24.310546875, 26.890625, 29.470703125, 32.05078125, 34.630859375, 37.2109375, 39.791015625, 42.37109375, 44.951171875, 47.53125, 50.111328125, 52.69140625, 55.271484375, 57.8515625, 60.431640625, 63.01171875, 65.591796875, 68.171875, 70.751953125, 73.33203125, 75.912109375, 78.4921875, 81.072265625, 83.65234375, 86.232421875, 88.8125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 11.0, 8.0, 3.0, 15.0, 8.0, 13.0, 33.0, 45.0, 51.0, 87.0, 159.0, 346.0, 2023.0, 674.0, 265.0, 100.0, 76.0, 37.0, 26.0, 21.0, 21.0, 5.0, 11.0, 6.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.404541015625, -23.41845703125, -22.432373046875, -21.4462890625, -20.460205078125, -19.47412109375, -18.488037109375, -17.501953125, -16.515869140625, -15.52978515625, -14.543701171875, -13.5576171875, -12.571533203125, -11.58544921875, -10.599365234375, -9.61328125, -8.627197265625, -7.64111328125, -6.655029296875, -5.6689453125, -4.682861328125, -3.69677734375, -2.710693359375, -1.724609375, -0.738525390625, 0.24755859375, 1.233642578125, 2.2197265625, 3.205810546875, 4.19189453125, 5.177978515625, 6.1640625, 7.150146484375, 8.13623046875, 9.122314453125, 10.1083984375, 11.094482421875, 12.08056640625, 13.066650390625, 14.052734375, 15.038818359375, 16.02490234375, 17.010986328125, 17.9970703125, 18.983154296875, 19.96923828125, 20.955322265625, 21.94140625, 22.927490234375, 23.91357421875, 24.899658203125, 25.8857421875, 26.871826171875, 27.85791015625, 28.843994140625, 29.830078125, 30.816162109375, 31.80224609375, 32.788330078125, 33.7744140625, 34.760498046875, 35.74658203125, 36.732666015625, 37.71875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 10.0, 69.0, 524.0, 353.0, 35.0, 11.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-752.4171142578125, -729.530029296875, -706.6429443359375, -683.755859375, -660.8688354492188, -637.9817504882812, -615.0946655273438, -592.2075805664062, -569.320556640625, -546.4334716796875, -523.54638671875, -500.6593322753906, -477.77227783203125, -454.88519287109375, -431.99810791015625, -409.11102294921875, -386.22393798828125, -363.33685302734375, -340.4497985839844, -317.5627136230469, -294.6756591796875, -271.78857421875, -248.9014892578125, -226.01441955566406, -203.12734985351562, -180.2402801513672, -157.35321044921875, -134.46612548828125, -111.57905578613281, -88.69198608398438, -65.80490112304688, -42.91783142089844, -20.03076171875, 2.856311798095703, 25.743385314941406, 48.630462646484375, 71.51753234863281, 94.40460205078125, 117.29168701171875, 140.1787567138672, 163.06582641601562, 185.95289611816406, 208.8399658203125, 231.72705078125, 254.61412048339844, 277.5011901855469, 300.3882751464844, 323.27532958984375, 346.16241455078125, 369.04949951171875, 391.9365539550781, 414.8236389160156, 437.710693359375, 460.5977783203125, 483.48486328125, 506.3719482421875, 529.259033203125, 552.1461181640625, 575.033203125, 597.9202880859375, 620.8073120117188, 643.6943969726562, 666.5814819335938, 689.4685668945312, 712.3555908203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 15.0, 19.0, 16.0, 24.0, 27.0, 45.0, 40.0, 62.0, 62.0, 60.0, 56.0, 77.0, 52.0, 83.0, 65.0, 48.0, 51.0, 47.0, 40.0, 21.0, 22.0, 13.0, 14.0, 12.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.28091430664062, -78.82987976074219, -74.37885284423828, -69.92781829833984, -65.4767837524414, -61.025753021240234, -56.57472229003906, -52.123687744140625, -47.67265701293945, -43.22162628173828, -38.770591735839844, -34.31956100463867, -29.868528366088867, -25.417495727539062, -20.96646499633789, -16.515432357788086, -12.064399719238281, -7.613367557525635, -3.1623353958129883, 1.2886962890625, 5.739728927612305, 10.19076156616211, 14.641792297363281, 19.092824935913086, 23.54385757446289, 27.994890213012695, 32.4459228515625, 36.89695358276367, 41.347984313964844, 45.79901885986328, 50.25004959106445, 54.701080322265625, 59.15211486816406, 63.603145599365234, 68.0541763305664, 72.50521087646484, 76.95624542236328, 81.40727233886719, 85.85830688476562, 90.30934143066406, 94.7603759765625, 99.21141052246094, 103.66243743896484, 108.11347198486328, 112.56450653076172, 117.01553344726562, 121.46656799316406, 125.9176025390625, 130.36862182617188, 134.8196563720703, 139.27069091796875, 143.72171020507812, 148.17274475097656, 152.623779296875, 157.07481384277344, 161.52584838867188, 165.9768829345703, 170.42791748046875, 174.8789520263672, 179.32998657226562, 183.781005859375, 188.23204040527344, 192.68307495117188, 197.1341094970703, 201.58514404296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 9.0, 22.0, 24.0, 32.0, 63.0, 82.0, 143.0, 224.0, 417.0, 881.0, 1979.0, 5758.0, 20581.0, 93602.0, 513544.0, 330763.0, 59132.0, 13791.0, 4261.0, 1633.0, 719.0, 366.0, 175.0, 122.0, 76.0, 48.0, 30.0, 21.0, 25.0, 11.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4375, -64.4873046875, -61.537109375, -58.5869140625, -55.63671875, -52.6865234375, -49.736328125, -46.7861328125, -43.8359375, -40.8857421875, -37.935546875, -34.9853515625, -32.03515625, -29.0849609375, -26.134765625, -23.1845703125, -20.234375, -17.2841796875, -14.333984375, -11.3837890625, -8.43359375, -5.4833984375, -2.533203125, 0.4169921875, 3.3671875, 6.3173828125, 9.267578125, 12.2177734375, 15.16796875, 18.1181640625, 21.068359375, 24.0185546875, 26.96875, 29.9189453125, 32.869140625, 35.8193359375, 38.76953125, 41.7197265625, 44.669921875, 47.6201171875, 50.5703125, 53.5205078125, 56.470703125, 59.4208984375, 62.37109375, 65.3212890625, 68.271484375, 71.2216796875, 74.171875, 77.1220703125, 80.072265625, 83.0224609375, 85.97265625, 88.9228515625, 91.873046875, 94.8232421875, 97.7734375, 100.7236328125, 103.673828125, 106.6240234375, 109.57421875, 112.5244140625, 115.474609375, 118.4248046875, 121.375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 14.0, 10.0, 14.0, 15.0, 27.0, 29.0, 35.0, 41.0, 39.0, 44.0, 64.0, 64.0, 59.0, 78.0, 60.0, 75.0, 66.0, 44.0, 48.0, 39.0, 31.0, 25.0, 21.0, 13.0, 7.0, 9.0, 10.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.25, -21.431884765625, -20.61376953125, -19.795654296875, -18.9775390625, -18.159423828125, -17.34130859375, -16.523193359375, -15.705078125, -14.886962890625, -14.06884765625, -13.250732421875, -12.4326171875, -11.614501953125, -10.79638671875, -9.978271484375, -9.16015625, -8.342041015625, -7.52392578125, -6.705810546875, -5.8876953125, -5.069580078125, -4.25146484375, -3.433349609375, -2.615234375, -1.797119140625, -0.97900390625, -0.160888671875, 0.6572265625, 1.475341796875, 2.29345703125, 3.111572265625, 3.9296875, 4.747802734375, 5.56591796875, 6.384033203125, 7.2021484375, 8.020263671875, 8.83837890625, 9.656494140625, 10.474609375, 11.292724609375, 12.11083984375, 12.928955078125, 13.7470703125, 14.565185546875, 15.38330078125, 16.201416015625, 17.01953125, 17.837646484375, 18.65576171875, 19.473876953125, 20.2919921875, 21.110107421875, 21.92822265625, 22.746337890625, 23.564453125, 24.382568359375, 25.20068359375, 26.018798828125, 26.8369140625, 27.655029296875, 28.47314453125, 29.291259765625, 30.109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 11.0, 15.0, 30.0, 54.0, 62.0, 91.0, 137.0, 239.0, 466.0, 887.0, 2572.0, 13655.0, 165908.0, 787954.0, 65904.0, 7260.0, 1595.0, 709.0, 337.0, 212.0, 136.0, 94.0, 73.0, 47.0, 28.0, 25.0, 13.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-149.625, -145.13671875, -140.6484375, -136.16015625, -131.671875, -127.18359375, -122.6953125, -118.20703125, -113.71875, -109.23046875, -104.7421875, -100.25390625, -95.765625, -91.27734375, -86.7890625, -82.30078125, -77.8125, -73.32421875, -68.8359375, -64.34765625, -59.859375, -55.37109375, -50.8828125, -46.39453125, -41.90625, -37.41796875, -32.9296875, -28.44140625, -23.953125, -19.46484375, -14.9765625, -10.48828125, -6.0, -1.51171875, 2.9765625, 7.46484375, 11.953125, 16.44140625, 20.9296875, 25.41796875, 29.90625, 34.39453125, 38.8828125, 43.37109375, 47.859375, 52.34765625, 56.8359375, 61.32421875, 65.8125, 70.30078125, 74.7890625, 79.27734375, 83.765625, 88.25390625, 92.7421875, 97.23046875, 101.71875, 106.20703125, 110.6953125, 115.18359375, 119.671875, 124.16015625, 128.6484375, 133.13671875, 137.625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 16.0, 9.0, 12.0, 9.0, 18.0, 17.0, 29.0, 27.0, 41.0, 63.0, 47.0, 66.0, 60.0, 74.0, 43.0, 72.0, 69.0, 51.0, 56.0, 52.0, 30.0, 25.0, 27.0, 17.0, 19.0, 25.0, 10.0, 5.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-124.5, -121.07421875, -117.6484375, -114.22265625, -110.796875, -107.37109375, -103.9453125, -100.51953125, -97.09375, -93.66796875, -90.2421875, -86.81640625, -83.390625, -79.96484375, -76.5390625, -73.11328125, -69.6875, -66.26171875, -62.8359375, -59.41015625, -55.984375, -52.55859375, -49.1328125, -45.70703125, -42.28125, -38.85546875, -35.4296875, -32.00390625, -28.578125, -25.15234375, -21.7265625, -18.30078125, -14.875, -11.44921875, -8.0234375, -4.59765625, -1.171875, 2.25390625, 5.6796875, 9.10546875, 12.53125, 15.95703125, 19.3828125, 22.80859375, 26.234375, 29.66015625, 33.0859375, 36.51171875, 39.9375, 43.36328125, 46.7890625, 50.21484375, 53.640625, 57.06640625, 60.4921875, 63.91796875, 67.34375, 70.76953125, 74.1953125, 77.62109375, 81.046875, 84.47265625, 87.8984375, 91.32421875, 94.75]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 18.0, 27.0, 55.0, 74.0, 100.0, 167.0, 293.0, 668.0, 1840.0, 7531.0, 62749.0, 850400.0, 110465.0, 10219.0, 2285.0, 814.0, 310.0, 199.0, 116.0, 54.0, 42.0, 24.0, 21.0, 17.0, 10.0, 9.0, 5.0, 3.0, 8.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.65625, -51.90234375, -50.1484375, -48.39453125, -46.640625, -44.88671875, -43.1328125, -41.37890625, -39.625, -37.87109375, -36.1171875, -34.36328125, -32.609375, -30.85546875, -29.1015625, -27.34765625, -25.59375, -23.83984375, -22.0859375, -20.33203125, -18.578125, -16.82421875, -15.0703125, -13.31640625, -11.5625, -9.80859375, -8.0546875, -6.30078125, -4.546875, -2.79296875, -1.0390625, 0.71484375, 2.46875, 4.22265625, 5.9765625, 7.73046875, 9.484375, 11.23828125, 12.9921875, 14.74609375, 16.5, 18.25390625, 20.0078125, 21.76171875, 23.515625, 25.26953125, 27.0234375, 28.77734375, 30.53125, 32.28515625, 34.0390625, 35.79296875, 37.546875, 39.30078125, 41.0546875, 42.80859375, 44.5625, 46.31640625, 48.0703125, 49.82421875, 51.578125, 53.33203125, 55.0859375, 56.83984375, 58.59375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 17.0, 17.0, 28.0, 38.0, 58.0, 91.0, 150.0, 178.0, 139.0, 71.0, 54.0, 43.0, 20.0, 19.0, 16.0, 7.0, 5.0, 3.0, 7.0, 1.0, 6.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00469970703125, -0.004567146301269531, -0.0044345855712890625, -0.004302024841308594, -0.004169464111328125, -0.004036903381347656, -0.0039043426513671875, -0.0037717819213867188, -0.00363922119140625, -0.0035066604614257812, -0.0033740997314453125, -0.0032415390014648438, -0.003108978271484375, -0.0029764175415039062, -0.0028438568115234375, -0.0027112960815429688, -0.0025787353515625, -0.0024461746215820312, -0.0023136138916015625, -0.0021810531616210938, -0.002048492431640625, -0.0019159317016601562, -0.0017833709716796875, -0.0016508102416992188, -0.00151824951171875, -0.0013856887817382812, -0.0012531280517578125, -0.0011205673217773438, -0.000988006591796875, -0.0008554458618164062, -0.0007228851318359375, -0.0005903244018554688, -0.000457763671875, -0.00032520294189453125, -0.0001926422119140625, -6.008148193359375e-05, 7.2479248046875e-05, 0.00020503997802734375, 0.0003376007080078125, 0.00047016143798828125, 0.00060272216796875, 0.0007352828979492188, 0.0008678436279296875, 0.0010004043579101562, 0.001132965087890625, 0.0012655258178710938, 0.0013980865478515625, 0.0015306472778320312, 0.0016632080078125, 0.0017957687377929688, 0.0019283294677734375, 0.0020608901977539062, 0.002193450927734375, 0.0023260116577148438, 0.0024585723876953125, 0.0025911331176757812, 0.00272369384765625, 0.0028562545776367188, 0.0029888153076171875, 0.0031213760375976562, 0.003253936767578125, 0.0033864974975585938, 0.0035190582275390625, 0.0036516189575195312, 0.0037841796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 13.0, 18.0, 23.0, 57.0, 88.0, 158.0, 402.0, 1122.0, 8676.0, 501210.0, 525776.0, 9088.0, 1177.0, 377.0, 169.0, 87.0, 55.0, 20.0, 16.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.125, -67.86328125, -65.6015625, -63.33984375, -61.078125, -58.81640625, -56.5546875, -54.29296875, -52.03125, -49.76953125, -47.5078125, -45.24609375, -42.984375, -40.72265625, -38.4609375, -36.19921875, -33.9375, -31.67578125, -29.4140625, -27.15234375, -24.890625, -22.62890625, -20.3671875, -18.10546875, -15.84375, -13.58203125, -11.3203125, -9.05859375, -6.796875, -4.53515625, -2.2734375, -0.01171875, 2.25, 4.51171875, 6.7734375, 9.03515625, 11.296875, 13.55859375, 15.8203125, 18.08203125, 20.34375, 22.60546875, 24.8671875, 27.12890625, 29.390625, 31.65234375, 33.9140625, 36.17578125, 38.4375, 40.69921875, 42.9609375, 45.22265625, 47.484375, 49.74609375, 52.0078125, 54.26953125, 56.53125, 58.79296875, 61.0546875, 63.31640625, 65.578125, 67.83984375, 70.1015625, 72.36328125, 74.625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 12.0, 8.0, 14.0, 21.0, 43.0, 73.0, 138.0, 234.0, 203.0, 105.0, 55.0, 39.0, 19.0, 12.0, 13.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.875, -74.10546875, -72.3359375, -70.56640625, -68.796875, -67.02734375, -65.2578125, -63.48828125, -61.71875, -59.94921875, -58.1796875, -56.41015625, -54.640625, -52.87109375, -51.1015625, -49.33203125, -47.5625, -45.79296875, -44.0234375, -42.25390625, -40.484375, -38.71484375, -36.9453125, -35.17578125, -33.40625, -31.63671875, -29.8671875, -28.09765625, -26.328125, -24.55859375, -22.7890625, -21.01953125, -19.25, -17.48046875, -15.7109375, -13.94140625, -12.171875, -10.40234375, -8.6328125, -6.86328125, -5.09375, -3.32421875, -1.5546875, 0.21484375, 1.984375, 3.75390625, 5.5234375, 7.29296875, 9.0625, 10.83203125, 12.6015625, 14.37109375, 16.140625, 17.91015625, 19.6796875, 21.44921875, 23.21875, 24.98828125, 26.7578125, 28.52734375, 30.296875, 32.06640625, 33.8359375, 35.60546875, 37.375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 7.0, 8.0, 32.0, 106.0, 329.0, 360.0, 115.0, 33.0, 9.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-607.0286254882812, -566.983154296875, -526.9376831054688, -486.8922424316406, -446.8467712402344, -406.8013000488281, -366.755859375, -326.71038818359375, -286.6649169921875, -246.61944580078125, -206.57398986816406, -166.52853393554688, -126.48306274414062, -86.43759155273438, -46.39213562011719, -6.3466796875, 33.69879150390625, 73.74425506591797, 113.78971862792969, 153.83517456054688, 193.88064575195312, 233.92611694335938, 273.9715576171875, 314.01702880859375, 354.0625, 394.10797119140625, 434.1534423828125, 474.1988830566406, 514.244384765625, 554.289794921875, 594.3352661132812, 634.3807373046875, 674.42626953125, 714.4717407226562, 754.5172119140625, 794.5626831054688, 834.608154296875, 874.653564453125, 914.6990356445312, 954.7445068359375, 994.7899780273438, 1034.83544921875, 1074.880859375, 1114.9263916015625, 1154.9718017578125, 1195.017333984375, 1235.062744140625, 1275.108154296875, 1315.1536865234375, 1355.1990966796875, 1395.24462890625, 1435.2900390625, 1475.3355712890625, 1515.3809814453125, 1555.426513671875, 1595.471923828125, 1635.517333984375, 1675.562744140625, 1715.6082763671875, 1755.6536865234375, 1795.69921875, 1835.74462890625, 1875.7901611328125, 1915.8355712890625, 1955.881103515625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 13.0, 7.0, 10.0, 16.0, 22.0, 24.0, 18.0, 21.0, 31.0, 28.0, 26.0, 36.0, 38.0, 36.0, 40.0, 34.0, 30.0, 38.0, 42.0, 44.0, 44.0, 44.0, 36.0, 31.0, 30.0, 32.0, 25.0, 20.0, 35.0, 26.0, 16.0, 12.0, 12.0, 13.0, 8.0, 11.0, 11.0, 7.0, 5.0, 3.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.5924072265625, -367.0968933105469, -355.60137939453125, -344.1058654785156, -332.6103515625, -321.1148376464844, -309.61932373046875, -298.1238098144531, -286.6282958984375, -275.1327819824219, -263.63726806640625, -252.14175415039062, -240.646240234375, -229.15072631835938, -217.65521240234375, -206.15969848632812, -194.66416931152344, -183.1686553955078, -171.6731414794922, -160.17762756347656, -148.68211364746094, -137.1865997314453, -125.69107818603516, -114.19556427001953, -102.7000503540039, -91.20453643798828, -79.70902252197266, -68.2135009765625, -56.71799087524414, -45.222476959228516, -33.726959228515625, -22.2314453125, -10.735931396484375, 0.7595834732055664, 12.255098342895508, 23.750614166259766, 35.24612808227539, 46.741641998291016, 58.237159729003906, 69.73267364501953, 81.22818756103516, 92.72370147705078, 104.2192153930664, 115.71473693847656, 127.21025085449219, 138.7057647705078, 150.20127868652344, 161.69679260253906, 173.1923065185547, 184.6878204345703, 196.18333435058594, 207.67884826660156, 219.1743621826172, 230.6698760986328, 242.1654052734375, 253.66091918945312, 265.15643310546875, 276.6519470214844, 288.1474609375, 299.6429748535156, 311.13848876953125, 322.6340026855469, 334.1295166015625, 345.6250305175781, 357.12054443359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 32.0, 64.0, 163.0, 305.0, 844.0, 2589.0, 13793.0, 343062.0, 3807299.0, 20917.0, 3553.0, 927.0, 364.0, 150.0, 76.0, 41.0, 21.0, 20.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-164.0, -156.578125, -149.15625, -141.734375, -134.3125, -126.890625, -119.46875, -112.046875, -104.625, -97.203125, -89.78125, -82.359375, -74.9375, -67.515625, -60.09375, -52.671875, -45.25, -37.828125, -30.40625, -22.984375, -15.5625, -8.140625, -0.71875, 6.703125, 14.125, 21.546875, 28.96875, 36.390625, 43.8125, 51.234375, 58.65625, 66.078125, 73.5, 80.921875, 88.34375, 95.765625, 103.1875, 110.609375, 118.03125, 125.453125, 132.875, 140.296875, 147.71875, 155.140625, 162.5625, 169.984375, 177.40625, 184.828125, 192.25, 199.671875, 207.09375, 214.515625, 221.9375, 229.359375, 236.78125, 244.203125, 251.625, 259.046875, 266.46875, 273.890625, 281.3125, 288.734375, 296.15625, 303.578125, 311.0]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 13.0, 11.0, 14.0, 10.0, 14.0, 29.0, 25.0, 46.0, 39.0, 40.0, 46.0, 83.0, 64.0, 42.0, 69.0, 71.0, 57.0, 60.0, 40.0, 40.0, 41.0, 25.0, 18.0, 29.0, 20.0, 11.0, 13.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -20.85205078125, -20.0166015625, -19.18115234375, -18.345703125, -17.51025390625, -16.6748046875, -15.83935546875, -15.00390625, -14.16845703125, -13.3330078125, -12.49755859375, -11.662109375, -10.82666015625, -9.9912109375, -9.15576171875, -8.3203125, -7.48486328125, -6.6494140625, -5.81396484375, -4.978515625, -4.14306640625, -3.3076171875, -2.47216796875, -1.63671875, -0.80126953125, 0.0341796875, 0.86962890625, 1.705078125, 2.54052734375, 3.3759765625, 4.21142578125, 5.046875, 5.88232421875, 6.7177734375, 7.55322265625, 8.388671875, 9.22412109375, 10.0595703125, 10.89501953125, 11.73046875, 12.56591796875, 13.4013671875, 14.23681640625, 15.072265625, 15.90771484375, 16.7431640625, 17.57861328125, 18.4140625, 19.24951171875, 20.0849609375, 20.92041015625, 21.755859375, 22.59130859375, 23.4267578125, 24.26220703125, 25.09765625, 25.93310546875, 26.7685546875, 27.60400390625, 28.439453125, 29.27490234375, 30.1103515625, 30.94580078125, 31.78125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 9.0, 13.0, 16.0, 25.0, 46.0, 78.0, 159.0, 292.0, 598.0, 1400.0, 3499.0, 11189.0, 54028.0, 3346869.0, 719334.0, 41399.0, 9538.0, 3251.0, 1262.0, 607.0, 276.0, 166.0, 87.0, 43.0, 31.0, 23.0, 11.0, 8.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.375, -80.990234375, -77.60546875, -74.220703125, -70.8359375, -67.451171875, -64.06640625, -60.681640625, -57.296875, -53.912109375, -50.52734375, -47.142578125, -43.7578125, -40.373046875, -36.98828125, -33.603515625, -30.21875, -26.833984375, -23.44921875, -20.064453125, -16.6796875, -13.294921875, -9.91015625, -6.525390625, -3.140625, 0.244140625, 3.62890625, 7.013671875, 10.3984375, 13.783203125, 17.16796875, 20.552734375, 23.9375, 27.322265625, 30.70703125, 34.091796875, 37.4765625, 40.861328125, 44.24609375, 47.630859375, 51.015625, 54.400390625, 57.78515625, 61.169921875, 64.5546875, 67.939453125, 71.32421875, 74.708984375, 78.09375, 81.478515625, 84.86328125, 88.248046875, 91.6328125, 95.017578125, 98.40234375, 101.787109375, 105.171875, 108.556640625, 111.94140625, 115.326171875, 118.7109375, 122.095703125, 125.48046875, 128.865234375, 132.25]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 16.0, 18.0, 31.0, 40.0, 78.0, 121.0, 317.0, 2651.0, 440.0, 134.0, 57.0, 51.0, 26.0, 18.0, 11.0, 16.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.1875, -33.75634765625, -32.3251953125, -30.89404296875, -29.462890625, -28.03173828125, -26.6005859375, -25.16943359375, -23.73828125, -22.30712890625, -20.8759765625, -19.44482421875, -18.013671875, -16.58251953125, -15.1513671875, -13.72021484375, -12.2890625, -10.85791015625, -9.4267578125, -7.99560546875, -6.564453125, -5.13330078125, -3.7021484375, -2.27099609375, -0.83984375, 0.59130859375, 2.0224609375, 3.45361328125, 4.884765625, 6.31591796875, 7.7470703125, 9.17822265625, 10.609375, 12.04052734375, 13.4716796875, 14.90283203125, 16.333984375, 17.76513671875, 19.1962890625, 20.62744140625, 22.05859375, 23.48974609375, 24.9208984375, 26.35205078125, 27.783203125, 29.21435546875, 30.6455078125, 32.07666015625, 33.5078125, 34.93896484375, 36.3701171875, 37.80126953125, 39.232421875, 40.66357421875, 42.0947265625, 43.52587890625, 44.95703125, 46.38818359375, 47.8193359375, 49.25048828125, 50.681640625, 52.11279296875, 53.5439453125, 54.97509765625, 56.40625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 17.0, 64.0, 378.0, 444.0, 81.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.39041137695312, -213.36802673339844, -194.34564208984375, -175.32327270507812, -156.30088806152344, -137.27850341796875, -118.2561264038086, -99.23374938964844, -80.21136474609375, -61.18898391723633, -42.166603088378906, -23.144222259521484, -4.1218414306640625, 14.900543212890625, 33.92292022705078, 52.94529724121094, 71.96768188476562, 90.99006652832031, 110.01244354248047, 129.03482055664062, 148.0572052001953, 167.07958984375, 186.10195922851562, 205.1243438720703, 224.146728515625, 243.1691131591797, 262.1914978027344, 281.2138671875, 300.23626708984375, 319.2586364746094, 338.281005859375, 357.30340576171875, 376.32574462890625, 395.3481140136719, 414.3705139160156, 433.39288330078125, 452.415283203125, 471.4376525878906, 490.46002197265625, 509.482421875, 528.5047607421875, 547.5271606445312, 566.5494995117188, 585.5718994140625, 604.5942993164062, 623.61669921875, 642.6390380859375, 661.6614379882812, 680.683837890625, 699.7062377929688, 718.7285766601562, 737.7509765625, 756.7733764648438, 775.7957763671875, 794.818115234375, 813.8405151367188, 832.8629150390625, 851.8853149414062, 870.9076538085938, 889.9300537109375, 908.9524536132812, 927.974853515625, 946.9971923828125, 966.0195922851562, 985.0419311523438]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 8.0, 8.0, 22.0, 34.0, 44.0, 52.0, 76.0, 80.0, 86.0, 103.0, 93.0, 98.0, 80.0, 61.0, 52.0, 41.0, 25.0, 14.0, 9.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.13246154785156, -152.6924591064453, -145.25247192382812, -137.81246948242188, -130.37246704101562, -122.93247985839844, -115.49247741699219, -108.05248260498047, -100.61248779296875, -93.17249298095703, -85.73249816894531, -78.29249572753906, -70.85250091552734, -63.412506103515625, -55.97250747680664, -48.532508850097656, -41.09251403808594, -33.65251922607422, -26.212520599365234, -18.772523880004883, -11.332527160644531, -3.8925323486328125, 3.547466278076172, 10.987464904785156, 18.427459716796875, 25.867456436157227, 33.30745315551758, 40.74745178222656, 48.18744659423828, 55.62744140625, 63.067440032958984, 70.50743865966797, 77.94741821289062, 85.38741302490234, 92.82740783691406, 100.26741027832031, 107.70740509033203, 115.14739990234375, 122.58740234375, 130.02740478515625, 137.46739196777344, 144.9073944091797, 152.34738159179688, 159.78738403320312, 167.22738647460938, 174.66737365722656, 182.1073760986328, 189.54736328125, 196.98736572265625, 204.4273681640625, 211.8673553466797, 219.30735778808594, 226.74734497070312, 234.18734741210938, 241.62734985351562, 249.06735229492188, 256.50732421875, 263.94732666015625, 271.3873291015625, 278.8273010253906, 286.2673034667969, 293.7073059082031, 301.1473083496094, 308.5873107910156, 316.0273132324219]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 15.0, 17.0, 26.0, 37.0, 58.0, 94.0, 160.0, 225.0, 454.0, 891.0, 1984.0, 4638.0, 13720.0, 47017.0, 194553.0, 522877.0, 192581.0, 46834.0, 13629.0, 4737.0, 1929.0, 913.0, 490.0, 267.0, 162.0, 95.0, 60.0, 31.0, 24.0, 13.0, 6.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.0, -92.9521484375, -89.904296875, -86.8564453125, -83.80859375, -80.7607421875, -77.712890625, -74.6650390625, -71.6171875, -68.5693359375, -65.521484375, -62.4736328125, -59.42578125, -56.3779296875, -53.330078125, -50.2822265625, -47.234375, -44.1865234375, -41.138671875, -38.0908203125, -35.04296875, -31.9951171875, -28.947265625, -25.8994140625, -22.8515625, -19.8037109375, -16.755859375, -13.7080078125, -10.66015625, -7.6123046875, -4.564453125, -1.5166015625, 1.53125, 4.5791015625, 7.626953125, 10.6748046875, 13.72265625, 16.7705078125, 19.818359375, 22.8662109375, 25.9140625, 28.9619140625, 32.009765625, 35.0576171875, 38.10546875, 41.1533203125, 44.201171875, 47.2490234375, 50.296875, 53.3447265625, 56.392578125, 59.4404296875, 62.48828125, 65.5361328125, 68.583984375, 71.6318359375, 74.6796875, 77.7275390625, 80.775390625, 83.8232421875, 86.87109375, 89.9189453125, 92.966796875, 96.0146484375, 99.0625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 11.0, 12.0, 21.0, 18.0, 16.0, 28.0, 40.0, 49.0, 54.0, 69.0, 72.0, 53.0, 83.0, 74.0, 68.0, 89.0, 56.0, 42.0, 35.0, 29.0, 16.0, 23.0, 14.0, 14.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -19.96044921875, -18.9833984375, -18.00634765625, -17.029296875, -16.05224609375, -15.0751953125, -14.09814453125, -13.12109375, -12.14404296875, -11.1669921875, -10.18994140625, -9.212890625, -8.23583984375, -7.2587890625, -6.28173828125, -5.3046875, -4.32763671875, -3.3505859375, -2.37353515625, -1.396484375, -0.41943359375, 0.5576171875, 1.53466796875, 2.51171875, 3.48876953125, 4.4658203125, 5.44287109375, 6.419921875, 7.39697265625, 8.3740234375, 9.35107421875, 10.328125, 11.30517578125, 12.2822265625, 13.25927734375, 14.236328125, 15.21337890625, 16.1904296875, 17.16748046875, 18.14453125, 19.12158203125, 20.0986328125, 21.07568359375, 22.052734375, 23.02978515625, 24.0068359375, 24.98388671875, 25.9609375, 26.93798828125, 27.9150390625, 28.89208984375, 29.869140625, 30.84619140625, 31.8232421875, 32.80029296875, 33.77734375, 34.75439453125, 35.7314453125, 36.70849609375, 37.685546875, 38.66259765625, 39.6396484375, 40.61669921875, 41.59375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 7.0, 15.0, 21.0, 24.0, 34.0, 37.0, 68.0, 70.0, 113.0, 156.0, 193.0, 310.0, 412.0, 646.0, 1173.0, 3263.0, 18975.0, 256479.0, 703385.0, 52388.0, 6421.0, 1799.0, 839.0, 488.0, 322.0, 258.0, 181.0, 108.0, 106.0, 60.0, 57.0, 35.0, 28.0, 12.0, 13.0, 12.0, 14.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-154.125, -149.1875, -144.25, -139.3125, -134.375, -129.4375, -124.5, -119.5625, -114.625, -109.6875, -104.75, -99.8125, -94.875, -89.9375, -85.0, -80.0625, -75.125, -70.1875, -65.25, -60.3125, -55.375, -50.4375, -45.5, -40.5625, -35.625, -30.6875, -25.75, -20.8125, -15.875, -10.9375, -6.0, -1.0625, 3.875, 8.8125, 13.75, 18.6875, 23.625, 28.5625, 33.5, 38.4375, 43.375, 48.3125, 53.25, 58.1875, 63.125, 68.0625, 73.0, 77.9375, 82.875, 87.8125, 92.75, 97.6875, 102.625, 107.5625, 112.5, 117.4375, 122.375, 127.3125, 132.25, 137.1875, 142.125, 147.0625, 152.0, 156.9375, 161.875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 6.0, 9.0, 6.0, 8.0, 11.0, 11.0, 16.0, 20.0, 16.0, 38.0, 34.0, 40.0, 46.0, 55.0, 45.0, 48.0, 59.0, 38.0, 43.0, 51.0, 65.0, 46.0, 37.0, 28.0, 34.0, 28.0, 23.0, 16.0, 24.0, 20.0, 13.0, 6.0, 12.0, 9.0, 5.0, 6.0, 0.0, 2.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-91.5, -88.4140625, -85.328125, -82.2421875, -79.15625, -76.0703125, -72.984375, -69.8984375, -66.8125, -63.7265625, -60.640625, -57.5546875, -54.46875, -51.3828125, -48.296875, -45.2109375, -42.125, -39.0390625, -35.953125, -32.8671875, -29.78125, -26.6953125, -23.609375, -20.5234375, -17.4375, -14.3515625, -11.265625, -8.1796875, -5.09375, -2.0078125, 1.078125, 4.1640625, 7.25, 10.3359375, 13.421875, 16.5078125, 19.59375, 22.6796875, 25.765625, 28.8515625, 31.9375, 35.0234375, 38.109375, 41.1953125, 44.28125, 47.3671875, 50.453125, 53.5390625, 56.625, 59.7109375, 62.796875, 65.8828125, 68.96875, 72.0546875, 75.140625, 78.2265625, 81.3125, 84.3984375, 87.484375, 90.5703125, 93.65625, 96.7421875, 99.828125, 102.9140625, 106.0]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 12.0, 14.0, 25.0, 50.0, 51.0, 86.0, 161.0, 273.0, 547.0, 1283.0, 3230.0, 10583.0, 50277.0, 672582.0, 270259.0, 27632.0, 7138.0, 2434.0, 894.0, 428.0, 230.0, 133.0, 74.0, 35.0, 39.0, 17.0, 10.0, 10.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.9375, -66.18798828125, -64.4384765625, -62.68896484375, -60.939453125, -59.18994140625, -57.4404296875, -55.69091796875, -53.94140625, -52.19189453125, -50.4423828125, -48.69287109375, -46.943359375, -45.19384765625, -43.4443359375, -41.69482421875, -39.9453125, -38.19580078125, -36.4462890625, -34.69677734375, -32.947265625, -31.19775390625, -29.4482421875, -27.69873046875, -25.94921875, -24.19970703125, -22.4501953125, -20.70068359375, -18.951171875, -17.20166015625, -15.4521484375, -13.70263671875, -11.953125, -10.20361328125, -8.4541015625, -6.70458984375, -4.955078125, -3.20556640625, -1.4560546875, 0.29345703125, 2.04296875, 3.79248046875, 5.5419921875, 7.29150390625, 9.041015625, 10.79052734375, 12.5400390625, 14.28955078125, 16.0390625, 17.78857421875, 19.5380859375, 21.28759765625, 23.037109375, 24.78662109375, 26.5361328125, 28.28564453125, 30.03515625, 31.78466796875, 33.5341796875, 35.28369140625, 37.033203125, 38.78271484375, 40.5322265625, 42.28173828125, 44.03125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 22.0, 21.0, 39.0, 50.0, 61.0, 103.0, 154.0, 203.0, 114.0, 71.0, 63.0, 25.0, 15.0, 12.0, 11.0, 8.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007171630859375, -0.0069618821144104, -0.006752133369445801, -0.006542384624481201, -0.0063326358795166016, -0.006122887134552002, -0.005913138389587402, -0.005703389644622803, -0.005493640899658203, -0.0052838921546936035, -0.005074143409729004, -0.004864394664764404, -0.004654645919799805, -0.004444897174835205, -0.0042351484298706055, -0.004025399684906006, -0.0038156509399414062, -0.0036059021949768066, -0.003396153450012207, -0.0031864047050476074, -0.002976655960083008, -0.002766907215118408, -0.0025571584701538086, -0.002347409725189209, -0.0021376609802246094, -0.0019279122352600098, -0.0017181634902954102, -0.0015084147453308105, -0.001298666000366211, -0.0010889172554016113, -0.0008791685104370117, -0.0006694197654724121, -0.0004596710205078125, -0.0002499222755432129, -4.017353057861328e-05, 0.00016957521438598633, 0.00037932395935058594, 0.0005890727043151855, 0.0007988214492797852, 0.0010085701942443848, 0.0012183189392089844, 0.001428067684173584, 0.0016378164291381836, 0.0018475651741027832, 0.002057313919067383, 0.0022670626640319824, 0.002476811408996582, 0.0026865601539611816, 0.0028963088989257812, 0.003106057643890381, 0.0033158063888549805, 0.00352555513381958, 0.0037353038787841797, 0.003945052623748779, 0.004154801368713379, 0.0043645501136779785, 0.004574298858642578, 0.004784047603607178, 0.004993796348571777, 0.005203545093536377, 0.0054132938385009766, 0.005623042583465576, 0.005832791328430176, 0.006042540073394775, 0.006252288818359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 11.0, 13.0, 19.0, 31.0, 41.0, 47.0, 82.0, 114.0, 188.0, 293.0, 557.0, 1072.0, 2403.0, 7590.0, 37094.0, 594176.0, 367218.0, 27197.0, 6183.0, 2024.0, 931.0, 446.0, 265.0, 164.0, 116.0, 64.0, 52.0, 39.0, 28.0, 15.0, 13.0, 16.0, 12.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.625, -55.76123046875, -53.8974609375, -52.03369140625, -50.169921875, -48.30615234375, -46.4423828125, -44.57861328125, -42.71484375, -40.85107421875, -38.9873046875, -37.12353515625, -35.259765625, -33.39599609375, -31.5322265625, -29.66845703125, -27.8046875, -25.94091796875, -24.0771484375, -22.21337890625, -20.349609375, -18.48583984375, -16.6220703125, -14.75830078125, -12.89453125, -11.03076171875, -9.1669921875, -7.30322265625, -5.439453125, -3.57568359375, -1.7119140625, 0.15185546875, 2.015625, 3.87939453125, 5.7431640625, 7.60693359375, 9.470703125, 11.33447265625, 13.1982421875, 15.06201171875, 16.92578125, 18.78955078125, 20.6533203125, 22.51708984375, 24.380859375, 26.24462890625, 28.1083984375, 29.97216796875, 31.8359375, 33.69970703125, 35.5634765625, 37.42724609375, 39.291015625, 41.15478515625, 43.0185546875, 44.88232421875, 46.74609375, 48.60986328125, 50.4736328125, 52.33740234375, 54.201171875, 56.06494140625, 57.9287109375, 59.79248046875, 61.65625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 8.0, 3.0, 8.0, 8.0, 11.0, 13.0, 14.0, 35.0, 45.0, 64.0, 100.0, 110.0, 141.0, 118.0, 87.0, 60.0, 47.0, 29.0, 26.0, 19.0, 15.0, 8.0, 10.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.625, -60.11328125, -58.6015625, -57.08984375, -55.578125, -54.06640625, -52.5546875, -51.04296875, -49.53125, -48.01953125, -46.5078125, -44.99609375, -43.484375, -41.97265625, -40.4609375, -38.94921875, -37.4375, -35.92578125, -34.4140625, -32.90234375, -31.390625, -29.87890625, -28.3671875, -26.85546875, -25.34375, -23.83203125, -22.3203125, -20.80859375, -19.296875, -17.78515625, -16.2734375, -14.76171875, -13.25, -11.73828125, -10.2265625, -8.71484375, -7.203125, -5.69140625, -4.1796875, -2.66796875, -1.15625, 0.35546875, 1.8671875, 3.37890625, 4.890625, 6.40234375, 7.9140625, 9.42578125, 10.9375, 12.44921875, 13.9609375, 15.47265625, 16.984375, 18.49609375, 20.0078125, 21.51953125, 23.03125, 24.54296875, 26.0546875, 27.56640625, 29.078125, 30.58984375, 32.1015625, 33.61328125, 35.125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 17.0, 41.0, 85.0, 172.0, 272.0, 199.0, 111.0, 49.0, 24.0, 9.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1484.2841796875, -1448.778564453125, -1413.2730712890625, -1377.7674560546875, -1342.261962890625, -1306.75634765625, -1271.2508544921875, -1235.7452392578125, -1200.23974609375, -1164.734130859375, -1129.2286376953125, -1093.7230224609375, -1058.217529296875, -1022.7119750976562, -987.2064208984375, -951.7008056640625, -916.1952514648438, -880.689697265625, -845.1841430664062, -809.6785888671875, -774.1730346679688, -738.66748046875, -703.161865234375, -667.6563720703125, -632.1507568359375, -596.6452026367188, -561.1396484375, -525.6340942382812, -490.1285400390625, -454.62298583984375, -419.1174011230469, -383.6118469238281, -348.1063232421875, -312.60076904296875, -277.09521484375, -241.5896453857422, -206.08409118652344, -170.5785369873047, -135.07296752929688, -99.56741333007812, -64.06185913085938, -28.55630111694336, 6.949256896972656, 42.45481872558594, 77.96037292480469, 113.46592712402344, 148.97149658203125, 184.47705078125, 219.98260498046875, 255.4881591796875, 290.99371337890625, 326.499267578125, 362.00482177734375, 397.5103759765625, 433.0159606933594, 468.5215148925781, 504.0270690917969, 539.5326538085938, 575.0382080078125, 610.5437622070312, 646.04931640625, 681.5548706054688, 717.0604248046875, 752.5659790039062, 788.071533203125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 5.0, 8.0, 15.0, 9.0, 16.0, 25.0, 22.0, 26.0, 32.0, 33.0, 33.0, 43.0, 43.0, 47.0, 62.0, 56.0, 39.0, 43.0, 56.0, 41.0, 50.0, 47.0, 34.0, 34.0, 26.0, 28.0, 23.0, 13.0, 16.0, 21.0, 17.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-648.2952880859375, -630.0960083007812, -611.896728515625, -593.6974487304688, -575.4981689453125, -557.2989501953125, -539.099609375, -520.900390625, -502.70111083984375, -484.5018310546875, -466.30255126953125, -448.103271484375, -429.9040222167969, -411.7047424316406, -393.5054626464844, -375.3061828613281, -357.1069030761719, -338.9076232910156, -320.7083435058594, -302.50909423828125, -284.309814453125, -266.11053466796875, -247.9112548828125, -229.71197509765625, -211.51271057128906, -193.3134307861328, -175.11416625976562, -156.91488647460938, -138.71560668945312, -120.51634216308594, -102.31706237792969, -84.11779022216797, -65.91851806640625, -47.71924591064453, -29.519969940185547, -11.320693969726562, 6.878578186035156, 25.077850341796875, 43.277130126953125, 61.476402282714844, 79.67567443847656, 97.87494659423828, 116.07421875, 134.27349853515625, 152.4727783203125, 170.6720428466797, 188.87132263183594, 207.07058715820312, 225.26986694335938, 243.46914672851562, 261.6684265136719, 279.86767578125, 298.06695556640625, 316.2662353515625, 334.46551513671875, 352.664794921875, 370.86407470703125, 389.0633544921875, 407.26263427734375, 425.4619140625, 443.6611633300781, 461.8604431152344, 480.0597229003906, 498.2590026855469, 516.458251953125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 8.0, 19.0, 27.0, 34.0, 43.0, 50.0, 64.0, 108.0, 176.0, 291.0, 549.0, 1120.0, 2453.0, 6227.0, 20222.0, 104748.0, 3834577.0, 183036.0, 26981.0, 7856.0, 2944.0, 1224.0, 571.0, 308.0, 181.0, 124.0, 73.0, 73.0, 52.0, 26.0, 26.0, 9.0, 11.0, 10.0, 6.0, 7.0, 6.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.5, -114.498046875, -110.49609375, -106.494140625, -102.4921875, -98.490234375, -94.48828125, -90.486328125, -86.484375, -82.482421875, -78.48046875, -74.478515625, -70.4765625, -66.474609375, -62.47265625, -58.470703125, -54.46875, -50.466796875, -46.46484375, -42.462890625, -38.4609375, -34.458984375, -30.45703125, -26.455078125, -22.453125, -18.451171875, -14.44921875, -10.447265625, -6.4453125, -2.443359375, 1.55859375, 5.560546875, 9.5625, 13.564453125, 17.56640625, 21.568359375, 25.5703125, 29.572265625, 33.57421875, 37.576171875, 41.578125, 45.580078125, 49.58203125, 53.583984375, 57.5859375, 61.587890625, 65.58984375, 69.591796875, 73.59375, 77.595703125, 81.59765625, 85.599609375, 89.6015625, 93.603515625, 97.60546875, 101.607421875, 105.609375, 109.611328125, 113.61328125, 117.615234375, 121.6171875, 125.619140625, 129.62109375, 133.623046875, 137.625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 5.0, 1.0, 9.0, 11.0, 21.0, 13.0, 18.0, 31.0, 46.0, 42.0, 45.0, 66.0, 61.0, 93.0, 54.0, 56.0, 86.0, 82.0, 55.0, 38.0, 40.0, 34.0, 31.0, 25.0, 14.0, 12.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.61083984375, -22.4716796875, -21.33251953125, -20.193359375, -19.05419921875, -17.9150390625, -16.77587890625, -15.63671875, -14.49755859375, -13.3583984375, -12.21923828125, -11.080078125, -9.94091796875, -8.8017578125, -7.66259765625, -6.5234375, -5.38427734375, -4.2451171875, -3.10595703125, -1.966796875, -0.82763671875, 0.3115234375, 1.45068359375, 2.58984375, 3.72900390625, 4.8681640625, 6.00732421875, 7.146484375, 8.28564453125, 9.4248046875, 10.56396484375, 11.703125, 12.84228515625, 13.9814453125, 15.12060546875, 16.259765625, 17.39892578125, 18.5380859375, 19.67724609375, 20.81640625, 21.95556640625, 23.0947265625, 24.23388671875, 25.373046875, 26.51220703125, 27.6513671875, 28.79052734375, 29.9296875, 31.06884765625, 32.2080078125, 33.34716796875, 34.486328125, 35.62548828125, 36.7646484375, 37.90380859375, 39.04296875, 40.18212890625, 41.3212890625, 42.46044921875, 43.599609375, 44.73876953125, 45.8779296875, 47.01708984375, 48.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 8.0, 5.0, 15.0, 25.0, 42.0, 37.0, 85.0, 137.0, 255.0, 424.0, 781.0, 1665.0, 4542.0, 17067.0, 153410.0, 3901076.0, 94582.0, 13116.0, 3822.0, 1573.0, 727.0, 369.0, 182.0, 132.0, 84.0, 30.0, 36.0, 20.0, 12.0, 5.0, 3.0, 3.0, 8.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.875, -149.9453125, -145.015625, -140.0859375, -135.15625, -130.2265625, -125.296875, -120.3671875, -115.4375, -110.5078125, -105.578125, -100.6484375, -95.71875, -90.7890625, -85.859375, -80.9296875, -76.0, -71.0703125, -66.140625, -61.2109375, -56.28125, -51.3515625, -46.421875, -41.4921875, -36.5625, -31.6328125, -26.703125, -21.7734375, -16.84375, -11.9140625, -6.984375, -2.0546875, 2.875, 7.8046875, 12.734375, 17.6640625, 22.59375, 27.5234375, 32.453125, 37.3828125, 42.3125, 47.2421875, 52.171875, 57.1015625, 62.03125, 66.9609375, 71.890625, 76.8203125, 81.75, 86.6796875, 91.609375, 96.5390625, 101.46875, 106.3984375, 111.328125, 116.2578125, 121.1875, 126.1171875, 131.046875, 135.9765625, 140.90625, 145.8359375, 150.765625, 155.6953125, 160.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 8.0, 13.0, 18.0, 32.0, 77.0, 188.0, 2031.0, 1327.0, 189.0, 80.0, 30.0, 19.0, 11.0, 13.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-110.6875, -107.521484375, -104.35546875, -101.189453125, -98.0234375, -94.857421875, -91.69140625, -88.525390625, -85.359375, -82.193359375, -79.02734375, -75.861328125, -72.6953125, -69.529296875, -66.36328125, -63.197265625, -60.03125, -56.865234375, -53.69921875, -50.533203125, -47.3671875, -44.201171875, -41.03515625, -37.869140625, -34.703125, -31.537109375, -28.37109375, -25.205078125, -22.0390625, -18.873046875, -15.70703125, -12.541015625, -9.375, -6.208984375, -3.04296875, 0.123046875, 3.2890625, 6.455078125, 9.62109375, 12.787109375, 15.953125, 19.119140625, 22.28515625, 25.451171875, 28.6171875, 31.783203125, 34.94921875, 38.115234375, 41.28125, 44.447265625, 47.61328125, 50.779296875, 53.9453125, 57.111328125, 60.27734375, 63.443359375, 66.609375, 69.775390625, 72.94140625, 76.107421875, 79.2734375, 82.439453125, 85.60546875, 88.771484375, 91.9375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 14.0, 66.0, 126.0, 311.0, 304.0, 107.0, 29.0, 15.0, 5.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-339.3290100097656, -318.2330017089844, -297.1369934082031, -276.0409851074219, -254.94497680664062, -233.84896850585938, -212.7529754638672, -191.65696716308594, -170.5609588623047, -149.46495056152344, -128.3689422607422, -107.27294158935547, -86.17693328857422, -65.08092498779297, -43.98492431640625, -22.888916015625, -1.79290771484375, 19.303098678588867, 40.399105072021484, 61.49510955810547, 82.59111785888672, 103.68712615966797, 124.78312683105469, 145.87913513183594, 166.9751434326172, 188.07115173339844, 209.1671600341797, 230.26315307617188, 251.35916137695312, 272.4551696777344, 293.5511779785156, 314.6471862792969, 335.74322509765625, 356.8392333984375, 377.93524169921875, 399.03125, 420.12725830078125, 441.2232666015625, 462.31927490234375, 483.415283203125, 504.51129150390625, 525.6072998046875, 546.7033081054688, 567.79931640625, 588.8953247070312, 609.9913330078125, 631.0873413085938, 652.183349609375, 673.279296875, 694.3753051757812, 715.4713134765625, 736.5673217773438, 757.663330078125, 778.7593383789062, 799.8553466796875, 820.9513549804688, 842.04736328125, 863.1433715820312, 884.2393798828125, 905.3353881835938, 926.431396484375, 947.5274047851562, 968.6234130859375, 989.7194213867188, 1010.8154296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 11.0, 22.0, 39.0, 46.0, 64.0, 87.0, 95.0, 84.0, 120.0, 83.0, 86.0, 79.0, 59.0, 37.0, 25.0, 19.0, 12.0, 6.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-365.9420166015625, -352.9200439453125, -339.8980712890625, -326.8761291503906, -313.8541564941406, -300.8321838378906, -287.8102111816406, -274.78826904296875, -261.76629638671875, -248.74432373046875, -235.7223663330078, -222.7003936767578, -209.67843627929688, -196.65646362304688, -183.63449096679688, -170.61253356933594, -157.59056091308594, -144.56858825683594, -131.546630859375, -118.524658203125, -105.50270080566406, -92.48072814941406, -79.4587631225586, -66.43679809570312, -53.414833068847656, -40.39286804199219, -27.370901107788086, -14.348934173583984, -1.3269691467285156, 11.694999694824219, 24.716964721679688, 37.738929748535156, 50.760894775390625, 63.782859802246094, 76.80482482910156, 89.82679748535156, 102.8487548828125, 115.8707275390625, 128.8927001953125, 141.91465759277344, 154.93661499023438, 167.95858764648438, 180.9805450439453, 194.0025177001953, 207.02447509765625, 220.04644775390625, 233.06842041015625, 246.0903778076172, 259.11236572265625, 272.13433837890625, 285.15631103515625, 298.1782531738281, 311.2002258300781, 324.2221984863281, 337.2441711425781, 350.26611328125, 363.2880859375, 376.31005859375, 389.33203125, 402.3539733886719, 415.3759460449219, 428.3979187011719, 441.4198913574219, 454.44183349609375, 467.46380615234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 23.0, 23.0, 27.0, 50.0, 83.0, 155.0, 315.0, 672.0, 1602.0, 5382.0, 20877.0, 96457.0, 453223.0, 372011.0, 74582.0, 16171.0, 4308.0, 1356.0, 555.0, 299.0, 158.0, 77.0, 46.0, 39.0, 20.0, 11.0, 8.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-127.5, -123.23828125, -118.9765625, -114.71484375, -110.453125, -106.19140625, -101.9296875, -97.66796875, -93.40625, -89.14453125, -84.8828125, -80.62109375, -76.359375, -72.09765625, -67.8359375, -63.57421875, -59.3125, -55.05078125, -50.7890625, -46.52734375, -42.265625, -38.00390625, -33.7421875, -29.48046875, -25.21875, -20.95703125, -16.6953125, -12.43359375, -8.171875, -3.91015625, 0.3515625, 4.61328125, 8.875, 13.13671875, 17.3984375, 21.66015625, 25.921875, 30.18359375, 34.4453125, 38.70703125, 42.96875, 47.23046875, 51.4921875, 55.75390625, 60.015625, 64.27734375, 68.5390625, 72.80078125, 77.0625, 81.32421875, 85.5859375, 89.84765625, 94.109375, 98.37109375, 102.6328125, 106.89453125, 111.15625, 115.41796875, 119.6796875, 123.94140625, 128.203125, 132.46484375, 136.7265625, 140.98828125, 145.25]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 10.0, 9.0, 16.0, 35.0, 31.0, 46.0, 66.0, 73.0, 75.0, 75.0, 85.0, 79.0, 88.0, 71.0, 65.0, 41.0, 43.0, 40.0, 17.0, 13.0, 10.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.1982421875, -26.833984375, -25.4697265625, -24.10546875, -22.7412109375, -21.376953125, -20.0126953125, -18.6484375, -17.2841796875, -15.919921875, -14.5556640625, -13.19140625, -11.8271484375, -10.462890625, -9.0986328125, -7.734375, -6.3701171875, -5.005859375, -3.6416015625, -2.27734375, -0.9130859375, 0.451171875, 1.8154296875, 3.1796875, 4.5439453125, 5.908203125, 7.2724609375, 8.63671875, 10.0009765625, 11.365234375, 12.7294921875, 14.09375, 15.4580078125, 16.822265625, 18.1865234375, 19.55078125, 20.9150390625, 22.279296875, 23.6435546875, 25.0078125, 26.3720703125, 27.736328125, 29.1005859375, 30.46484375, 31.8291015625, 33.193359375, 34.5576171875, 35.921875, 37.2861328125, 38.650390625, 40.0146484375, 41.37890625, 42.7431640625, 44.107421875, 45.4716796875, 46.8359375, 48.2001953125, 49.564453125, 50.9287109375, 52.29296875, 53.6572265625, 55.021484375, 56.3857421875, 57.75]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 10.0, 10.0, 8.0, 13.0, 19.0, 25.0, 44.0, 44.0, 68.0, 105.0, 189.0, 240.0, 406.0, 715.0, 1478.0, 5263.0, 51064.0, 801384.0, 172726.0, 10151.0, 2271.0, 903.0, 498.0, 305.0, 190.0, 137.0, 94.0, 52.0, 38.0, 25.0, 19.0, 22.0, 10.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-278.5, -270.232421875, -261.96484375, -253.697265625, -245.4296875, -237.162109375, -228.89453125, -220.626953125, -212.359375, -204.091796875, -195.82421875, -187.556640625, -179.2890625, -171.021484375, -162.75390625, -154.486328125, -146.21875, -137.951171875, -129.68359375, -121.416015625, -113.1484375, -104.880859375, -96.61328125, -88.345703125, -80.078125, -71.810546875, -63.54296875, -55.275390625, -47.0078125, -38.740234375, -30.47265625, -22.205078125, -13.9375, -5.669921875, 2.59765625, 10.865234375, 19.1328125, 27.400390625, 35.66796875, 43.935546875, 52.203125, 60.470703125, 68.73828125, 77.005859375, 85.2734375, 93.541015625, 101.80859375, 110.076171875, 118.34375, 126.611328125, 134.87890625, 143.146484375, 151.4140625, 159.681640625, 167.94921875, 176.216796875, 184.484375, 192.751953125, 201.01953125, 209.287109375, 217.5546875, 225.822265625, 234.08984375, 242.357421875, 250.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 9.0, 9.0, 10.0, 15.0, 12.0, 12.0, 23.0, 19.0, 25.0, 30.0, 35.0, 35.0, 36.0, 48.0, 53.0, 52.0, 46.0, 35.0, 66.0, 52.0, 49.0, 37.0, 40.0, 29.0, 32.0, 35.0, 28.0, 17.0, 14.0, 22.0, 15.0, 14.0, 8.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.125, -122.79296875, -118.4609375, -114.12890625, -109.796875, -105.46484375, -101.1328125, -96.80078125, -92.46875, -88.13671875, -83.8046875, -79.47265625, -75.140625, -70.80859375, -66.4765625, -62.14453125, -57.8125, -53.48046875, -49.1484375, -44.81640625, -40.484375, -36.15234375, -31.8203125, -27.48828125, -23.15625, -18.82421875, -14.4921875, -10.16015625, -5.828125, -1.49609375, 2.8359375, 7.16796875, 11.5, 15.83203125, 20.1640625, 24.49609375, 28.828125, 33.16015625, 37.4921875, 41.82421875, 46.15625, 50.48828125, 54.8203125, 59.15234375, 63.484375, 67.81640625, 72.1484375, 76.48046875, 80.8125, 85.14453125, 89.4765625, 93.80859375, 98.140625, 102.47265625, 106.8046875, 111.13671875, 115.46875, 119.80078125, 124.1328125, 128.46484375, 132.796875, 137.12890625, 141.4609375, 145.79296875, 150.125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 7.0, 12.0, 15.0, 28.0, 40.0, 44.0, 68.0, 83.0, 162.0, 263.0, 407.0, 787.0, 1520.0, 3534.0, 9237.0, 30349.0, 140452.0, 545589.0, 245056.0, 48501.0, 13358.0, 4714.0, 2046.0, 973.0, 513.0, 280.0, 164.0, 100.0, 57.0, 52.0, 41.0, 21.0, 17.0, 9.0, 10.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.34375, -45.8486328125, -44.353515625, -42.8583984375, -41.36328125, -39.8681640625, -38.373046875, -36.8779296875, -35.3828125, -33.8876953125, -32.392578125, -30.8974609375, -29.40234375, -27.9072265625, -26.412109375, -24.9169921875, -23.421875, -21.9267578125, -20.431640625, -18.9365234375, -17.44140625, -15.9462890625, -14.451171875, -12.9560546875, -11.4609375, -9.9658203125, -8.470703125, -6.9755859375, -5.48046875, -3.9853515625, -2.490234375, -0.9951171875, 0.5, 1.9951171875, 3.490234375, 4.9853515625, 6.48046875, 7.9755859375, 9.470703125, 10.9658203125, 12.4609375, 13.9560546875, 15.451171875, 16.9462890625, 18.44140625, 19.9365234375, 21.431640625, 22.9267578125, 24.421875, 25.9169921875, 27.412109375, 28.9072265625, 30.40234375, 31.8974609375, 33.392578125, 34.8876953125, 36.3828125, 37.8779296875, 39.373046875, 40.8681640625, 42.36328125, 43.8583984375, 45.353515625, 46.8486328125, 48.34375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 13.0, 19.0, 22.0, 31.0, 36.0, 56.0, 90.0, 85.0, 97.0, 121.0, 111.0, 80.0, 62.0, 49.0, 28.0, 21.0, 16.0, 14.0, 12.0, 3.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00638580322265625, -0.006151080131530762, -0.0059163570404052734, -0.005681633949279785, -0.005446910858154297, -0.005212187767028809, -0.00497746467590332, -0.004742741584777832, -0.004508018493652344, -0.0042732954025268555, -0.004038572311401367, -0.003803849220275879, -0.0035691261291503906, -0.0033344030380249023, -0.003099679946899414, -0.0028649568557739258, -0.0026302337646484375, -0.0023955106735229492, -0.002160787582397461, -0.0019260644912719727, -0.0016913414001464844, -0.001456618309020996, -0.0012218952178955078, -0.0009871721267700195, -0.0007524490356445312, -0.000517725944519043, -0.0002830028533935547, -4.8279762268066406e-05, 0.00018644332885742188, 0.00042116641998291016, 0.0006558895111083984, 0.0008906126022338867, 0.001125335693359375, 0.0013600587844848633, 0.0015947818756103516, 0.0018295049667358398, 0.002064228057861328, 0.0022989511489868164, 0.0025336742401123047, 0.002768397331237793, 0.0030031204223632812, 0.0032378435134887695, 0.003472566604614258, 0.003707289695739746, 0.003942012786865234, 0.004176735877990723, 0.004411458969116211, 0.004646182060241699, 0.0048809051513671875, 0.005115628242492676, 0.005350351333618164, 0.005585074424743652, 0.005819797515869141, 0.006054520606994629, 0.006289243698120117, 0.0065239667892456055, 0.006758689880371094, 0.006993412971496582, 0.00722813606262207, 0.007462859153747559, 0.007697582244873047, 0.007932305335998535, 0.008167028427124023, 0.008401751518249512, 0.008636474609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 12.0, 18.0, 13.0, 43.0, 46.0, 68.0, 104.0, 179.0, 318.0, 587.0, 1215.0, 3364.0, 14316.0, 117098.0, 754400.0, 134801.0, 15524.0, 3662.0, 1329.0, 606.0, 301.0, 208.0, 94.0, 67.0, 43.0, 30.0, 22.0, 25.0, 14.0, 8.0, 5.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-75.3125, -72.9970703125, -70.681640625, -68.3662109375, -66.05078125, -63.7353515625, -61.419921875, -59.1044921875, -56.7890625, -54.4736328125, -52.158203125, -49.8427734375, -47.52734375, -45.2119140625, -42.896484375, -40.5810546875, -38.265625, -35.9501953125, -33.634765625, -31.3193359375, -29.00390625, -26.6884765625, -24.373046875, -22.0576171875, -19.7421875, -17.4267578125, -15.111328125, -12.7958984375, -10.48046875, -8.1650390625, -5.849609375, -3.5341796875, -1.21875, 1.0966796875, 3.412109375, 5.7275390625, 8.04296875, 10.3583984375, 12.673828125, 14.9892578125, 17.3046875, 19.6201171875, 21.935546875, 24.2509765625, 26.56640625, 28.8818359375, 31.197265625, 33.5126953125, 35.828125, 38.1435546875, 40.458984375, 42.7744140625, 45.08984375, 47.4052734375, 49.720703125, 52.0361328125, 54.3515625, 56.6669921875, 58.982421875, 61.2978515625, 63.61328125, 65.9287109375, 68.244140625, 70.5595703125, 72.875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 6.0, 8.0, 7.0, 9.0, 15.0, 18.0, 19.0, 34.0, 39.0, 44.0, 60.0, 98.0, 104.0, 86.0, 106.0, 77.0, 66.0, 47.0, 48.0, 25.0, 14.0, 22.0, 17.0, 8.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.65625, -42.974609375, -41.29296875, -39.611328125, -37.9296875, -36.248046875, -34.56640625, -32.884765625, -31.203125, -29.521484375, -27.83984375, -26.158203125, -24.4765625, -22.794921875, -21.11328125, -19.431640625, -17.75, -16.068359375, -14.38671875, -12.705078125, -11.0234375, -9.341796875, -7.66015625, -5.978515625, -4.296875, -2.615234375, -0.93359375, 0.748046875, 2.4296875, 4.111328125, 5.79296875, 7.474609375, 9.15625, 10.837890625, 12.51953125, 14.201171875, 15.8828125, 17.564453125, 19.24609375, 20.927734375, 22.609375, 24.291015625, 25.97265625, 27.654296875, 29.3359375, 31.017578125, 32.69921875, 34.380859375, 36.0625, 37.744140625, 39.42578125, 41.107421875, 42.7890625, 44.470703125, 46.15234375, 47.833984375, 49.515625, 51.197265625, 52.87890625, 54.560546875, 56.2421875, 57.923828125, 59.60546875, 61.287109375, 62.96875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 17.0, 40.0, 164.0, 288.0, 281.0, 123.0, 51.0, 23.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1671.16015625, -1615.161376953125, -1559.16259765625, -1503.163818359375, -1447.1650390625, -1391.166259765625, -1335.16748046875, -1279.168701171875, -1223.169921875, -1167.171142578125, -1111.17236328125, -1055.173583984375, -999.1748046875, -943.176025390625, -887.1771850585938, -831.1784057617188, -775.1795654296875, -719.1807861328125, -663.1820068359375, -607.1832275390625, -551.1844482421875, -495.1856384277344, -439.18682861328125, -383.18804931640625, -327.18927001953125, -271.19049072265625, -215.1916961669922, -159.19290161132812, -103.19412231445312, -47.195343017578125, 8.803466796875, 64.80224609375, 120.8009033203125, 176.7996826171875, 232.79847717285156, 288.7972717285156, 344.7960510253906, 400.7948303222656, 456.79364013671875, 512.7924194335938, 568.7911987304688, 624.7899780273438, 680.7887573242188, 736.78759765625, 792.786376953125, 848.78515625, 904.783935546875, 960.78271484375, 1016.781494140625, 1072.7802734375, 1128.779052734375, 1184.77783203125, 1240.776611328125, 1296.775390625, 1352.774169921875, 1408.77294921875, 1464.771728515625, 1520.7705078125, 1576.769287109375, 1632.76806640625, 1688.766845703125, 1744.765625, 1800.764404296875, 1856.76318359375, 1912.7620849609375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 5.0, 3.0, 10.0, 12.0, 12.0, 17.0, 17.0, 24.0, 22.0, 24.0, 35.0, 30.0, 40.0, 43.0, 40.0, 43.0, 41.0, 45.0, 45.0, 50.0, 46.0, 46.0, 39.0, 45.0, 41.0, 40.0, 28.0, 15.0, 26.0, 21.0, 16.0, 12.0, 8.0, 8.0, 7.0, 8.0, 5.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-729.532470703125, -708.1761474609375, -686.81982421875, -665.4635009765625, -644.107177734375, -622.7507934570312, -601.3944702148438, -580.0381469726562, -558.6818237304688, -537.3255004882812, -515.9691772460938, -494.6128234863281, -473.2565002441406, -451.9001770019531, -430.5438232421875, -409.1875, -387.8311767578125, -366.474853515625, -345.1185302734375, -323.7621765136719, -302.4058532714844, -281.0495300292969, -259.69317626953125, -238.33685302734375, -216.98052978515625, -195.62420654296875, -174.2678680419922, -152.91152954101562, -131.55520629882812, -110.1988754272461, -88.84254455566406, -67.4862060546875, -46.1298828125, -24.77355194091797, -3.4172210693359375, 17.939109802246094, 39.295440673828125, 60.651771545410156, 82.00810241699219, 103.36444091796875, 124.72076416015625, 146.07708740234375, 167.4334259033203, 188.78976440429688, 210.14608764648438, 231.50241088867188, 252.85874938964844, 274.215087890625, 295.5714111328125, 316.927734375, 338.2840576171875, 359.6404113769531, 380.9967346191406, 402.3530578613281, 423.70941162109375, 445.06573486328125, 466.42205810546875, 487.77838134765625, 509.13470458984375, 530.4910278320312, 551.847412109375, 573.2037353515625, 594.56005859375, 615.9163818359375, 637.272705078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 10.0, 5.0, 24.0, 28.0, 58.0, 100.0, 170.0, 352.0, 875.0, 2577.0, 20211.0, 4148973.0, 16993.0, 2379.0, 762.0, 352.0, 192.0, 84.0, 33.0, 32.0, 19.0, 8.0, 9.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-295.75, -286.3515625, -276.953125, -267.5546875, -258.15625, -248.7578125, -239.359375, -229.9609375, -220.5625, -211.1640625, -201.765625, -192.3671875, -182.96875, -173.5703125, -164.171875, -154.7734375, -145.375, -135.9765625, -126.578125, -117.1796875, -107.78125, -98.3828125, -88.984375, -79.5859375, -70.1875, -60.7890625, -51.390625, -41.9921875, -32.59375, -23.1953125, -13.796875, -4.3984375, 5.0, 14.3984375, 23.796875, 33.1953125, 42.59375, 51.9921875, 61.390625, 70.7890625, 80.1875, 89.5859375, 98.984375, 108.3828125, 117.78125, 127.1796875, 136.578125, 145.9765625, 155.375, 164.7734375, 174.171875, 183.5703125, 192.96875, 202.3671875, 211.765625, 221.1640625, 230.5625, 239.9609375, 249.359375, 258.7578125, 268.15625, 277.5546875, 286.953125, 296.3515625, 305.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 9.0, 2.0, 9.0, 5.0, 8.0, 16.0, 31.0, 28.0, 46.0, 60.0, 55.0, 88.0, 70.0, 94.0, 83.0, 92.0, 76.0, 58.0, 48.0, 37.0, 36.0, 19.0, 12.0, 9.0, 8.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.3125, -48.5625, -46.8125, -45.0625, -43.3125, -41.5625, -39.8125, -38.0625, -36.3125, -34.5625, -32.8125, -31.0625, -29.3125, -27.5625, -25.8125, -24.0625, -22.3125, -20.5625, -18.8125, -17.0625, -15.3125, -13.5625, -11.8125, -10.0625, -8.3125, -6.5625, -4.8125, -3.0625, -1.3125, 0.4375, 2.1875, 3.9375, 5.6875, 7.4375, 9.1875, 10.9375, 12.6875, 14.4375, 16.1875, 17.9375, 19.6875, 21.4375, 23.1875, 24.9375, 26.6875, 28.4375, 30.1875, 31.9375, 33.6875, 35.4375, 37.1875, 38.9375, 40.6875, 42.4375, 44.1875, 45.9375, 47.6875, 49.4375, 51.1875, 52.9375, 54.6875, 56.4375, 58.1875, 59.9375, 61.6875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 7.0, 4.0, 11.0, 14.0, 17.0, 28.0, 34.0, 42.0, 47.0, 80.0, 121.0, 168.0, 236.0, 355.0, 613.0, 1033.0, 2039.0, 4670.0, 14135.0, 115891.0, 4009301.0, 31281.0, 7620.0, 2926.0, 1420.0, 790.0, 456.0, 262.0, 194.0, 136.0, 93.0, 74.0, 51.0, 34.0, 27.0, 25.0, 16.0, 11.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.375, -142.94140625, -138.5078125, -134.07421875, -129.640625, -125.20703125, -120.7734375, -116.33984375, -111.90625, -107.47265625, -103.0390625, -98.60546875, -94.171875, -89.73828125, -85.3046875, -80.87109375, -76.4375, -72.00390625, -67.5703125, -63.13671875, -58.703125, -54.26953125, -49.8359375, -45.40234375, -40.96875, -36.53515625, -32.1015625, -27.66796875, -23.234375, -18.80078125, -14.3671875, -9.93359375, -5.5, -1.06640625, 3.3671875, 7.80078125, 12.234375, 16.66796875, 21.1015625, 25.53515625, 29.96875, 34.40234375, 38.8359375, 43.26953125, 47.703125, 52.13671875, 56.5703125, 61.00390625, 65.4375, 69.87109375, 74.3046875, 78.73828125, 83.171875, 87.60546875, 92.0390625, 96.47265625, 100.90625, 105.33984375, 109.7734375, 114.20703125, 118.640625, 123.07421875, 127.5078125, 131.94140625, 136.375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 3.0, 7.0, 12.0, 37.0, 92.0, 3590.0, 213.0, 55.0, 22.0, 8.0, 7.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.78125, -51.42041015625, -50.0595703125, -48.69873046875, -47.337890625, -45.97705078125, -44.6162109375, -43.25537109375, -41.89453125, -40.53369140625, -39.1728515625, -37.81201171875, -36.451171875, -35.09033203125, -33.7294921875, -32.36865234375, -31.0078125, -29.64697265625, -28.2861328125, -26.92529296875, -25.564453125, -24.20361328125, -22.8427734375, -21.48193359375, -20.12109375, -18.76025390625, -17.3994140625, -16.03857421875, -14.677734375, -13.31689453125, -11.9560546875, -10.59521484375, -9.234375, -7.87353515625, -6.5126953125, -5.15185546875, -3.791015625, -2.43017578125, -1.0693359375, 0.29150390625, 1.65234375, 3.01318359375, 4.3740234375, 5.73486328125, 7.095703125, 8.45654296875, 9.8173828125, 11.17822265625, 12.5390625, 13.89990234375, 15.2607421875, 16.62158203125, 17.982421875, 19.34326171875, 20.7041015625, 22.06494140625, 23.42578125, 24.78662109375, 26.1474609375, 27.50830078125, 28.869140625, 30.22998046875, 31.5908203125, 32.95166015625, 34.3125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 11.0, 38.0, 124.0, 275.0, 365.0, 143.0, 36.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-347.22235107421875, -338.36297607421875, -329.50360107421875, -320.6442565917969, -311.7848815917969, -302.9255065917969, -294.0661315917969, -285.2067565917969, -276.347412109375, -267.488037109375, -258.628662109375, -249.76930236816406, -240.90994262695312, -232.05056762695312, -223.19119262695312, -214.33181762695312, -205.47244262695312, -196.61306762695312, -187.7537078857422, -178.8943328857422, -170.03497314453125, -161.17559814453125, -152.31622314453125, -143.45684814453125, -134.5974884033203, -125.73812103271484, -116.87875366210938, -108.01937866210938, -99.1600112915039, -90.30064392089844, -81.44126892089844, -72.58190155029297, -63.7225341796875, -54.86316680908203, -46.0037956237793, -37.14442443847656, -28.285057067871094, -19.425689697265625, -10.56631851196289, -1.7069473266601562, 7.1524200439453125, 16.011789321899414, 24.871158599853516, 33.73052978515625, 42.58989715576172, 51.44926452636719, 60.30863571166992, 69.16800689697266, 78.02737426757812, 86.8867416381836, 95.74610900878906, 104.60548400878906, 113.46485137939453, 122.32421875, 131.18359375, 140.04296875, 148.90232849121094, 157.76170349121094, 166.62106323242188, 175.48043823242188, 184.33981323242188, 193.1991729736328, 202.0585479736328, 210.91790771484375, 219.77728271484375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 4.0, 4.0, 5.0, 6.0, 12.0, 9.0, 14.0, 14.0, 24.0, 24.0, 19.0, 24.0, 33.0, 17.0, 28.0, 34.0, 31.0, 36.0, 26.0, 41.0, 37.0, 41.0, 45.0, 37.0, 31.0, 41.0, 27.0, 36.0, 36.0, 31.0, 34.0, 29.0, 28.0, 30.0, 21.0, 13.0, 15.0, 14.0, 8.0, 12.0, 7.0, 8.0, 8.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.54640197753906, -45.96523666381836, -44.384071350097656, -42.80290603637695, -41.22174072265625, -39.64057159423828, -38.059410095214844, -36.478240966796875, -34.89707565307617, -33.31591033935547, -31.734745025634766, -30.153579711914062, -28.572412490844727, -26.991247177124023, -25.41008186340332, -23.828914642333984, -22.247751235961914, -20.66658592224121, -19.085420608520508, -17.504253387451172, -15.923088073730469, -14.341922760009766, -12.760757446289062, -11.179591178894043, -9.59842586517334, -8.017260551452637, -6.436094284057617, -4.854928970336914, -3.2737631797790527, -1.6925973892211914, -0.11143207550048828, 1.4697341918945312, 3.0508995056152344, 4.632065296173096, 6.213231086730957, 7.79439640045166, 9.37556266784668, 10.956727981567383, 12.537893295288086, 14.119059562683105, 15.700224876403809, 17.281391143798828, 18.86255645751953, 20.443721771240234, 22.024887084960938, 23.60605239868164, 25.187217712402344, 26.76838493347168, 28.349550247192383, 29.930715560913086, 31.51188087463379, 33.093048095703125, 34.67421340942383, 36.25537872314453, 37.836544036865234, 39.41770935058594, 40.99887466430664, 42.580039978027344, 44.16120529174805, 45.74237060546875, 47.32353591918945, 48.904701232910156, 50.485870361328125, 52.06703567504883, 53.64820098876953]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 8.0, 15.0, 24.0, 40.0, 49.0, 104.0, 153.0, 237.0, 479.0, 840.0, 1795.0, 4218.0, 11702.0, 39015.0, 142741.0, 393163.0, 315531.0, 96873.0, 26764.0, 8505.0, 3189.0, 1499.0, 672.0, 367.0, 208.0, 135.0, 78.0, 52.0, 38.0, 18.0, 12.0, 10.0, 4.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.0, -106.6513671875, -103.302734375, -99.9541015625, -96.60546875, -93.2568359375, -89.908203125, -86.5595703125, -83.2109375, -79.8623046875, -76.513671875, -73.1650390625, -69.81640625, -66.4677734375, -63.119140625, -59.7705078125, -56.421875, -53.0732421875, -49.724609375, -46.3759765625, -43.02734375, -39.6787109375, -36.330078125, -32.9814453125, -29.6328125, -26.2841796875, -22.935546875, -19.5869140625, -16.23828125, -12.8896484375, -9.541015625, -6.1923828125, -2.84375, 0.5048828125, 3.853515625, 7.2021484375, 10.55078125, 13.8994140625, 17.248046875, 20.5966796875, 23.9453125, 27.2939453125, 30.642578125, 33.9912109375, 37.33984375, 40.6884765625, 44.037109375, 47.3857421875, 50.734375, 54.0830078125, 57.431640625, 60.7802734375, 64.12890625, 67.4775390625, 70.826171875, 74.1748046875, 77.5234375, 80.8720703125, 84.220703125, 87.5693359375, 90.91796875, 94.2666015625, 97.615234375, 100.9638671875, 104.3125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 6.0, 10.0, 15.0, 24.0, 25.0, 38.0, 44.0, 68.0, 73.0, 83.0, 72.0, 84.0, 83.0, 89.0, 74.0, 58.0, 42.0, 28.0, 27.0, 20.0, 13.0, 11.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.53125, -48.74462890625, -46.9580078125, -45.17138671875, -43.384765625, -41.59814453125, -39.8115234375, -38.02490234375, -36.23828125, -34.45166015625, -32.6650390625, -30.87841796875, -29.091796875, -27.30517578125, -25.5185546875, -23.73193359375, -21.9453125, -20.15869140625, -18.3720703125, -16.58544921875, -14.798828125, -13.01220703125, -11.2255859375, -9.43896484375, -7.65234375, -5.86572265625, -4.0791015625, -2.29248046875, -0.505859375, 1.28076171875, 3.0673828125, 4.85400390625, 6.640625, 8.42724609375, 10.2138671875, 12.00048828125, 13.787109375, 15.57373046875, 17.3603515625, 19.14697265625, 20.93359375, 22.72021484375, 24.5068359375, 26.29345703125, 28.080078125, 29.86669921875, 31.6533203125, 33.43994140625, 35.2265625, 37.01318359375, 38.7998046875, 40.58642578125, 42.373046875, 44.15966796875, 45.9462890625, 47.73291015625, 49.51953125, 51.30615234375, 53.0927734375, 54.87939453125, 56.666015625, 58.45263671875, 60.2392578125, 62.02587890625, 63.8125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 3.0, 11.0, 10.0, 20.0, 18.0, 34.0, 54.0, 58.0, 114.0, 127.0, 166.0, 236.0, 409.0, 637.0, 1090.0, 2984.0, 23384.0, 709338.0, 294113.0, 11176.0, 1976.0, 942.0, 510.0, 333.0, 215.0, 173.0, 128.0, 83.0, 60.0, 36.0, 22.0, 27.0, 12.0, 13.0, 10.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.75, -275.84765625, -265.9453125, -256.04296875, -246.140625, -236.23828125, -226.3359375, -216.43359375, -206.53125, -196.62890625, -186.7265625, -176.82421875, -166.921875, -157.01953125, -147.1171875, -137.21484375, -127.3125, -117.41015625, -107.5078125, -97.60546875, -87.703125, -77.80078125, -67.8984375, -57.99609375, -48.09375, -38.19140625, -28.2890625, -18.38671875, -8.484375, 1.41796875, 11.3203125, 21.22265625, 31.125, 41.02734375, 50.9296875, 60.83203125, 70.734375, 80.63671875, 90.5390625, 100.44140625, 110.34375, 120.24609375, 130.1484375, 140.05078125, 149.953125, 159.85546875, 169.7578125, 179.66015625, 189.5625, 199.46484375, 209.3671875, 219.26953125, 229.171875, 239.07421875, 248.9765625, 258.87890625, 268.78125, 278.68359375, 288.5859375, 298.48828125, 308.390625, 318.29296875, 328.1953125, 338.09765625, 348.0]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 3.0, 4.0, 8.0, 14.0, 13.0, 15.0, 27.0, 30.0, 15.0, 18.0, 43.0, 34.0, 44.0, 52.0, 46.0, 57.0, 46.0, 45.0, 44.0, 47.0, 47.0, 48.0, 43.0, 35.0, 30.0, 32.0, 26.0, 19.0, 18.0, 16.0, 20.0, 14.0, 12.0, 5.0, 4.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-184.0, -178.4140625, -172.828125, -167.2421875, -161.65625, -156.0703125, -150.484375, -144.8984375, -139.3125, -133.7265625, -128.140625, -122.5546875, -116.96875, -111.3828125, -105.796875, -100.2109375, -94.625, -89.0390625, -83.453125, -77.8671875, -72.28125, -66.6953125, -61.109375, -55.5234375, -49.9375, -44.3515625, -38.765625, -33.1796875, -27.59375, -22.0078125, -16.421875, -10.8359375, -5.25, 0.3359375, 5.921875, 11.5078125, 17.09375, 22.6796875, 28.265625, 33.8515625, 39.4375, 45.0234375, 50.609375, 56.1953125, 61.78125, 67.3671875, 72.953125, 78.5390625, 84.125, 89.7109375, 95.296875, 100.8828125, 106.46875, 112.0546875, 117.640625, 123.2265625, 128.8125, 134.3984375, 139.984375, 145.5703125, 151.15625, 156.7421875, 162.328125, 167.9140625, 173.5]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 4.0, 15.0, 19.0, 27.0, 18.0, 53.0, 61.0, 105.0, 130.0, 221.0, 409.0, 791.0, 1994.0, 5782.0, 25629.0, 207531.0, 688434.0, 95464.0, 14857.0, 3986.0, 1440.0, 644.0, 331.0, 189.0, 120.0, 78.0, 60.0, 31.0, 26.0, 23.0, 10.0, 10.0, 8.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0], "bins": [-83.0625, -80.7763671875, -78.490234375, -76.2041015625, -73.91796875, -71.6318359375, -69.345703125, -67.0595703125, -64.7734375, -62.4873046875, -60.201171875, -57.9150390625, -55.62890625, -53.3427734375, -51.056640625, -48.7705078125, -46.484375, -44.1982421875, -41.912109375, -39.6259765625, -37.33984375, -35.0537109375, -32.767578125, -30.4814453125, -28.1953125, -25.9091796875, -23.623046875, -21.3369140625, -19.05078125, -16.7646484375, -14.478515625, -12.1923828125, -9.90625, -7.6201171875, -5.333984375, -3.0478515625, -0.76171875, 1.5244140625, 3.810546875, 6.0966796875, 8.3828125, 10.6689453125, 12.955078125, 15.2412109375, 17.52734375, 19.8134765625, 22.099609375, 24.3857421875, 26.671875, 28.9580078125, 31.244140625, 33.5302734375, 35.81640625, 38.1025390625, 40.388671875, 42.6748046875, 44.9609375, 47.2470703125, 49.533203125, 51.8193359375, 54.10546875, 56.3916015625, 58.677734375, 60.9638671875, 63.25]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 3.0, 3.0, 10.0, 8.0, 13.0, 13.0, 26.0, 30.0, 54.0, 48.0, 84.0, 96.0, 118.0, 116.0, 88.0, 76.0, 55.0, 42.0, 27.0, 24.0, 16.0, 13.0, 11.0, 6.0, 0.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007373809814453125, -0.007077634334564209, -0.006781458854675293, -0.006485283374786377, -0.006189107894897461, -0.005892932415008545, -0.005596756935119629, -0.005300581455230713, -0.005004405975341797, -0.004708230495452881, -0.004412055015563965, -0.004115879535675049, -0.003819704055786133, -0.003523528575897217, -0.0032273530960083008, -0.0029311776161193848, -0.0026350021362304688, -0.0023388266563415527, -0.0020426511764526367, -0.0017464756965637207, -0.0014503002166748047, -0.0011541247367858887, -0.0008579492568969727, -0.0005617737770080566, -0.0002655982971191406, 3.057718276977539e-05, 0.0003267526626586914, 0.0006229281425476074, 0.0009191036224365234, 0.0012152791023254395, 0.0015114545822143555, 0.0018076300621032715, 0.0021038055419921875, 0.0023999810218811035, 0.0026961565017700195, 0.0029923319816589355, 0.0032885074615478516, 0.0035846829414367676, 0.0038808584213256836, 0.0041770339012146, 0.004473209381103516, 0.004769384860992432, 0.005065560340881348, 0.005361735820770264, 0.00565791130065918, 0.005954086780548096, 0.006250262260437012, 0.006546437740325928, 0.006842613220214844, 0.00713878870010376, 0.007434964179992676, 0.007731139659881592, 0.008027315139770508, 0.008323490619659424, 0.00861966609954834, 0.008915841579437256, 0.009212017059326172, 0.009508192539215088, 0.009804368019104004, 0.01010054349899292, 0.010396718978881836, 0.010692894458770752, 0.010989069938659668, 0.011285245418548584, 0.0115814208984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 14.0, 25.0, 26.0, 40.0, 75.0, 130.0, 291.0, 782.0, 2977.0, 27711.0, 893993.0, 114656.0, 5775.0, 1218.0, 417.0, 164.0, 95.0, 55.0, 42.0, 25.0, 16.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.9375, -100.5068359375, -96.076171875, -91.6455078125, -87.21484375, -82.7841796875, -78.353515625, -73.9228515625, -69.4921875, -65.0615234375, -60.630859375, -56.2001953125, -51.76953125, -47.3388671875, -42.908203125, -38.4775390625, -34.046875, -29.6162109375, -25.185546875, -20.7548828125, -16.32421875, -11.8935546875, -7.462890625, -3.0322265625, 1.3984375, 5.8291015625, 10.259765625, 14.6904296875, 19.12109375, 23.5517578125, 27.982421875, 32.4130859375, 36.84375, 41.2744140625, 45.705078125, 50.1357421875, 54.56640625, 58.9970703125, 63.427734375, 67.8583984375, 72.2890625, 76.7197265625, 81.150390625, 85.5810546875, 90.01171875, 94.4423828125, 98.873046875, 103.3037109375, 107.734375, 112.1650390625, 116.595703125, 121.0263671875, 125.45703125, 129.8876953125, 134.318359375, 138.7490234375, 143.1796875, 147.6103515625, 152.041015625, 156.4716796875, 160.90234375, 165.3330078125, 169.763671875, 174.1943359375, 178.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 4.0, 8.0, 9.0, 26.0, 26.0, 35.0, 54.0, 53.0, 64.0, 80.0, 114.0, 121.0, 116.0, 68.0, 59.0, 36.0, 46.0, 22.0, 12.0, 15.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.09375, -51.82958984375, -49.5654296875, -47.30126953125, -45.037109375, -42.77294921875, -40.5087890625, -38.24462890625, -35.98046875, -33.71630859375, -31.4521484375, -29.18798828125, -26.923828125, -24.65966796875, -22.3955078125, -20.13134765625, -17.8671875, -15.60302734375, -13.3388671875, -11.07470703125, -8.810546875, -6.54638671875, -4.2822265625, -2.01806640625, 0.24609375, 2.51025390625, 4.7744140625, 7.03857421875, 9.302734375, 11.56689453125, 13.8310546875, 16.09521484375, 18.359375, 20.62353515625, 22.8876953125, 25.15185546875, 27.416015625, 29.68017578125, 31.9443359375, 34.20849609375, 36.47265625, 38.73681640625, 41.0009765625, 43.26513671875, 45.529296875, 47.79345703125, 50.0576171875, 52.32177734375, 54.5859375, 56.85009765625, 59.1142578125, 61.37841796875, 63.642578125, 65.90673828125, 68.1708984375, 70.43505859375, 72.69921875, 74.96337890625, 77.2275390625, 79.49169921875, 81.755859375, 84.02001953125, 86.2841796875, 88.54833984375, 90.8125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 10.0, 39.0, 85.0, 169.0, 273.0, 250.0, 112.0, 45.0, 10.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1913.9091796875, -1853.7603759765625, -1793.6114501953125, -1733.462646484375, -1673.3138427734375, -1613.1650390625, -1553.01611328125, -1492.8673095703125, -1432.718505859375, -1372.5697021484375, -1312.4207763671875, -1252.27197265625, -1192.1231689453125, -1131.974365234375, -1071.825439453125, -1011.6766357421875, -951.5277099609375, -891.3788452148438, -831.2300415039062, -771.0811767578125, -710.932373046875, -650.7835083007812, -590.6346435546875, -530.48583984375, -470.33697509765625, -410.1881408691406, -350.039306640625, -289.89044189453125, -229.74160766601562, -169.5927734375, -109.44390869140625, -49.295074462890625, 10.8536376953125, 71.00247955322266, 131.1513214111328, 191.3001708984375, 251.44900512695312, 311.59783935546875, 371.7467041015625, 431.8955383300781, 492.04437255859375, 552.1932373046875, 612.342041015625, 672.4909057617188, 732.6397705078125, 792.78857421875, 852.9374389648438, 913.0863037109375, 973.235107421875, 1033.3839111328125, 1093.5328369140625, 1153.681640625, 1213.8304443359375, 1273.979248046875, 1334.128173828125, 1394.2769775390625, 1454.42578125, 1514.5745849609375, 1574.7235107421875, 1634.872314453125, 1695.0211181640625, 1755.169921875, 1815.31884765625, 1875.4676513671875, 1935.6165771484375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 9.0, 7.0, 14.0, 11.0, 17.0, 24.0, 23.0, 32.0, 29.0, 38.0, 33.0, 43.0, 45.0, 46.0, 62.0, 51.0, 64.0, 43.0, 37.0, 53.0, 43.0, 41.0, 34.0, 28.0, 32.0, 21.0, 22.0, 26.0, 18.0, 16.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-933.82958984375, -908.5966186523438, -883.3636474609375, -858.1306762695312, -832.897705078125, -807.6646728515625, -782.4317016601562, -757.19873046875, -731.9657592773438, -706.7327880859375, -681.4998168945312, -656.266845703125, -631.0338134765625, -605.8008422851562, -580.56787109375, -555.3348999023438, -530.1019287109375, -504.86895751953125, -479.635986328125, -454.4029846191406, -429.1700134277344, -403.9370422363281, -378.70404052734375, -353.4710693359375, -328.23809814453125, -303.005126953125, -277.77215576171875, -252.53915405273438, -227.30618286132812, -202.07321166992188, -176.84022521972656, -151.60723876953125, -126.37432861328125, -101.14134979248047, -75.90837097167969, -50.675392150878906, -25.442413330078125, -0.20943450927734375, 25.023544311523438, 50.25653076171875, 75.489501953125, 100.72248077392578, 125.95545959472656, 151.18844604492188, 176.42141723632812, 201.65438842773438, 226.8873748779297, 252.120361328125, 277.35333251953125, 302.5863037109375, 327.81927490234375, 353.0522766113281, 378.2852478027344, 403.5182189941406, 428.751220703125, 453.98419189453125, 479.2171630859375, 504.45013427734375, 529.68310546875, 554.9160766601562, 580.1490478515625, 605.382080078125, 630.6150512695312, 655.8480224609375, 681.0809936523438]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 12.0, 8.0, 18.0, 15.0, 28.0, 46.0, 62.0, 92.0, 128.0, 231.0, 402.0, 679.0, 1348.0, 3027.0, 7936.0, 27341.0, 757264.0, 3353516.0, 28213.0, 7994.0, 3009.0, 1277.0, 678.0, 348.0, 212.0, 111.0, 94.0, 55.0, 41.0, 27.0, 26.0, 13.0, 10.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.8125, -96.7880859375, -93.763671875, -90.7392578125, -87.71484375, -84.6904296875, -81.666015625, -78.6416015625, -75.6171875, -72.5927734375, -69.568359375, -66.5439453125, -63.51953125, -60.4951171875, -57.470703125, -54.4462890625, -51.421875, -48.3974609375, -45.373046875, -42.3486328125, -39.32421875, -36.2998046875, -33.275390625, -30.2509765625, -27.2265625, -24.2021484375, -21.177734375, -18.1533203125, -15.12890625, -12.1044921875, -9.080078125, -6.0556640625, -3.03125, -0.0068359375, 3.017578125, 6.0419921875, 9.06640625, 12.0908203125, 15.115234375, 18.1396484375, 21.1640625, 24.1884765625, 27.212890625, 30.2373046875, 33.26171875, 36.2861328125, 39.310546875, 42.3349609375, 45.359375, 48.3837890625, 51.408203125, 54.4326171875, 57.45703125, 60.4814453125, 63.505859375, 66.5302734375, 69.5546875, 72.5791015625, 75.603515625, 78.6279296875, 81.65234375, 84.6767578125, 87.701171875, 90.7255859375, 93.75]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 2.0, 7.0, 7.0, 7.0, 18.0, 21.0, 36.0, 41.0, 50.0, 52.0, 71.0, 57.0, 82.0, 65.0, 70.0, 76.0, 62.0, 48.0, 54.0, 32.0, 41.0, 28.0, 21.0, 13.0, 10.0, 7.0, 5.0, 5.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.28125, -42.736328125, -41.19140625, -39.646484375, -38.1015625, -36.556640625, -35.01171875, -33.466796875, -31.921875, -30.376953125, -28.83203125, -27.287109375, -25.7421875, -24.197265625, -22.65234375, -21.107421875, -19.5625, -18.017578125, -16.47265625, -14.927734375, -13.3828125, -11.837890625, -10.29296875, -8.748046875, -7.203125, -5.658203125, -4.11328125, -2.568359375, -1.0234375, 0.521484375, 2.06640625, 3.611328125, 5.15625, 6.701171875, 8.24609375, 9.791015625, 11.3359375, 12.880859375, 14.42578125, 15.970703125, 17.515625, 19.060546875, 20.60546875, 22.150390625, 23.6953125, 25.240234375, 26.78515625, 28.330078125, 29.875, 31.419921875, 32.96484375, 34.509765625, 36.0546875, 37.599609375, 39.14453125, 40.689453125, 42.234375, 43.779296875, 45.32421875, 46.869140625, 48.4140625, 49.958984375, 51.50390625, 53.048828125, 54.59375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 10.0, 12.0, 16.0, 22.0, 36.0, 69.0, 90.0, 98.0, 156.0, 251.0, 365.0, 620.0, 813.0, 1432.0, 2299.0, 3979.0, 7997.0, 21597.0, 83390.0, 3870854.0, 147744.0, 29899.0, 10496.0, 4880.0, 2654.0, 1526.0, 1044.0, 620.0, 429.0, 265.0, 199.0, 124.0, 92.0, 52.0, 51.0, 21.0, 22.0, 17.0, 8.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.9375, -67.4072265625, -64.876953125, -62.3466796875, -59.81640625, -57.2861328125, -54.755859375, -52.2255859375, -49.6953125, -47.1650390625, -44.634765625, -42.1044921875, -39.57421875, -37.0439453125, -34.513671875, -31.9833984375, -29.453125, -26.9228515625, -24.392578125, -21.8623046875, -19.33203125, -16.8017578125, -14.271484375, -11.7412109375, -9.2109375, -6.6806640625, -4.150390625, -1.6201171875, 0.91015625, 3.4404296875, 5.970703125, 8.5009765625, 11.03125, 13.5615234375, 16.091796875, 18.6220703125, 21.15234375, 23.6826171875, 26.212890625, 28.7431640625, 31.2734375, 33.8037109375, 36.333984375, 38.8642578125, 41.39453125, 43.9248046875, 46.455078125, 48.9853515625, 51.515625, 54.0458984375, 56.576171875, 59.1064453125, 61.63671875, 64.1669921875, 66.697265625, 69.2275390625, 71.7578125, 74.2880859375, 76.818359375, 79.3486328125, 81.87890625, 84.4091796875, 86.939453125, 89.4697265625, 92.0]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 10.0, 9.0, 29.0, 41.0, 67.0, 187.0, 3363.0, 189.0, 69.0, 40.0, 20.0, 8.0, 6.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.84375, -42.7880859375, -41.732421875, -40.6767578125, -39.62109375, -38.5654296875, -37.509765625, -36.4541015625, -35.3984375, -34.3427734375, -33.287109375, -32.2314453125, -31.17578125, -30.1201171875, -29.064453125, -28.0087890625, -26.953125, -25.8974609375, -24.841796875, -23.7861328125, -22.73046875, -21.6748046875, -20.619140625, -19.5634765625, -18.5078125, -17.4521484375, -16.396484375, -15.3408203125, -14.28515625, -13.2294921875, -12.173828125, -11.1181640625, -10.0625, -9.0068359375, -7.951171875, -6.8955078125, -5.83984375, -4.7841796875, -3.728515625, -2.6728515625, -1.6171875, -0.5615234375, 0.494140625, 1.5498046875, 2.60546875, 3.6611328125, 4.716796875, 5.7724609375, 6.828125, 7.8837890625, 8.939453125, 9.9951171875, 11.05078125, 12.1064453125, 13.162109375, 14.2177734375, 15.2734375, 16.3291015625, 17.384765625, 18.4404296875, 19.49609375, 20.5517578125, 21.607421875, 22.6630859375, 23.71875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 10.0, 6.0, 10.0, 15.0, 29.0, 64.0, 66.0, 82.0, 136.0, 130.0, 118.0, 109.0, 62.0, 53.0, 42.0, 28.0, 8.0, 8.0, 6.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.57127380371094, -133.9714813232422, -130.37167358398438, -126.77188110351562, -123.17208099365234, -119.57228088378906, -115.97248077392578, -112.3726806640625, -108.77288818359375, -105.17308807373047, -101.57328796386719, -97.97349548339844, -94.37369537353516, -90.77389526367188, -87.1740951538086, -83.57429504394531, -79.97449493408203, -76.37469482421875, -72.77489471435547, -69.17509460449219, -65.57530212402344, -61.975502014160156, -58.375701904296875, -54.775901794433594, -51.17610549926758, -47.5763053894043, -43.97650909423828, -40.376708984375, -36.77690887451172, -33.1771125793457, -29.577312469482422, -25.977514266967773, -22.377716064453125, -18.777917861938477, -15.178118705749512, -11.578319549560547, -7.978521347045898, -4.37872314453125, -0.7789230346679688, 2.8208751678466797, 6.420673370361328, 10.020471572875977, 13.620270729064941, 17.220069885253906, 20.819868087768555, 24.419666290283203, 28.019466400146484, 31.619264602661133, 35.21906280517578, 38.81886291503906, 42.41865921020508, 46.01845932006836, 49.618255615234375, 53.218055725097656, 56.81785583496094, 60.41765594482422, 64.0174560546875, 67.61725616455078, 71.21705627441406, 74.81684875488281, 78.4166488647461, 82.01644897460938, 85.61624908447266, 89.21604919433594, 92.81584167480469]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 11.0, 11.0, 12.0, 8.0, 14.0, 8.0, 12.0, 26.0, 22.0, 31.0, 23.0, 34.0, 40.0, 36.0, 29.0, 43.0, 37.0, 41.0, 36.0, 36.0, 41.0, 50.0, 40.0, 49.0, 36.0, 32.0, 36.0, 21.0, 18.0, 26.0, 21.0, 17.0, 14.0, 15.0, 8.0, 9.0, 7.0, 6.0, 6.0, 7.0, 8.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.90528869628906, -49.03809356689453, -47.1708984375, -45.30370330810547, -43.43650436401367, -41.56930923461914, -39.70211410522461, -37.83491897583008, -35.96772003173828, -34.10052490234375, -32.23332977294922, -30.366132736206055, -28.49893569946289, -26.63174057006836, -24.764545440673828, -22.897350311279297, -21.030155181884766, -19.162960052490234, -17.29576301574707, -15.428567886352539, -13.561371803283691, -11.694175720214844, -9.826980590820312, -7.959784507751465, -6.092588424682617, -4.2253923416137695, -2.35819673538208, -0.4910011291503906, 1.376194953918457, 3.2433910369873047, 5.110586166381836, 6.977782249450684, 8.844978332519531, 10.712174415588379, 12.579370498657227, 14.446565628051758, 16.313762664794922, 18.180957794189453, 20.048152923583984, 21.915348052978516, 23.78254508972168, 25.64974021911621, 27.516937255859375, 29.384132385253906, 31.251327514648438, 33.11852264404297, 34.9857177734375, 36.8529167175293, 38.72011184692383, 40.58730697631836, 42.45450210571289, 44.32170104980469, 46.18889617919922, 48.05609130859375, 49.92328643798828, 51.79048156738281, 53.657676696777344, 55.524871826171875, 57.392066955566406, 59.25926208496094, 61.126461029052734, 62.993656158447266, 64.86085510253906, 66.7280502319336, 68.59524536132812]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 12.0, 11.0, 22.0, 46.0, 52.0, 81.0, 147.0, 227.0, 423.0, 672.0, 1183.0, 2381.0, 4474.0, 9756.0, 23857.0, 64417.0, 183830.0, 357562.0, 248944.0, 92298.0, 33034.0, 13073.0, 5722.0, 2815.0, 1496.0, 810.0, 466.0, 266.0, 164.0, 108.0, 76.0, 43.0, 32.0, 14.0, 8.0, 13.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.5, -72.955078125, -70.41015625, -67.865234375, -65.3203125, -62.775390625, -60.23046875, -57.685546875, -55.140625, -52.595703125, -50.05078125, -47.505859375, -44.9609375, -42.416015625, -39.87109375, -37.326171875, -34.78125, -32.236328125, -29.69140625, -27.146484375, -24.6015625, -22.056640625, -19.51171875, -16.966796875, -14.421875, -11.876953125, -9.33203125, -6.787109375, -4.2421875, -1.697265625, 0.84765625, 3.392578125, 5.9375, 8.482421875, 11.02734375, 13.572265625, 16.1171875, 18.662109375, 21.20703125, 23.751953125, 26.296875, 28.841796875, 31.38671875, 33.931640625, 36.4765625, 39.021484375, 41.56640625, 44.111328125, 46.65625, 49.201171875, 51.74609375, 54.291015625, 56.8359375, 59.380859375, 61.92578125, 64.470703125, 67.015625, 69.560546875, 72.10546875, 74.650390625, 77.1953125, 79.740234375, 82.28515625, 84.830078125, 87.375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 7.0, 6.0, 7.0, 19.0, 15.0, 32.0, 43.0, 45.0, 56.0, 58.0, 77.0, 62.0, 76.0, 74.0, 61.0, 52.0, 65.0, 44.0, 44.0, 36.0, 33.0, 16.0, 16.0, 16.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84375, -44.26025390625, -42.6767578125, -41.09326171875, -39.509765625, -37.92626953125, -36.3427734375, -34.75927734375, -33.17578125, -31.59228515625, -30.0087890625, -28.42529296875, -26.841796875, -25.25830078125, -23.6748046875, -22.09130859375, -20.5078125, -18.92431640625, -17.3408203125, -15.75732421875, -14.173828125, -12.59033203125, -11.0068359375, -9.42333984375, -7.83984375, -6.25634765625, -4.6728515625, -3.08935546875, -1.505859375, 0.07763671875, 1.6611328125, 3.24462890625, 4.828125, 6.41162109375, 7.9951171875, 9.57861328125, 11.162109375, 12.74560546875, 14.3291015625, 15.91259765625, 17.49609375, 19.07958984375, 20.6630859375, 22.24658203125, 23.830078125, 25.41357421875, 26.9970703125, 28.58056640625, 30.1640625, 31.74755859375, 33.3310546875, 34.91455078125, 36.498046875, 38.08154296875, 39.6650390625, 41.24853515625, 42.83203125, 44.41552734375, 45.9990234375, 47.58251953125, 49.166015625, 50.74951171875, 52.3330078125, 53.91650390625, 55.5]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 10.0, 18.0, 19.0, 29.0, 49.0, 62.0, 83.0, 130.0, 210.0, 339.0, 570.0, 1049.0, 2513.0, 13791.0, 625376.0, 389510.0, 10155.0, 2278.0, 918.0, 508.0, 321.0, 190.0, 122.0, 88.0, 53.0, 43.0, 29.0, 19.0, 15.0, 6.0, 7.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-269.25, -259.25390625, -249.2578125, -239.26171875, -229.265625, -219.26953125, -209.2734375, -199.27734375, -189.28125, -179.28515625, -169.2890625, -159.29296875, -149.296875, -139.30078125, -129.3046875, -119.30859375, -109.3125, -99.31640625, -89.3203125, -79.32421875, -69.328125, -59.33203125, -49.3359375, -39.33984375, -29.34375, -19.34765625, -9.3515625, 0.64453125, 10.640625, 20.63671875, 30.6328125, 40.62890625, 50.625, 60.62109375, 70.6171875, 80.61328125, 90.609375, 100.60546875, 110.6015625, 120.59765625, 130.59375, 140.58984375, 150.5859375, 160.58203125, 170.578125, 180.57421875, 190.5703125, 200.56640625, 210.5625, 220.55859375, 230.5546875, 240.55078125, 250.546875, 260.54296875, 270.5390625, 280.53515625, 290.53125, 300.52734375, 310.5234375, 320.51953125, 330.515625, 340.51171875, 350.5078125, 360.50390625, 370.5]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 19.0, 18.0, 19.0, 35.0, 31.0, 37.0, 40.0, 65.0, 58.0, 72.0, 49.0, 63.0, 64.0, 60.0, 62.0, 42.0, 53.0, 48.0, 33.0, 30.0, 27.0, 13.0, 18.0, 8.0, 7.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-193.625, -186.623046875, -179.62109375, -172.619140625, -165.6171875, -158.615234375, -151.61328125, -144.611328125, -137.609375, -130.607421875, -123.60546875, -116.603515625, -109.6015625, -102.599609375, -95.59765625, -88.595703125, -81.59375, -74.591796875, -67.58984375, -60.587890625, -53.5859375, -46.583984375, -39.58203125, -32.580078125, -25.578125, -18.576171875, -11.57421875, -4.572265625, 2.4296875, 9.431640625, 16.43359375, 23.435546875, 30.4375, 37.439453125, 44.44140625, 51.443359375, 58.4453125, 65.447265625, 72.44921875, 79.451171875, 86.453125, 93.455078125, 100.45703125, 107.458984375, 114.4609375, 121.462890625, 128.46484375, 135.466796875, 142.46875, 149.470703125, 156.47265625, 163.474609375, 170.4765625, 177.478515625, 184.48046875, 191.482421875, 198.484375, 205.486328125, 212.48828125, 219.490234375, 226.4921875, 233.494140625, 240.49609375, 247.498046875, 254.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 8.0, 7.0, 9.0, 6.0, 13.0, 16.0, 28.0, 34.0, 50.0, 58.0, 102.0, 145.0, 222.0, 391.0, 988.0, 3025.0, 17805.0, 362650.0, 628938.0, 27612.0, 4009.0, 1164.0, 497.0, 260.0, 159.0, 99.0, 57.0, 58.0, 35.0, 30.0, 17.0, 16.0, 11.0, 6.0, 3.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.5625, -98.2958984375, -95.029296875, -91.7626953125, -88.49609375, -85.2294921875, -81.962890625, -78.6962890625, -75.4296875, -72.1630859375, -68.896484375, -65.6298828125, -62.36328125, -59.0966796875, -55.830078125, -52.5634765625, -49.296875, -46.0302734375, -42.763671875, -39.4970703125, -36.23046875, -32.9638671875, -29.697265625, -26.4306640625, -23.1640625, -19.8974609375, -16.630859375, -13.3642578125, -10.09765625, -6.8310546875, -3.564453125, -0.2978515625, 2.96875, 6.2353515625, 9.501953125, 12.7685546875, 16.03515625, 19.3017578125, 22.568359375, 25.8349609375, 29.1015625, 32.3681640625, 35.634765625, 38.9013671875, 42.16796875, 45.4345703125, 48.701171875, 51.9677734375, 55.234375, 58.5009765625, 61.767578125, 65.0341796875, 68.30078125, 71.5673828125, 74.833984375, 78.1005859375, 81.3671875, 84.6337890625, 87.900390625, 91.1669921875, 94.43359375, 97.7001953125, 100.966796875, 104.2333984375, 107.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 3.0, 15.0, 9.0, 23.0, 38.0, 41.0, 70.0, 72.0, 92.0, 116.0, 113.0, 103.0, 76.0, 60.0, 34.0, 18.0, 35.0, 14.0, 12.0, 18.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007762908935546875, -0.007476508617401123, -0.007190108299255371, -0.006903707981109619, -0.006617307662963867, -0.006330907344818115, -0.006044507026672363, -0.005758106708526611, -0.005471706390380859, -0.005185306072235107, -0.0048989057540893555, -0.0046125054359436035, -0.0043261051177978516, -0.0040397047996521, -0.0037533044815063477, -0.0034669041633605957, -0.0031805038452148438, -0.002894103527069092, -0.00260770320892334, -0.002321302890777588, -0.002034902572631836, -0.001748502254486084, -0.001462101936340332, -0.00117570161819458, -0.0008893013000488281, -0.0006029009819030762, -0.0003165006637573242, -3.0100345611572266e-05, 0.0002562999725341797, 0.0005427002906799316, 0.0008291006088256836, 0.0011155009269714355, 0.0014019012451171875, 0.0016883015632629395, 0.0019747018814086914, 0.0022611021995544434, 0.0025475025177001953, 0.0028339028358459473, 0.0031203031539916992, 0.003406703472137451, 0.003693103790283203, 0.003979504108428955, 0.004265904426574707, 0.004552304744720459, 0.004838705062866211, 0.005125105381011963, 0.005411505699157715, 0.005697906017303467, 0.005984306335449219, 0.006270706653594971, 0.006557106971740723, 0.006843507289886475, 0.0071299076080322266, 0.0074163079261779785, 0.0077027082443237305, 0.007989108562469482, 0.008275508880615234, 0.008561909198760986, 0.008848309516906738, 0.00913470983505249, 0.009421110153198242, 0.009707510471343994, 0.009993910789489746, 0.010280311107635498, 0.01056671142578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 11.0, 11.0, 15.0, 25.0, 33.0, 38.0, 63.0, 114.0, 205.0, 407.0, 1041.0, 3774.0, 27205.0, 839918.0, 163271.0, 9129.0, 1902.0, 650.0, 289.0, 164.0, 95.0, 56.0, 33.0, 24.0, 19.0, 13.0, 12.0, 7.0, 9.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.5, -119.349609375, -115.19921875, -111.048828125, -106.8984375, -102.748046875, -98.59765625, -94.447265625, -90.296875, -86.146484375, -81.99609375, -77.845703125, -73.6953125, -69.544921875, -65.39453125, -61.244140625, -57.09375, -52.943359375, -48.79296875, -44.642578125, -40.4921875, -36.341796875, -32.19140625, -28.041015625, -23.890625, -19.740234375, -15.58984375, -11.439453125, -7.2890625, -3.138671875, 1.01171875, 5.162109375, 9.3125, 13.462890625, 17.61328125, 21.763671875, 25.9140625, 30.064453125, 34.21484375, 38.365234375, 42.515625, 46.666015625, 50.81640625, 54.966796875, 59.1171875, 63.267578125, 67.41796875, 71.568359375, 75.71875, 79.869140625, 84.01953125, 88.169921875, 92.3203125, 96.470703125, 100.62109375, 104.771484375, 108.921875, 113.072265625, 117.22265625, 121.373046875, 125.5234375, 129.673828125, 133.82421875, 137.974609375, 142.125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 23.0, 13.0, 36.0, 32.0, 48.0, 71.0, 77.0, 91.0, 100.0, 97.0, 98.0, 73.0, 55.0, 52.0, 23.0, 19.0, 17.0, 4.0, 11.0, 7.0, 10.0, 2.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.875, -70.7255859375, -68.576171875, -66.4267578125, -64.27734375, -62.1279296875, -59.978515625, -57.8291015625, -55.6796875, -53.5302734375, -51.380859375, -49.2314453125, -47.08203125, -44.9326171875, -42.783203125, -40.6337890625, -38.484375, -36.3349609375, -34.185546875, -32.0361328125, -29.88671875, -27.7373046875, -25.587890625, -23.4384765625, -21.2890625, -19.1396484375, -16.990234375, -14.8408203125, -12.69140625, -10.5419921875, -8.392578125, -6.2431640625, -4.09375, -1.9443359375, 0.205078125, 2.3544921875, 4.50390625, 6.6533203125, 8.802734375, 10.9521484375, 13.1015625, 15.2509765625, 17.400390625, 19.5498046875, 21.69921875, 23.8486328125, 25.998046875, 28.1474609375, 30.296875, 32.4462890625, 34.595703125, 36.7451171875, 38.89453125, 41.0439453125, 43.193359375, 45.3427734375, 47.4921875, 49.6416015625, 51.791015625, 53.9404296875, 56.08984375, 58.2392578125, 60.388671875, 62.5380859375, 64.6875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 22.0, 113.0, 489.0, 321.0, 50.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6015.5625, -5881.4345703125, -5747.306640625, -5613.17919921875, -5479.05126953125, -5344.92333984375, -5210.7958984375, -5076.66796875, -4942.5400390625, -4808.412109375, -4674.2841796875, -4540.15673828125, -4406.02880859375, -4271.90087890625, -4137.7734375, -4003.6455078125, -3869.517578125, -3735.3896484375, -3601.261962890625, -3467.13427734375, -3333.00634765625, -3198.87841796875, -3064.750732421875, -2930.623046875, -2796.4951171875, -2662.3671875, -2528.239501953125, -2394.11181640625, -2259.98388671875, -2125.85595703125, -1991.728271484375, -1857.6004638671875, -1723.47216796875, -1589.3443603515625, -1455.216552734375, -1321.0887451171875, -1186.9609375, -1052.8331298828125, -918.705322265625, -784.5775146484375, -650.44970703125, -516.3218994140625, -382.194091796875, -248.0662841796875, -113.9384765625, 20.1893310546875, 154.317138671875, 288.4449462890625, 422.57275390625, 556.7005615234375, 690.828369140625, 824.9561767578125, 959.083984375, 1093.2117919921875, 1227.339599609375, 1361.4674072265625, 1495.59521484375, 1629.7230224609375, 1763.850830078125, 1897.9786376953125, 2032.1064453125, 2166.234375, 2300.362060546875, 2434.48974609375, 2568.61767578125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 8.0, 8.0, 12.0, 13.0, 27.0, 15.0, 21.0, 27.0, 27.0, 35.0, 39.0, 54.0, 44.0, 57.0, 45.0, 55.0, 67.0, 54.0, 47.0, 39.0, 44.0, 34.0, 36.0, 24.0, 22.0, 24.0, 23.0, 18.0, 14.0, 13.0, 11.0, 9.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-850.74365234375, -823.8064575195312, -796.8692626953125, -769.9320678710938, -742.994873046875, -716.0576171875, -689.1204223632812, -662.1832275390625, -635.2460327148438, -608.308837890625, -581.3716430664062, -554.4344482421875, -527.4971923828125, -500.5600280761719, -473.622802734375, -446.68560791015625, -419.7484130859375, -392.81121826171875, -365.8740234375, -338.9367980957031, -311.9996032714844, -285.0624084472656, -258.12518310546875, -231.18798828125, -204.25079345703125, -177.3135986328125, -150.3763885498047, -123.4391860961914, -96.50198364257812, -69.56478881835938, -42.62757873535156, -15.69036865234375, 11.24688720703125, 38.18408966064453, 65.12129211425781, 92.0584945678711, 118.99569702148438, 145.93289184570312, 172.87010192871094, 199.80731201171875, 226.7445068359375, 253.68170166015625, 280.618896484375, 307.5561218261719, 334.4933166503906, 361.4305114746094, 388.36773681640625, 415.304931640625, 442.24212646484375, 469.1793212890625, 496.11651611328125, 523.0537109375, 549.990966796875, 576.9281005859375, 603.8653564453125, 630.8025512695312, 657.73974609375, 684.6769409179688, 711.6141357421875, 738.5513305664062, 765.488525390625, 792.42578125, 819.3629760742188, 846.3001708984375, 873.2373657226562]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 15.0, 11.0, 22.0, 35.0, 32.0, 48.0, 74.0, 93.0, 136.0, 198.0, 305.0, 549.0, 892.0, 1648.0, 3344.0, 8942.0, 47621.0, 4095070.0, 23219.0, 6109.0, 2551.0, 1330.0, 727.0, 442.0, 282.0, 177.0, 122.0, 77.0, 41.0, 44.0, 30.0, 14.0, 19.0, 13.0, 15.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-151.5, -147.3291015625, -143.158203125, -138.9873046875, -134.81640625, -130.6455078125, -126.474609375, -122.3037109375, -118.1328125, -113.9619140625, -109.791015625, -105.6201171875, -101.44921875, -97.2783203125, -93.107421875, -88.9365234375, -84.765625, -80.5947265625, -76.423828125, -72.2529296875, -68.08203125, -63.9111328125, -59.740234375, -55.5693359375, -51.3984375, -47.2275390625, -43.056640625, -38.8857421875, -34.71484375, -30.5439453125, -26.373046875, -22.2021484375, -18.03125, -13.8603515625, -9.689453125, -5.5185546875, -1.34765625, 2.8232421875, 6.994140625, 11.1650390625, 15.3359375, 19.5068359375, 23.677734375, 27.8486328125, 32.01953125, 36.1904296875, 40.361328125, 44.5322265625, 48.703125, 52.8740234375, 57.044921875, 61.2158203125, 65.38671875, 69.5576171875, 73.728515625, 77.8994140625, 82.0703125, 86.2412109375, 90.412109375, 94.5830078125, 98.75390625, 102.9248046875, 107.095703125, 111.2666015625, 115.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 7.0, 5.0, 13.0, 8.0, 17.0, 23.0, 20.0, 31.0, 41.0, 45.0, 57.0, 48.0, 65.0, 66.0, 78.0, 53.0, 57.0, 57.0, 52.0, 47.0, 35.0, 26.0, 28.0, 27.0, 21.0, 9.0, 12.0, 9.0, 10.0, 3.0, 4.0, 8.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.927734375, -37.57421875, -36.220703125, -34.8671875, -33.513671875, -32.16015625, -30.806640625, -29.453125, -28.099609375, -26.74609375, -25.392578125, -24.0390625, -22.685546875, -21.33203125, -19.978515625, -18.625, -17.271484375, -15.91796875, -14.564453125, -13.2109375, -11.857421875, -10.50390625, -9.150390625, -7.796875, -6.443359375, -5.08984375, -3.736328125, -2.3828125, -1.029296875, 0.32421875, 1.677734375, 3.03125, 4.384765625, 5.73828125, 7.091796875, 8.4453125, 9.798828125, 11.15234375, 12.505859375, 13.859375, 15.212890625, 16.56640625, 17.919921875, 19.2734375, 20.626953125, 21.98046875, 23.333984375, 24.6875, 26.041015625, 27.39453125, 28.748046875, 30.1015625, 31.455078125, 32.80859375, 34.162109375, 35.515625, 36.869140625, 38.22265625, 39.576171875, 40.9296875, 42.283203125, 43.63671875, 44.990234375, 46.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 5.0, 11.0, 13.0, 18.0, 35.0, 36.0, 61.0, 66.0, 123.0, 213.0, 285.0, 387.0, 723.0, 1157.0, 1935.0, 3979.0, 8436.0, 23371.0, 116076.0, 3968214.0, 43367.0, 13429.0, 5698.0, 2821.0, 1382.0, 843.0, 528.0, 333.0, 237.0, 154.0, 121.0, 73.0, 47.0, 32.0, 20.0, 15.0, 16.0, 6.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.25, -86.6435546875, -84.037109375, -81.4306640625, -78.82421875, -76.2177734375, -73.611328125, -71.0048828125, -68.3984375, -65.7919921875, -63.185546875, -60.5791015625, -57.97265625, -55.3662109375, -52.759765625, -50.1533203125, -47.546875, -44.9404296875, -42.333984375, -39.7275390625, -37.12109375, -34.5146484375, -31.908203125, -29.3017578125, -26.6953125, -24.0888671875, -21.482421875, -18.8759765625, -16.26953125, -13.6630859375, -11.056640625, -8.4501953125, -5.84375, -3.2373046875, -0.630859375, 1.9755859375, 4.58203125, 7.1884765625, 9.794921875, 12.4013671875, 15.0078125, 17.6142578125, 20.220703125, 22.8271484375, 25.43359375, 28.0400390625, 30.646484375, 33.2529296875, 35.859375, 38.4658203125, 41.072265625, 43.6787109375, 46.28515625, 48.8916015625, 51.498046875, 54.1044921875, 56.7109375, 59.3173828125, 61.923828125, 64.5302734375, 67.13671875, 69.7431640625, 72.349609375, 74.9560546875, 77.5625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 13.0, 18.0, 19.0, 49.0, 107.0, 3595.0, 114.0, 38.0, 26.0, 18.0, 11.0, 15.0, 3.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.21875, -21.411376953125, -20.60400390625, -19.796630859375, -18.9892578125, -18.181884765625, -17.37451171875, -16.567138671875, -15.759765625, -14.952392578125, -14.14501953125, -13.337646484375, -12.5302734375, -11.722900390625, -10.91552734375, -10.108154296875, -9.30078125, -8.493408203125, -7.68603515625, -6.878662109375, -6.0712890625, -5.263916015625, -4.45654296875, -3.649169921875, -2.841796875, -2.034423828125, -1.22705078125, -0.419677734375, 0.3876953125, 1.195068359375, 2.00244140625, 2.809814453125, 3.6171875, 4.424560546875, 5.23193359375, 6.039306640625, 6.8466796875, 7.654052734375, 8.46142578125, 9.268798828125, 10.076171875, 10.883544921875, 11.69091796875, 12.498291015625, 13.3056640625, 14.113037109375, 14.92041015625, 15.727783203125, 16.53515625, 17.342529296875, 18.14990234375, 18.957275390625, 19.7646484375, 20.572021484375, 21.37939453125, 22.186767578125, 22.994140625, 23.801513671875, 24.60888671875, 25.416259765625, 26.2236328125, 27.031005859375, 27.83837890625, 28.645751953125, 29.453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 8.0, 20.0, 66.0, 142.0, 243.0, 239.0, 178.0, 59.0, 23.0, 14.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.30206298828125, -229.56483459472656, -223.82760620117188, -218.09036254882812, -212.35313415527344, -206.61590576171875, -200.87867736816406, -195.14144897460938, -189.40420532226562, -183.66697692871094, -177.92974853515625, -172.1925048828125, -166.4552764892578, -160.71804809570312, -154.98081970214844, -149.24359130859375, -143.50636291503906, -137.76913452148438, -132.0319061279297, -126.29467010498047, -120.55743408203125, -114.82020568847656, -109.08297729492188, -103.34574890136719, -97.60851287841797, -91.87128448486328, -86.13404846191406, -80.39682006835938, -74.65959167480469, -68.92235565185547, -63.18512725830078, -57.44789505004883, -51.710662841796875, -45.97343063354492, -40.23619842529297, -34.49897003173828, -28.761737823486328, -23.024505615234375, -17.287277221679688, -11.550045013427734, -5.812812805175781, -0.07558155059814453, 5.661649703979492, 11.398880004882812, 17.136112213134766, 22.87334442138672, 28.610572814941406, 34.34780502319336, 40.08503723144531, 45.822269439697266, 51.55950164794922, 57.296730041503906, 63.03396224975586, 68.77119445800781, 74.5084228515625, 80.24565124511719, 85.9828872680664, 91.7201156616211, 97.45735168457031, 103.194580078125, 108.93180847167969, 114.6690444946289, 120.4062728881836, 126.14350891113281, 131.8807373046875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 5.0, 3.0, 13.0, 8.0, 10.0, 14.0, 18.0, 16.0, 30.0, 28.0, 32.0, 39.0, 43.0, 35.0, 42.0, 56.0, 58.0, 50.0, 57.0, 39.0, 52.0, 40.0, 41.0, 37.0, 34.0, 40.0, 28.0, 28.0, 27.0, 14.0, 16.0, 8.0, 8.0, 3.0, 14.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-63.07673645019531, -61.28229904174805, -59.48786163330078, -57.693424224853516, -55.89898681640625, -54.10455322265625, -52.31011199951172, -50.51567840576172, -48.72124099731445, -46.92680358886719, -45.13236618041992, -43.337928771972656, -41.54349136352539, -39.749053955078125, -37.954620361328125, -36.16018295288086, -34.365745544433594, -32.57130813598633, -30.776870727539062, -28.982433319091797, -27.187997817993164, -25.3935604095459, -23.599123001098633, -21.8046875, -20.01024627685547, -18.215808868408203, -16.421371459960938, -14.626935005187988, -12.832498550415039, -11.038061141967773, -9.243623733520508, -7.449187278747559, -5.654750823974609, -3.860313892364502, -2.0658767223358154, -0.2714395523071289, 1.5229973793029785, 3.317434310913086, 5.111871719360352, 6.906308174133301, 8.700745582580566, 10.495182991027832, 12.289619445800781, 14.084056854248047, 15.878494262695312, 17.672931671142578, 19.467369079589844, 21.261804580688477, 23.056241989135742, 24.850679397583008, 26.645116806030273, 28.439552307128906, 30.233989715576172, 32.02842712402344, 33.8228645324707, 35.61730194091797, 37.411739349365234, 39.2061767578125, 41.000614166259766, 42.79505157470703, 44.5894889831543, 46.38392639160156, 48.17835998535156, 49.97279739379883, 51.767234802246094]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 11.0, 10.0, 16.0, 18.0, 35.0, 49.0, 95.0, 140.0, 220.0, 438.0, 833.0, 1627.0, 3483.0, 8801.0, 25460.0, 95778.0, 392989.0, 384310.0, 93687.0, 25064.0, 8519.0, 3483.0, 1673.0, 775.0, 405.0, 224.0, 140.0, 79.0, 56.0, 36.0, 24.0, 8.0, 11.0, 12.0, 4.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-131.125, -127.150390625, -123.17578125, -119.201171875, -115.2265625, -111.251953125, -107.27734375, -103.302734375, -99.328125, -95.353515625, -91.37890625, -87.404296875, -83.4296875, -79.455078125, -75.48046875, -71.505859375, -67.53125, -63.556640625, -59.58203125, -55.607421875, -51.6328125, -47.658203125, -43.68359375, -39.708984375, -35.734375, -31.759765625, -27.78515625, -23.810546875, -19.8359375, -15.861328125, -11.88671875, -7.912109375, -3.9375, 0.037109375, 4.01171875, 7.986328125, 11.9609375, 15.935546875, 19.91015625, 23.884765625, 27.859375, 31.833984375, 35.80859375, 39.783203125, 43.7578125, 47.732421875, 51.70703125, 55.681640625, 59.65625, 63.630859375, 67.60546875, 71.580078125, 75.5546875, 79.529296875, 83.50390625, 87.478515625, 91.453125, 95.427734375, 99.40234375, 103.376953125, 107.3515625, 111.326171875, 115.30078125, 119.275390625, 123.25]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 7.0, 3.0, 5.0, 8.0, 12.0, 12.0, 25.0, 22.0, 28.0, 44.0, 39.0, 44.0, 48.0, 60.0, 54.0, 63.0, 62.0, 61.0, 56.0, 40.0, 42.0, 43.0, 46.0, 30.0, 25.0, 19.0, 16.0, 19.0, 12.0, 8.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.02978515625, -34.7158203125, -33.40185546875, -32.087890625, -30.77392578125, -29.4599609375, -28.14599609375, -26.83203125, -25.51806640625, -24.2041015625, -22.89013671875, -21.576171875, -20.26220703125, -18.9482421875, -17.63427734375, -16.3203125, -15.00634765625, -13.6923828125, -12.37841796875, -11.064453125, -9.75048828125, -8.4365234375, -7.12255859375, -5.80859375, -4.49462890625, -3.1806640625, -1.86669921875, -0.552734375, 0.76123046875, 2.0751953125, 3.38916015625, 4.703125, 6.01708984375, 7.3310546875, 8.64501953125, 9.958984375, 11.27294921875, 12.5869140625, 13.90087890625, 15.21484375, 16.52880859375, 17.8427734375, 19.15673828125, 20.470703125, 21.78466796875, 23.0986328125, 24.41259765625, 25.7265625, 27.04052734375, 28.3544921875, 29.66845703125, 30.982421875, 32.29638671875, 33.6103515625, 34.92431640625, 36.23828125, 37.55224609375, 38.8662109375, 40.18017578125, 41.494140625, 42.80810546875, 44.1220703125, 45.43603515625, 46.75]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 8.0, 14.0, 16.0, 45.0, 69.0, 110.0, 195.0, 345.0, 759.0, 2007.0, 26142.0, 1001818.0, 13868.0, 1725.0, 670.0, 355.0, 177.0, 92.0, 52.0, 30.0, 26.0, 17.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-641.0, -623.875, -606.75, -589.625, -572.5, -555.375, -538.25, -521.125, -504.0, -486.875, -469.75, -452.625, -435.5, -418.375, -401.25, -384.125, -367.0, -349.875, -332.75, -315.625, -298.5, -281.375, -264.25, -247.125, -230.0, -212.875, -195.75, -178.625, -161.5, -144.375, -127.25, -110.125, -93.0, -75.875, -58.75, -41.625, -24.5, -7.375, 9.75, 26.875, 44.0, 61.125, 78.25, 95.375, 112.5, 129.625, 146.75, 163.875, 181.0, 198.125, 215.25, 232.375, 249.5, 266.625, 283.75, 300.875, 318.0, 335.125, 352.25, 369.375, 386.5, 403.625, 420.75, 437.875, 455.0]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 1.0, 7.0, 7.0, 10.0, 18.0, 9.0, 20.0, 30.0, 19.0, 28.0, 33.0, 27.0, 39.0, 52.0, 39.0, 46.0, 47.0, 38.0, 44.0, 33.0, 42.0, 34.0, 44.0, 27.0, 42.0, 36.0, 40.0, 32.0, 20.0, 15.0, 18.0, 19.0, 14.0, 13.0, 7.0, 6.0, 7.0, 10.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0], "bins": [-183.25, -178.064453125, -172.87890625, -167.693359375, -162.5078125, -157.322265625, -152.13671875, -146.951171875, -141.765625, -136.580078125, -131.39453125, -126.208984375, -121.0234375, -115.837890625, -110.65234375, -105.466796875, -100.28125, -95.095703125, -89.91015625, -84.724609375, -79.5390625, -74.353515625, -69.16796875, -63.982421875, -58.796875, -53.611328125, -48.42578125, -43.240234375, -38.0546875, -32.869140625, -27.68359375, -22.498046875, -17.3125, -12.126953125, -6.94140625, -1.755859375, 3.4296875, 8.615234375, 13.80078125, 18.986328125, 24.171875, 29.357421875, 34.54296875, 39.728515625, 44.9140625, 50.099609375, 55.28515625, 60.470703125, 65.65625, 70.841796875, 76.02734375, 81.212890625, 86.3984375, 91.583984375, 96.76953125, 101.955078125, 107.140625, 112.326171875, 117.51171875, 122.697265625, 127.8828125, 133.068359375, 138.25390625, 143.439453125, 148.625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 9.0, 8.0, 7.0, 10.0, 16.0, 24.0, 24.0, 30.0, 43.0, 53.0, 65.0, 102.0, 191.0, 369.0, 978.0, 6575.0, 913070.0, 122358.0, 3144.0, 693.0, 258.0, 131.0, 84.0, 68.0, 51.0, 39.0, 27.0, 25.0, 20.0, 19.0, 15.0, 6.0, 7.0, 4.0, 2.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-318.75, -309.046875, -299.34375, -289.640625, -279.9375, -270.234375, -260.53125, -250.828125, -241.125, -231.421875, -221.71875, -212.015625, -202.3125, -192.609375, -182.90625, -173.203125, -163.5, -153.796875, -144.09375, -134.390625, -124.6875, -114.984375, -105.28125, -95.578125, -85.875, -76.171875, -66.46875, -56.765625, -47.0625, -37.359375, -27.65625, -17.953125, -8.25, 1.453125, 11.15625, 20.859375, 30.5625, 40.265625, 49.96875, 59.671875, 69.375, 79.078125, 88.78125, 98.484375, 108.1875, 117.890625, 127.59375, 137.296875, 147.0, 156.703125, 166.40625, 176.109375, 185.8125, 195.515625, 205.21875, 214.921875, 224.625, 234.328125, 244.03125, 253.734375, 263.4375, 273.140625, 282.84375, 292.546875, 302.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 12.0, 18.0, 35.0, 50.0, 63.0, 131.0, 210.0, 164.0, 112.0, 84.0, 36.0, 20.0, 18.0, 10.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0137176513671875, -0.0131683349609375, -0.0126190185546875, -0.0120697021484375, -0.0115203857421875, -0.0109710693359375, -0.0104217529296875, -0.0098724365234375, -0.0093231201171875, -0.0087738037109375, -0.0082244873046875, -0.0076751708984375, -0.0071258544921875, -0.0065765380859375, -0.0060272216796875, -0.0054779052734375, -0.0049285888671875, -0.0043792724609375, -0.0038299560546875, -0.0032806396484375, -0.0027313232421875, -0.0021820068359375, -0.0016326904296875, -0.0010833740234375, -0.0005340576171875, 1.52587890625e-05, 0.0005645751953125, 0.0011138916015625, 0.0016632080078125, 0.0022125244140625, 0.0027618408203125, 0.0033111572265625, 0.0038604736328125, 0.0044097900390625, 0.0049591064453125, 0.0055084228515625, 0.0060577392578125, 0.0066070556640625, 0.0071563720703125, 0.0077056884765625, 0.0082550048828125, 0.0088043212890625, 0.0093536376953125, 0.0099029541015625, 0.0104522705078125, 0.0110015869140625, 0.0115509033203125, 0.0121002197265625, 0.0126495361328125, 0.0131988525390625, 0.0137481689453125, 0.0142974853515625, 0.0148468017578125, 0.0153961181640625, 0.0159454345703125, 0.0164947509765625, 0.0170440673828125, 0.0175933837890625, 0.0181427001953125, 0.0186920166015625, 0.0192413330078125, 0.0197906494140625, 0.0203399658203125, 0.0208892822265625, 0.0214385986328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 11.0, 9.0, 7.0, 18.0, 29.0, 41.0, 57.0, 91.0, 144.0, 254.0, 602.0, 1647.0, 6777.0, 69629.0, 943402.0, 20411.0, 3481.0, 1032.0, 381.0, 209.0, 99.0, 59.0, 43.0, 32.0, 19.0, 21.0, 16.0, 8.0, 6.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.0, -208.74609375, -200.4921875, -192.23828125, -183.984375, -175.73046875, -167.4765625, -159.22265625, -150.96875, -142.71484375, -134.4609375, -126.20703125, -117.953125, -109.69921875, -101.4453125, -93.19140625, -84.9375, -76.68359375, -68.4296875, -60.17578125, -51.921875, -43.66796875, -35.4140625, -27.16015625, -18.90625, -10.65234375, -2.3984375, 5.85546875, 14.109375, 22.36328125, 30.6171875, 38.87109375, 47.125, 55.37890625, 63.6328125, 71.88671875, 80.140625, 88.39453125, 96.6484375, 104.90234375, 113.15625, 121.41015625, 129.6640625, 137.91796875, 146.171875, 154.42578125, 162.6796875, 170.93359375, 179.1875, 187.44140625, 195.6953125, 203.94921875, 212.203125, 220.45703125, 228.7109375, 236.96484375, 245.21875, 253.47265625, 261.7265625, 269.98046875, 278.234375, 286.48828125, 294.7421875, 302.99609375, 311.25]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 6.0, 4.0, 4.0, 13.0, 21.0, 16.0, 18.0, 24.0, 47.0, 76.0, 134.0, 133.0, 162.0, 106.0, 67.0, 43.0, 33.0, 21.0, 15.0, 20.0, 8.0, 4.0, 4.0, 7.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.25, -127.658203125, -123.06640625, -118.474609375, -113.8828125, -109.291015625, -104.69921875, -100.107421875, -95.515625, -90.923828125, -86.33203125, -81.740234375, -77.1484375, -72.556640625, -67.96484375, -63.373046875, -58.78125, -54.189453125, -49.59765625, -45.005859375, -40.4140625, -35.822265625, -31.23046875, -26.638671875, -22.046875, -17.455078125, -12.86328125, -8.271484375, -3.6796875, 0.912109375, 5.50390625, 10.095703125, 14.6875, 19.279296875, 23.87109375, 28.462890625, 33.0546875, 37.646484375, 42.23828125, 46.830078125, 51.421875, 56.013671875, 60.60546875, 65.197265625, 69.7890625, 74.380859375, 78.97265625, 83.564453125, 88.15625, 92.748046875, 97.33984375, 101.931640625, 106.5234375, 111.115234375, 115.70703125, 120.298828125, 124.890625, 129.482421875, 134.07421875, 138.666015625, 143.2578125, 147.849609375, 152.44140625, 157.033203125, 161.625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 13.0, 126.0, 532.0, 290.0, 30.0, 10.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3490.555908203125, -3336.560546875, -3182.56494140625, -3028.5693359375, -2874.573974609375, -2720.57861328125, -2566.5830078125, -2412.58740234375, -2258.592041015625, -2104.5966796875, -1950.60107421875, -1796.6055908203125, -1642.610107421875, -1488.6146240234375, -1334.619140625, -1180.6236572265625, -1026.628173828125, -872.6326904296875, -718.63720703125, -564.6417236328125, -410.646240234375, -256.6507568359375, -102.6552734375, 51.3402099609375, 205.335693359375, 359.3311767578125, 513.32666015625, 667.3221435546875, 821.317626953125, 975.3131103515625, 1129.30859375, 1283.3040771484375, 1437.2998046875, 1591.2952880859375, 1745.290771484375, 1899.2862548828125, 2053.28173828125, 2207.27734375, 2361.272705078125, 2515.26806640625, 2669.263671875, 2823.25927734375, 2977.254638671875, 3131.25, 3285.24560546875, 3439.2412109375, 3593.236572265625, 3747.23193359375, 3901.2275390625, 4055.22314453125, 4209.21875, 4363.2138671875, 4517.20947265625, 4671.205078125, 4825.2001953125, 4979.19580078125, 5133.19140625, 5287.18701171875, 5441.1826171875, 5595.177734375, 5749.17333984375, 5903.1689453125, 6057.1640625, 6211.15966796875, 6365.1552734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 7.0, 8.0, 9.0, 17.0, 17.0, 15.0, 25.0, 30.0, 24.0, 42.0, 34.0, 31.0, 57.0, 72.0, 49.0, 44.0, 50.0, 58.0, 53.0, 47.0, 40.0, 40.0, 38.0, 28.0, 36.0, 24.0, 13.0, 22.0, 14.0, 4.0, 10.0, 4.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1033.558349609375, -1004.7240600585938, -975.8897705078125, -947.0555419921875, -918.2212524414062, -889.386962890625, -860.5526733398438, -831.7183837890625, -802.8841552734375, -774.0498657226562, -745.215576171875, -716.38134765625, -687.5470581054688, -658.7127685546875, -629.8784790039062, -601.044189453125, -572.2099609375, -543.3756713867188, -514.5413818359375, -485.7071228027344, -456.87286376953125, -428.03857421875, -399.20428466796875, -370.3700256347656, -341.53570556640625, -312.701416015625, -283.8671569824219, -255.03286743164062, -226.1986083984375, -197.36431884765625, -168.53004455566406, -139.69577026367188, -110.86151123046875, -82.02723693847656, -53.19295883178711, -24.358680725097656, 4.475593566894531, 33.30987548828125, 62.14414978027344, 90.97842407226562, 119.81269836425781, 148.64697265625, 177.4812469482422, 206.31552124023438, 235.14981079101562, 263.98406982421875, 292.818359375, 321.65264892578125, 350.4869079589844, 379.3211975097656, 408.15545654296875, 436.98974609375, 465.8240051269531, 494.6582946777344, 523.4925537109375, 552.3268432617188, 581.1611328125, 609.9954223632812, 638.8297119140625, 667.6639404296875, 696.4982299804688, 725.33251953125, 754.1668090820312, 783.0010986328125, 811.8353271484375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 20.0, 24.0, 37.0, 46.0, 98.0, 156.0, 290.0, 541.0, 1015.0, 2402.0, 5668.0, 17883.0, 123069.0, 3992427.0, 35130.0, 8975.0, 3460.0, 1484.0, 708.0, 342.0, 179.0, 110.0, 50.0, 44.0, 21.0, 16.0, 15.0, 11.0, 7.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-109.75, -106.54296875, -103.3359375, -100.12890625, -96.921875, -93.71484375, -90.5078125, -87.30078125, -84.09375, -80.88671875, -77.6796875, -74.47265625, -71.265625, -68.05859375, -64.8515625, -61.64453125, -58.4375, -55.23046875, -52.0234375, -48.81640625, -45.609375, -42.40234375, -39.1953125, -35.98828125, -32.78125, -29.57421875, -26.3671875, -23.16015625, -19.953125, -16.74609375, -13.5390625, -10.33203125, -7.125, -3.91796875, -0.7109375, 2.49609375, 5.703125, 8.91015625, 12.1171875, 15.32421875, 18.53125, 21.73828125, 24.9453125, 28.15234375, 31.359375, 34.56640625, 37.7734375, 40.98046875, 44.1875, 47.39453125, 50.6015625, 53.80859375, 57.015625, 60.22265625, 63.4296875, 66.63671875, 69.84375, 73.05078125, 76.2578125, 79.46484375, 82.671875, 85.87890625, 89.0859375, 92.29296875, 95.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 9.0, 26.0, 44.0, 64.0, 81.0, 69.0, 103.0, 98.0, 103.0, 93.0, 88.0, 46.0, 54.0, 29.0, 20.0, 19.0, 13.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-92.5, -90.17333984375, -87.8466796875, -85.52001953125, -83.193359375, -80.86669921875, -78.5400390625, -76.21337890625, -73.88671875, -71.56005859375, -69.2333984375, -66.90673828125, -64.580078125, -62.25341796875, -59.9267578125, -57.60009765625, -55.2734375, -52.94677734375, -50.6201171875, -48.29345703125, -45.966796875, -43.64013671875, -41.3134765625, -38.98681640625, -36.66015625, -34.33349609375, -32.0068359375, -29.68017578125, -27.353515625, -25.02685546875, -22.7001953125, -20.37353515625, -18.046875, -15.72021484375, -13.3935546875, -11.06689453125, -8.740234375, -6.41357421875, -4.0869140625, -1.76025390625, 0.56640625, 2.89306640625, 5.2197265625, 7.54638671875, 9.873046875, 12.19970703125, 14.5263671875, 16.85302734375, 19.1796875, 21.50634765625, 23.8330078125, 26.15966796875, 28.486328125, 30.81298828125, 33.1396484375, 35.46630859375, 37.79296875, 40.11962890625, 42.4462890625, 44.77294921875, 47.099609375, 49.42626953125, 51.7529296875, 54.07958984375, 56.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 7.0, 10.0, 16.0, 11.0, 4.0, 13.0, 22.0, 23.0, 39.0, 36.0, 62.0, 95.0, 229.0, 469.0, 1182.0, 3763.0, 27866.0, 4103345.0, 49513.0, 5099.0, 1335.0, 529.0, 202.0, 125.0, 84.0, 54.0, 30.0, 20.0, 16.0, 20.0, 12.0, 15.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-266.0, -258.923828125, -251.84765625, -244.771484375, -237.6953125, -230.619140625, -223.54296875, -216.466796875, -209.390625, -202.314453125, -195.23828125, -188.162109375, -181.0859375, -174.009765625, -166.93359375, -159.857421875, -152.78125, -145.705078125, -138.62890625, -131.552734375, -124.4765625, -117.400390625, -110.32421875, -103.248046875, -96.171875, -89.095703125, -82.01953125, -74.943359375, -67.8671875, -60.791015625, -53.71484375, -46.638671875, -39.5625, -32.486328125, -25.41015625, -18.333984375, -11.2578125, -4.181640625, 2.89453125, 9.970703125, 17.046875, 24.123046875, 31.19921875, 38.275390625, 45.3515625, 52.427734375, 59.50390625, 66.580078125, 73.65625, 80.732421875, 87.80859375, 94.884765625, 101.9609375, 109.037109375, 116.11328125, 123.189453125, 130.265625, 137.341796875, 144.41796875, 151.494140625, 158.5703125, 165.646484375, 172.72265625, 179.798828125, 186.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 10.0, 13.0, 42.0, 90.0, 3266.0, 509.0, 80.0, 27.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-143.875, -140.740234375, -137.60546875, -134.470703125, -131.3359375, -128.201171875, -125.06640625, -121.931640625, -118.796875, -115.662109375, -112.52734375, -109.392578125, -106.2578125, -103.123046875, -99.98828125, -96.853515625, -93.71875, -90.583984375, -87.44921875, -84.314453125, -81.1796875, -78.044921875, -74.91015625, -71.775390625, -68.640625, -65.505859375, -62.37109375, -59.236328125, -56.1015625, -52.966796875, -49.83203125, -46.697265625, -43.5625, -40.427734375, -37.29296875, -34.158203125, -31.0234375, -27.888671875, -24.75390625, -21.619140625, -18.484375, -15.349609375, -12.21484375, -9.080078125, -5.9453125, -2.810546875, 0.32421875, 3.458984375, 6.59375, 9.728515625, 12.86328125, 15.998046875, 19.1328125, 22.267578125, 25.40234375, 28.537109375, 31.671875, 34.806640625, 37.94140625, 41.076171875, 44.2109375, 47.345703125, 50.48046875, 53.615234375, 56.75]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 14.0, 29.0, 143.0, 317.0, 298.0, 145.0, 32.0, 17.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1023.88720703125, -1005.2698364257812, -986.6524658203125, -968.0350952148438, -949.417724609375, -930.8003540039062, -912.1829833984375, -893.5656127929688, -874.9482421875, -856.3308715820312, -837.7135009765625, -819.0961303710938, -800.478759765625, -781.8613891601562, -763.2440185546875, -744.6266479492188, -726.00927734375, -707.3919067382812, -688.7745361328125, -670.1571655273438, -651.539794921875, -632.9224243164062, -614.3050537109375, -595.6876831054688, -577.0703125, -558.4529418945312, -539.8355712890625, -521.2182006835938, -502.600830078125, -483.98345947265625, -465.3660888671875, -446.74871826171875, -428.13140869140625, -409.5140380859375, -390.89666748046875, -372.279296875, -353.66192626953125, -335.0445556640625, -316.42718505859375, -297.809814453125, -279.19244384765625, -260.5750732421875, -241.95770263671875, -223.34033203125, -204.72296142578125, -186.1055908203125, -167.48822021484375, -148.870849609375, -130.25347900390625, -111.6361083984375, -93.01873779296875, -74.4013671875, -55.78399658203125, -37.1666259765625, -18.54925537109375, 0.068115234375, 18.68548583984375, 37.3028564453125, 55.92022705078125, 74.53759765625, 93.15496826171875, 111.7723388671875, 130.38970947265625, 149.007080078125, 167.62445068359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 12.0, 21.0, 25.0, 31.0, 33.0, 59.0, 65.0, 78.0, 81.0, 95.0, 89.0, 86.0, 79.0, 67.0, 43.0, 36.0, 34.0, 26.0, 15.0, 14.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.74136352539062, -236.0111846923828, -227.28102111816406, -218.55084228515625, -209.8206787109375, -201.0904998779297, -192.36032104492188, -183.63015747070312, -174.8999786376953, -166.1697998046875, -157.43963623046875, -148.70945739746094, -139.97927856445312, -131.24911499023438, -122.51893615722656, -113.78876495361328, -105.05859375, -96.32842254638672, -87.59825134277344, -78.86807250976562, -70.13790130615234, -61.40773010253906, -52.677555084228516, -43.94738006591797, -35.21720886230469, -26.487035751342773, -17.75686264038086, -9.026689529418945, -0.29651641845703125, 8.43365478515625, 17.163829803466797, 25.894004821777344, 34.62420654296875, 43.35437774658203, 52.08455276489258, 60.814727783203125, 69.5448989868164, 78.27507019042969, 87.0052490234375, 95.73542022705078, 104.46559143066406, 113.19576263427734, 121.92593383789062, 130.65611267089844, 139.38629150390625, 148.116455078125, 156.8466339111328, 165.57681274414062, 174.30697631835938, 183.0371551513672, 191.76731872558594, 200.49749755859375, 209.2276611328125, 217.9578399658203, 226.68801879882812, 235.41818237304688, 244.1483612060547, 252.8785400390625, 261.60870361328125, 270.3388671875, 279.0690612792969, 287.7992248535156, 296.5293884277344, 305.25958251953125, 313.98974609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 3.0, 6.0, 1.0, 11.0, 15.0, 32.0, 33.0, 43.0, 73.0, 130.0, 168.0, 298.0, 540.0, 932.0, 1723.0, 3957.0, 10667.0, 40975.0, 250033.0, 572525.0, 128693.0, 24142.0, 7305.0, 2961.0, 1360.0, 795.0, 424.0, 225.0, 154.0, 110.0, 66.0, 40.0, 29.0, 23.0, 17.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-165.0, -160.048828125, -155.09765625, -150.146484375, -145.1953125, -140.244140625, -135.29296875, -130.341796875, -125.390625, -120.439453125, -115.48828125, -110.537109375, -105.5859375, -100.634765625, -95.68359375, -90.732421875, -85.78125, -80.830078125, -75.87890625, -70.927734375, -65.9765625, -61.025390625, -56.07421875, -51.123046875, -46.171875, -41.220703125, -36.26953125, -31.318359375, -26.3671875, -21.416015625, -16.46484375, -11.513671875, -6.5625, -1.611328125, 3.33984375, 8.291015625, 13.2421875, 18.193359375, 23.14453125, 28.095703125, 33.046875, 37.998046875, 42.94921875, 47.900390625, 52.8515625, 57.802734375, 62.75390625, 67.705078125, 72.65625, 77.607421875, 82.55859375, 87.509765625, 92.4609375, 97.412109375, 102.36328125, 107.314453125, 112.265625, 117.216796875, 122.16796875, 127.119140625, 132.0703125, 137.021484375, 141.97265625, 146.923828125, 151.875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 3.0, 8.0, 16.0, 14.0, 21.0, 27.0, 39.0, 60.0, 65.0, 77.0, 81.0, 103.0, 83.0, 76.0, 74.0, 59.0, 49.0, 41.0, 30.0, 21.0, 15.0, 7.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.25, -81.1103515625, -78.970703125, -76.8310546875, -74.69140625, -72.5517578125, -70.412109375, -68.2724609375, -66.1328125, -63.9931640625, -61.853515625, -59.7138671875, -57.57421875, -55.4345703125, -53.294921875, -51.1552734375, -49.015625, -46.8759765625, -44.736328125, -42.5966796875, -40.45703125, -38.3173828125, -36.177734375, -34.0380859375, -31.8984375, -29.7587890625, -27.619140625, -25.4794921875, -23.33984375, -21.2001953125, -19.060546875, -16.9208984375, -14.78125, -12.6416015625, -10.501953125, -8.3623046875, -6.22265625, -4.0830078125, -1.943359375, 0.1962890625, 2.3359375, 4.4755859375, 6.615234375, 8.7548828125, 10.89453125, 13.0341796875, 15.173828125, 17.3134765625, 19.453125, 21.5927734375, 23.732421875, 25.8720703125, 28.01171875, 30.1513671875, 32.291015625, 34.4306640625, 36.5703125, 38.7099609375, 40.849609375, 42.9892578125, 45.12890625, 47.2685546875, 49.408203125, 51.5478515625, 53.6875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 5.0, 10.0, 9.0, 26.0, 46.0, 55.0, 72.0, 89.0, 150.0, 234.0, 451.0, 682.0, 1419.0, 3742.0, 18116.0, 531906.0, 467796.0, 16973.0, 3547.0, 1418.0, 697.0, 411.0, 224.0, 153.0, 97.0, 70.0, 40.0, 34.0, 15.0, 21.0, 6.0, 7.0, 6.0, 10.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5, -280.72265625, -271.9453125, -263.16796875, -254.390625, -245.61328125, -236.8359375, -228.05859375, -219.28125, -210.50390625, -201.7265625, -192.94921875, -184.171875, -175.39453125, -166.6171875, -157.83984375, -149.0625, -140.28515625, -131.5078125, -122.73046875, -113.953125, -105.17578125, -96.3984375, -87.62109375, -78.84375, -70.06640625, -61.2890625, -52.51171875, -43.734375, -34.95703125, -26.1796875, -17.40234375, -8.625, 0.15234375, 8.9296875, 17.70703125, 26.484375, 35.26171875, 44.0390625, 52.81640625, 61.59375, 70.37109375, 79.1484375, 87.92578125, 96.703125, 105.48046875, 114.2578125, 123.03515625, 131.8125, 140.58984375, 149.3671875, 158.14453125, 166.921875, 175.69921875, 184.4765625, 193.25390625, 202.03125, 210.80859375, 219.5859375, 228.36328125, 237.140625, 245.91796875, 254.6953125, 263.47265625, 272.25]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 13.0, 18.0, 27.0, 31.0, 51.0, 64.0, 64.0, 93.0, 112.0, 101.0, 83.0, 85.0, 84.0, 61.0, 35.0, 27.0, 15.0, 13.0, 11.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-485.25, -474.462890625, -463.67578125, -452.888671875, -442.1015625, -431.314453125, -420.52734375, -409.740234375, -398.953125, -388.166015625, -377.37890625, -366.591796875, -355.8046875, -345.017578125, -334.23046875, -323.443359375, -312.65625, -301.869140625, -291.08203125, -280.294921875, -269.5078125, -258.720703125, -247.93359375, -237.146484375, -226.359375, -215.572265625, -204.78515625, -193.998046875, -183.2109375, -172.423828125, -161.63671875, -150.849609375, -140.0625, -129.275390625, -118.48828125, -107.701171875, -96.9140625, -86.126953125, -75.33984375, -64.552734375, -53.765625, -42.978515625, -32.19140625, -21.404296875, -10.6171875, 0.169921875, 10.95703125, 21.744140625, 32.53125, 43.318359375, 54.10546875, 64.892578125, 75.6796875, 86.466796875, 97.25390625, 108.041015625, 118.828125, 129.615234375, 140.40234375, 151.189453125, 161.9765625, 172.763671875, 183.55078125, 194.337890625, 205.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 9.0, 4.0, 8.0, 7.0, 13.0, 18.0, 12.0, 22.0, 32.0, 38.0, 55.0, 68.0, 96.0, 179.0, 342.0, 670.0, 1972.0, 10057.0, 221397.0, 785068.0, 23173.0, 3300.0, 926.0, 394.0, 206.0, 140.0, 75.0, 53.0, 54.0, 36.0, 20.0, 24.0, 16.0, 10.0, 10.0, 2.0, 6.0, 7.0, 6.0, 5.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-108.25, -104.9873046875, -101.724609375, -98.4619140625, -95.19921875, -91.9365234375, -88.673828125, -85.4111328125, -82.1484375, -78.8857421875, -75.623046875, -72.3603515625, -69.09765625, -65.8349609375, -62.572265625, -59.3095703125, -56.046875, -52.7841796875, -49.521484375, -46.2587890625, -42.99609375, -39.7333984375, -36.470703125, -33.2080078125, -29.9453125, -26.6826171875, -23.419921875, -20.1572265625, -16.89453125, -13.6318359375, -10.369140625, -7.1064453125, -3.84375, -0.5810546875, 2.681640625, 5.9443359375, 9.20703125, 12.4697265625, 15.732421875, 18.9951171875, 22.2578125, 25.5205078125, 28.783203125, 32.0458984375, 35.30859375, 38.5712890625, 41.833984375, 45.0966796875, 48.359375, 51.6220703125, 54.884765625, 58.1474609375, 61.41015625, 64.6728515625, 67.935546875, 71.1982421875, 74.4609375, 77.7236328125, 80.986328125, 84.2490234375, 87.51171875, 90.7744140625, 94.037109375, 97.2998046875, 100.5625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 0.0, 6.0, 7.0, 8.0, 6.0, 12.0, 17.0, 16.0, 22.0, 45.0, 59.0, 70.0, 82.0, 124.0, 113.0, 105.0, 78.0, 51.0, 44.0, 23.0, 31.0, 17.0, 18.0, 11.0, 4.0, 7.0, 3.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00843048095703125, -0.008150339126586914, -0.007870197296142578, -0.007590055465698242, -0.007309913635253906, -0.00702977180480957, -0.006749629974365234, -0.0064694881439208984, -0.0061893463134765625, -0.0059092044830322266, -0.005629062652587891, -0.005348920822143555, -0.005068778991699219, -0.004788637161254883, -0.004508495330810547, -0.004228353500366211, -0.003948211669921875, -0.003668069839477539, -0.003387928009033203, -0.003107786178588867, -0.0028276443481445312, -0.0025475025177001953, -0.0022673606872558594, -0.0019872188568115234, -0.0017070770263671875, -0.0014269351959228516, -0.0011467933654785156, -0.0008666515350341797, -0.0005865097045898438, -0.0003063678741455078, -2.6226043701171875e-05, 0.00025391578674316406, 0.0005340576171875, 0.0008141994476318359, 0.0010943412780761719, 0.0013744831085205078, 0.0016546249389648438, 0.0019347667694091797, 0.0022149085998535156, 0.0024950504302978516, 0.0027751922607421875, 0.0030553340911865234, 0.0033354759216308594, 0.0036156177520751953, 0.0038957595825195312, 0.004175901412963867, 0.004456043243408203, 0.004736185073852539, 0.005016326904296875, 0.005296468734741211, 0.005576610565185547, 0.005856752395629883, 0.006136894226074219, 0.006417036056518555, 0.006697177886962891, 0.0069773197174072266, 0.0072574615478515625, 0.0075376033782958984, 0.007817745208740234, 0.00809788703918457, 0.008378028869628906, 0.008658170700073242, 0.008938312530517578, 0.009218454360961914, 0.00949859619140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 8.0, 5.0, 6.0, 10.0, 17.0, 19.0, 49.0, 65.0, 111.0, 240.0, 448.0, 1016.0, 2542.0, 8130.0, 56474.0, 914908.0, 52286.0, 7779.0, 2475.0, 981.0, 450.0, 184.0, 118.0, 70.0, 43.0, 27.0, 18.0, 17.0, 8.0, 11.0, 5.0, 8.0, 4.0, 2.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-151.625, -147.580078125, -143.53515625, -139.490234375, -135.4453125, -131.400390625, -127.35546875, -123.310546875, -119.265625, -115.220703125, -111.17578125, -107.130859375, -103.0859375, -99.041015625, -94.99609375, -90.951171875, -86.90625, -82.861328125, -78.81640625, -74.771484375, -70.7265625, -66.681640625, -62.63671875, -58.591796875, -54.546875, -50.501953125, -46.45703125, -42.412109375, -38.3671875, -34.322265625, -30.27734375, -26.232421875, -22.1875, -18.142578125, -14.09765625, -10.052734375, -6.0078125, -1.962890625, 2.08203125, 6.126953125, 10.171875, 14.216796875, 18.26171875, 22.306640625, 26.3515625, 30.396484375, 34.44140625, 38.486328125, 42.53125, 46.576171875, 50.62109375, 54.666015625, 58.7109375, 62.755859375, 66.80078125, 70.845703125, 74.890625, 78.935546875, 82.98046875, 87.025390625, 91.0703125, 95.115234375, 99.16015625, 103.205078125, 107.25]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 7.0, 7.0, 19.0, 36.0, 62.0, 106.0, 180.0, 183.0, 136.0, 94.0, 60.0, 42.0, 13.0, 13.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.75, -84.15234375, -80.5546875, -76.95703125, -73.359375, -69.76171875, -66.1640625, -62.56640625, -58.96875, -55.37109375, -51.7734375, -48.17578125, -44.578125, -40.98046875, -37.3828125, -33.78515625, -30.1875, -26.58984375, -22.9921875, -19.39453125, -15.796875, -12.19921875, -8.6015625, -5.00390625, -1.40625, 2.19140625, 5.7890625, 9.38671875, 12.984375, 16.58203125, 20.1796875, 23.77734375, 27.375, 30.97265625, 34.5703125, 38.16796875, 41.765625, 45.36328125, 48.9609375, 52.55859375, 56.15625, 59.75390625, 63.3515625, 66.94921875, 70.546875, 74.14453125, 77.7421875, 81.33984375, 84.9375, 88.53515625, 92.1328125, 95.73046875, 99.328125, 102.92578125, 106.5234375, 110.12109375, 113.71875, 117.31640625, 120.9140625, 124.51171875, 128.109375, 131.70703125, 135.3046875, 138.90234375, 142.5]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 6.0, 14.0, 44.0, 94.0, 219.0, 281.0, 180.0, 93.0, 33.0, 18.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3132.603515625, -3066.642822265625, -3000.681884765625, -2934.72119140625, -2868.76025390625, -2802.799560546875, -2736.838623046875, -2670.8779296875, -2604.9169921875, -2538.956298828125, -2472.995361328125, -2407.03466796875, -2341.07373046875, -2275.113037109375, -2209.152099609375, -2143.19140625, -2077.23046875, -2011.2696533203125, -1945.308837890625, -1879.3480224609375, -1813.38720703125, -1747.4263916015625, -1681.465576171875, -1615.5048828125, -1549.544189453125, -1483.5833740234375, -1417.62255859375, -1351.6617431640625, -1285.700927734375, -1219.7401123046875, -1153.779296875, -1087.818603515625, -1021.857666015625, -955.8968505859375, -889.93603515625, -823.9752197265625, -758.014404296875, -692.0535888671875, -626.0928344726562, -560.1320190429688, -494.17120361328125, -428.21038818359375, -362.24957275390625, -296.2887878417969, -230.32797241210938, -164.36715698242188, -98.4063720703125, -32.445556640625, 33.5152587890625, 99.47606658935547, 165.43687438964844, 231.39767456054688, 297.3584899902344, 363.3193054199219, 429.28009033203125, 495.24090576171875, 561.2017211914062, 627.1625366210938, 693.1233520507812, 759.0841064453125, 825.044921875, 891.0057373046875, 956.966552734375, 1022.9273681640625, 1088.88818359375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 7.0, 10.0, 11.0, 14.0, 23.0, 36.0, 41.0, 35.0, 56.0, 61.0, 60.0, 65.0, 75.0, 72.0, 56.0, 51.0, 53.0, 41.0, 43.0, 34.0, 37.0, 22.0, 23.0, 19.0, 9.0, 5.0, 10.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1139.2607421875, -1104.7119140625, -1070.1630859375, -1035.6141357421875, -1001.0653076171875, -966.5164794921875, -931.9675903320312, -897.418701171875, -862.869873046875, -828.321044921875, -793.7721557617188, -759.2232666015625, -724.6744384765625, -690.1256103515625, -655.5767211914062, -621.02783203125, -586.47900390625, -551.93017578125, -517.3812866210938, -482.8324279785156, -448.2835693359375, -413.7347106933594, -379.18585205078125, -344.6369934082031, -310.088134765625, -275.5392761230469, -240.99041748046875, -206.44155883789062, -171.8927001953125, -137.34384155273438, -102.79498291015625, -68.24612426757812, -33.6971435546875, 0.851715087890625, 35.40057373046875, 69.94943237304688, 104.498291015625, 139.04714965820312, 173.59600830078125, 208.14486694335938, 242.6937255859375, 277.2425842285156, 311.79144287109375, 346.3403015136719, 380.88916015625, 415.4380187988281, 449.98687744140625, 484.5357360839844, 519.0845947265625, 553.6334228515625, 588.1823120117188, 622.731201171875, 657.280029296875, 691.828857421875, 726.3777465820312, 760.9266357421875, 795.4754638671875, 830.0242919921875, 864.5731811523438, 899.1220703125, 933.6708984375, 968.2197265625, 1002.7686157226562, 1037.3175048828125, 1071.8663330078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 4.0, 8.0, 4.0, 8.0, 12.0, 13.0, 11.0, 27.0, 30.0, 53.0, 76.0, 134.0, 216.0, 475.0, 1066.0, 3056.0, 11482.0, 72450.0, 3759963.0, 311821.0, 24527.0, 5647.0, 1700.0, 707.0, 317.0, 169.0, 99.0, 62.0, 36.0, 31.0, 17.0, 12.0, 6.0, 8.0, 6.0, 2.0, 6.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0], "bins": [-131.625, -127.197265625, -122.76953125, -118.341796875, -113.9140625, -109.486328125, -105.05859375, -100.630859375, -96.203125, -91.775390625, -87.34765625, -82.919921875, -78.4921875, -74.064453125, -69.63671875, -65.208984375, -60.78125, -56.353515625, -51.92578125, -47.498046875, -43.0703125, -38.642578125, -34.21484375, -29.787109375, -25.359375, -20.931640625, -16.50390625, -12.076171875, -7.6484375, -3.220703125, 1.20703125, 5.634765625, 10.0625, 14.490234375, 18.91796875, 23.345703125, 27.7734375, 32.201171875, 36.62890625, 41.056640625, 45.484375, 49.912109375, 54.33984375, 58.767578125, 63.1953125, 67.623046875, 72.05078125, 76.478515625, 80.90625, 85.333984375, 89.76171875, 94.189453125, 98.6171875, 103.044921875, 107.47265625, 111.900390625, 116.328125, 120.755859375, 125.18359375, 129.611328125, 134.0390625, 138.466796875, 142.89453125, 147.322265625, 151.75]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 8.0, 6.0, 8.0, 5.0, 7.0, 23.0, 16.0, 23.0, 36.0, 32.0, 46.0, 49.0, 51.0, 47.0, 54.0, 67.0, 49.0, 51.0, 62.0, 50.0, 43.0, 49.0, 48.0, 31.0, 32.0, 29.0, 21.0, 14.0, 14.0, 10.0, 8.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.96875, -39.7138671875, -38.458984375, -37.2041015625, -35.94921875, -34.6943359375, -33.439453125, -32.1845703125, -30.9296875, -29.6748046875, -28.419921875, -27.1650390625, -25.91015625, -24.6552734375, -23.400390625, -22.1455078125, -20.890625, -19.6357421875, -18.380859375, -17.1259765625, -15.87109375, -14.6162109375, -13.361328125, -12.1064453125, -10.8515625, -9.5966796875, -8.341796875, -7.0869140625, -5.83203125, -4.5771484375, -3.322265625, -2.0673828125, -0.8125, 0.4423828125, 1.697265625, 2.9521484375, 4.20703125, 5.4619140625, 6.716796875, 7.9716796875, 9.2265625, 10.4814453125, 11.736328125, 12.9912109375, 14.24609375, 15.5009765625, 16.755859375, 18.0107421875, 19.265625, 20.5205078125, 21.775390625, 23.0302734375, 24.28515625, 25.5400390625, 26.794921875, 28.0498046875, 29.3046875, 30.5595703125, 31.814453125, 33.0693359375, 34.32421875, 35.5791015625, 36.833984375, 38.0888671875, 39.34375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 8.0, 17.0, 34.0, 48.0, 106.0, 186.0, 469.0, 1749.0, 10491.0, 174818.0, 3946128.0, 53394.0, 5230.0, 1020.0, 310.0, 111.0, 59.0, 30.0, 20.0, 10.0, 7.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.125, -121.494140625, -114.86328125, -108.232421875, -101.6015625, -94.970703125, -88.33984375, -81.708984375, -75.078125, -68.447265625, -61.81640625, -55.185546875, -48.5546875, -41.923828125, -35.29296875, -28.662109375, -22.03125, -15.400390625, -8.76953125, -2.138671875, 4.4921875, 11.123046875, 17.75390625, 24.384765625, 31.015625, 37.646484375, 44.27734375, 50.908203125, 57.5390625, 64.169921875, 70.80078125, 77.431640625, 84.0625, 90.693359375, 97.32421875, 103.955078125, 110.5859375, 117.216796875, 123.84765625, 130.478515625, 137.109375, 143.740234375, 150.37109375, 157.001953125, 163.6328125, 170.263671875, 176.89453125, 183.525390625, 190.15625, 196.787109375, 203.41796875, 210.048828125, 216.6796875, 223.310546875, 229.94140625, 236.572265625, 243.203125, 249.833984375, 256.46484375, 263.095703125, 269.7265625, 276.357421875, 282.98828125, 289.619140625, 296.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 10.0, 11.0, 15.0, 18.0, 21.0, 24.0, 50.0, 76.0, 122.0, 238.0, 718.0, 1598.0, 637.0, 206.0, 86.0, 70.0, 44.0, 44.0, 16.0, 11.0, 12.0, 11.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-133.5, -129.728515625, -125.95703125, -122.185546875, -118.4140625, -114.642578125, -110.87109375, -107.099609375, -103.328125, -99.556640625, -95.78515625, -92.013671875, -88.2421875, -84.470703125, -80.69921875, -76.927734375, -73.15625, -69.384765625, -65.61328125, -61.841796875, -58.0703125, -54.298828125, -50.52734375, -46.755859375, -42.984375, -39.212890625, -35.44140625, -31.669921875, -27.8984375, -24.126953125, -20.35546875, -16.583984375, -12.8125, -9.041015625, -5.26953125, -1.498046875, 2.2734375, 6.044921875, 9.81640625, 13.587890625, 17.359375, 21.130859375, 24.90234375, 28.673828125, 32.4453125, 36.216796875, 39.98828125, 43.759765625, 47.53125, 51.302734375, 55.07421875, 58.845703125, 62.6171875, 66.388671875, 70.16015625, 73.931640625, 77.703125, 81.474609375, 85.24609375, 89.017578125, 92.7890625, 96.560546875, 100.33203125, 104.103515625, 107.875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 12.0, 16.0, 54.0, 196.0, 411.0, 241.0, 41.0, 20.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3091.7822265625, -3024.01318359375, -2956.244384765625, -2888.475341796875, -2820.706298828125, -2752.9375, -2685.16845703125, -2617.3994140625, -2549.63037109375, -2481.861328125, -2414.092529296875, -2346.323486328125, -2278.554443359375, -2210.78564453125, -2143.0166015625, -2075.24755859375, -2007.478759765625, -1939.7098388671875, -1871.9407958984375, -1804.171875, -1736.40283203125, -1668.6339111328125, -1600.864990234375, -1533.095947265625, -1465.3270263671875, -1397.55810546875, -1329.7890625, -1262.0201416015625, -1194.251220703125, -1126.482177734375, -1058.7132568359375, -990.9442749023438, -923.175537109375, -855.4065551757812, -787.6375732421875, -719.86865234375, -652.0996704101562, -584.3306884765625, -516.561767578125, -448.79278564453125, -381.0238037109375, -313.25482177734375, -245.48587036132812, -177.71690368652344, -109.94793701171875, -42.178955078125, 25.589996337890625, 93.35894775390625, 161.1279296875, 228.8968963623047, 296.6658630371094, 364.434814453125, 432.20379638671875, 499.9727783203125, 567.74169921875, 635.5106811523438, 703.2796630859375, 771.0486450195312, 838.817626953125, 906.5865478515625, 974.3555297851562, 1042.12451171875, 1109.8934326171875, 1177.662353515625, 1245.431396484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 6.0, 2.0, 7.0, 14.0, 18.0, 17.0, 27.0, 23.0, 18.0, 24.0, 36.0, 33.0, 42.0, 39.0, 57.0, 44.0, 48.0, 44.0, 47.0, 51.0, 45.0, 39.0, 51.0, 32.0, 39.0, 38.0, 26.0, 23.0, 14.0, 24.0, 16.0, 12.0, 11.0, 5.0, 4.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0], "bins": [-602.1848754882812, -586.462646484375, -570.740478515625, -555.0182495117188, -539.2960205078125, -523.5737915039062, -507.8515930175781, -492.12939453125, -476.40716552734375, -460.6849670410156, -444.9627380371094, -429.24053955078125, -413.518310546875, -397.7961120605469, -382.0738830566406, -366.3516845703125, -350.62945556640625, -334.9072570800781, -319.1850280761719, -303.46282958984375, -287.7406005859375, -272.0184020996094, -256.2961730957031, -240.573974609375, -224.85177612304688, -209.1295623779297, -193.4073486328125, -177.6851348876953, -161.96292114257812, -146.24072265625, -130.51849365234375, -114.7962875366211, -99.07406616210938, -83.35185241699219, -67.629638671875, -51.90742874145508, -36.18521499633789, -20.46300506591797, -4.740791320800781, 10.981422424316406, 26.703636169433594, 42.42584991455078, 58.14806365966797, 73.87026977539062, 89.59248352050781, 105.314697265625, 121.03691101074219, 136.75912475585938, 152.48133850097656, 168.20355224609375, 183.92576599121094, 199.64797973632812, 215.3701934814453, 231.0924072265625, 246.81460571289062, 262.5368347167969, 278.259033203125, 293.9812316894531, 309.7034606933594, 325.4256591796875, 341.14788818359375, 356.8700866699219, 372.5923156738281, 388.31451416015625, 404.0367431640625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 14.0, 18.0, 38.0, 69.0, 125.0, 246.0, 552.0, 1396.0, 4870.0, 28061.0, 379187.0, 582439.0, 42034.0, 6460.0, 1766.0, 654.0, 300.0, 142.0, 67.0, 29.0, 26.0, 16.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.125, -212.296875, -205.46875, -198.640625, -191.8125, -184.984375, -178.15625, -171.328125, -164.5, -157.671875, -150.84375, -144.015625, -137.1875, -130.359375, -123.53125, -116.703125, -109.875, -103.046875, -96.21875, -89.390625, -82.5625, -75.734375, -68.90625, -62.078125, -55.25, -48.421875, -41.59375, -34.765625, -27.9375, -21.109375, -14.28125, -7.453125, -0.625, 6.203125, 13.03125, 19.859375, 26.6875, 33.515625, 40.34375, 47.171875, 54.0, 60.828125, 67.65625, 74.484375, 81.3125, 88.140625, 94.96875, 101.796875, 108.625, 115.453125, 122.28125, 129.109375, 135.9375, 142.765625, 149.59375, 156.421875, 163.25, 170.078125, 176.90625, 183.734375, 190.5625, 197.390625, 204.21875, 211.046875, 217.875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 7.0, 5.0, 8.0, 11.0, 16.0, 22.0, 27.0, 30.0, 32.0, 30.0, 44.0, 60.0, 61.0, 58.0, 56.0, 55.0, 62.0, 53.0, 39.0, 51.0, 48.0, 47.0, 33.0, 22.0, 26.0, 16.0, 12.0, 16.0, 13.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.05712890625, -33.7705078125, -32.48388671875, -31.197265625, -29.91064453125, -28.6240234375, -27.33740234375, -26.05078125, -24.76416015625, -23.4775390625, -22.19091796875, -20.904296875, -19.61767578125, -18.3310546875, -17.04443359375, -15.7578125, -14.47119140625, -13.1845703125, -11.89794921875, -10.611328125, -9.32470703125, -8.0380859375, -6.75146484375, -5.46484375, -4.17822265625, -2.8916015625, -1.60498046875, -0.318359375, 0.96826171875, 2.2548828125, 3.54150390625, 4.828125, 6.11474609375, 7.4013671875, 8.68798828125, 9.974609375, 11.26123046875, 12.5478515625, 13.83447265625, 15.12109375, 16.40771484375, 17.6943359375, 18.98095703125, 20.267578125, 21.55419921875, 22.8408203125, 24.12744140625, 25.4140625, 26.70068359375, 27.9873046875, 29.27392578125, 30.560546875, 31.84716796875, 33.1337890625, 34.42041015625, 35.70703125, 36.99365234375, 38.2802734375, 39.56689453125, 40.853515625, 42.14013671875, 43.4267578125, 44.71337890625, 46.0]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 9.0, 6.0, 8.0, 20.0, 21.0, 29.0, 56.0, 85.0, 124.0, 258.0, 430.0, 830.0, 2172.0, 8703.0, 154857.0, 849077.0, 25320.0, 3881.0, 1281.0, 569.0, 308.0, 162.0, 117.0, 78.0, 47.0, 27.0, 25.0, 10.0, 12.0, 13.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-275.25, -265.50390625, -255.7578125, -246.01171875, -236.265625, -226.51953125, -216.7734375, -207.02734375, -197.28125, -187.53515625, -177.7890625, -168.04296875, -158.296875, -148.55078125, -138.8046875, -129.05859375, -119.3125, -109.56640625, -99.8203125, -90.07421875, -80.328125, -70.58203125, -60.8359375, -51.08984375, -41.34375, -31.59765625, -21.8515625, -12.10546875, -2.359375, 7.38671875, 17.1328125, 26.87890625, 36.625, 46.37109375, 56.1171875, 65.86328125, 75.609375, 85.35546875, 95.1015625, 104.84765625, 114.59375, 124.33984375, 134.0859375, 143.83203125, 153.578125, 163.32421875, 173.0703125, 182.81640625, 192.5625, 202.30859375, 212.0546875, 221.80078125, 231.546875, 241.29296875, 251.0390625, 260.78515625, 270.53125, 280.27734375, 290.0234375, 299.76953125, 309.515625, 319.26171875, 329.0078125, 338.75390625, 348.5]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 9.0, 5.0, 5.0, 12.0, 16.0, 16.0, 20.0, 19.0, 28.0, 28.0, 31.0, 40.0, 34.0, 55.0, 41.0, 44.0, 57.0, 44.0, 55.0, 49.0, 51.0, 49.0, 34.0, 30.0, 44.0, 30.0, 27.0, 19.0, 22.0, 16.0, 11.0, 11.0, 6.0, 7.0, 10.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-152.5, -147.4765625, -142.453125, -137.4296875, -132.40625, -127.3828125, -122.359375, -117.3359375, -112.3125, -107.2890625, -102.265625, -97.2421875, -92.21875, -87.1953125, -82.171875, -77.1484375, -72.125, -67.1015625, -62.078125, -57.0546875, -52.03125, -47.0078125, -41.984375, -36.9609375, -31.9375, -26.9140625, -21.890625, -16.8671875, -11.84375, -6.8203125, -1.796875, 3.2265625, 8.25, 13.2734375, 18.296875, 23.3203125, 28.34375, 33.3671875, 38.390625, 43.4140625, 48.4375, 53.4609375, 58.484375, 63.5078125, 68.53125, 73.5546875, 78.578125, 83.6015625, 88.625, 93.6484375, 98.671875, 103.6953125, 108.71875, 113.7421875, 118.765625, 123.7890625, 128.8125, 133.8359375, 138.859375, 143.8828125, 148.90625, 153.9296875, 158.953125, 163.9765625, 169.0]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 11.0, 8.0, 10.0, 17.0, 17.0, 29.0, 41.0, 62.0, 103.0, 210.0, 480.0, 1731.0, 12817.0, 1000879.0, 28516.0, 2380.0, 642.0, 268.0, 103.0, 69.0, 42.0, 24.0, 24.0, 17.0, 12.0, 12.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.75, -220.05859375, -212.3671875, -204.67578125, -196.984375, -189.29296875, -181.6015625, -173.91015625, -166.21875, -158.52734375, -150.8359375, -143.14453125, -135.453125, -127.76171875, -120.0703125, -112.37890625, -104.6875, -96.99609375, -89.3046875, -81.61328125, -73.921875, -66.23046875, -58.5390625, -50.84765625, -43.15625, -35.46484375, -27.7734375, -20.08203125, -12.390625, -4.69921875, 2.9921875, 10.68359375, 18.375, 26.06640625, 33.7578125, 41.44921875, 49.140625, 56.83203125, 64.5234375, 72.21484375, 79.90625, 87.59765625, 95.2890625, 102.98046875, 110.671875, 118.36328125, 126.0546875, 133.74609375, 141.4375, 149.12890625, 156.8203125, 164.51171875, 172.203125, 179.89453125, 187.5859375, 195.27734375, 202.96875, 210.66015625, 218.3515625, 226.04296875, 233.734375, 241.42578125, 249.1171875, 256.80859375, 264.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 17.0, 30.0, 55.0, 128.0, 263.0, 262.0, 129.0, 60.0, 21.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0266876220703125, -0.025855302810668945, -0.02502298355102539, -0.024190664291381836, -0.02335834503173828, -0.022526025772094727, -0.021693706512451172, -0.020861387252807617, -0.020029067993164062, -0.019196748733520508, -0.018364429473876953, -0.0175321102142334, -0.016699790954589844, -0.01586747169494629, -0.015035152435302734, -0.01420283317565918, -0.013370513916015625, -0.01253819465637207, -0.011705875396728516, -0.010873556137084961, -0.010041236877441406, -0.009208917617797852, -0.008376598358154297, -0.007544279098510742, -0.0067119598388671875, -0.005879640579223633, -0.005047321319580078, -0.0042150020599365234, -0.0033826828002929688, -0.002550363540649414, -0.0017180442810058594, -0.0008857250213623047, -5.340576171875e-05, 0.0007789134979248047, 0.0016112327575683594, 0.002443552017211914, 0.0032758712768554688, 0.0041081905364990234, 0.004940509796142578, 0.005772829055786133, 0.0066051483154296875, 0.007437467575073242, 0.008269786834716797, 0.009102106094360352, 0.009934425354003906, 0.010766744613647461, 0.011599063873291016, 0.01243138313293457, 0.013263702392578125, 0.01409602165222168, 0.014928340911865234, 0.01576066017150879, 0.016592979431152344, 0.0174252986907959, 0.018257617950439453, 0.019089937210083008, 0.019922256469726562, 0.020754575729370117, 0.021586894989013672, 0.022419214248657227, 0.02325153350830078, 0.024083852767944336, 0.02491617202758789, 0.025748491287231445, 0.026580810546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 13.0, 9.0, 18.0, 37.0, 29.0, 66.0, 86.0, 221.0, 480.0, 1260.0, 4983.0, 47196.0, 961710.0, 26760.0, 3736.0, 1057.0, 406.0, 176.0, 109.0, 67.0, 39.0, 21.0, 17.0, 9.0, 11.0, 9.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-202.625, -196.736328125, -190.84765625, -184.958984375, -179.0703125, -173.181640625, -167.29296875, -161.404296875, -155.515625, -149.626953125, -143.73828125, -137.849609375, -131.9609375, -126.072265625, -120.18359375, -114.294921875, -108.40625, -102.517578125, -96.62890625, -90.740234375, -84.8515625, -78.962890625, -73.07421875, -67.185546875, -61.296875, -55.408203125, -49.51953125, -43.630859375, -37.7421875, -31.853515625, -25.96484375, -20.076171875, -14.1875, -8.298828125, -2.41015625, 3.478515625, 9.3671875, 15.255859375, 21.14453125, 27.033203125, 32.921875, 38.810546875, 44.69921875, 50.587890625, 56.4765625, 62.365234375, 68.25390625, 74.142578125, 80.03125, 85.919921875, 91.80859375, 97.697265625, 103.5859375, 109.474609375, 115.36328125, 121.251953125, 127.140625, 133.029296875, 138.91796875, 144.806640625, 150.6953125, 156.583984375, 162.47265625, 168.361328125, 174.25]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 4.0, 10.0, 8.0, 11.0, 8.0, 17.0, 23.0, 24.0, 49.0, 93.0, 134.0, 135.0, 133.0, 114.0, 78.0, 44.0, 21.0, 19.0, 14.0, 6.0, 6.0, 11.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-109.75, -106.50390625, -103.2578125, -100.01171875, -96.765625, -93.51953125, -90.2734375, -87.02734375, -83.78125, -80.53515625, -77.2890625, -74.04296875, -70.796875, -67.55078125, -64.3046875, -61.05859375, -57.8125, -54.56640625, -51.3203125, -48.07421875, -44.828125, -41.58203125, -38.3359375, -35.08984375, -31.84375, -28.59765625, -25.3515625, -22.10546875, -18.859375, -15.61328125, -12.3671875, -9.12109375, -5.875, -2.62890625, 0.6171875, 3.86328125, 7.109375, 10.35546875, 13.6015625, 16.84765625, 20.09375, 23.33984375, 26.5859375, 29.83203125, 33.078125, 36.32421875, 39.5703125, 42.81640625, 46.0625, 49.30859375, 52.5546875, 55.80078125, 59.046875, 62.29296875, 65.5390625, 68.78515625, 72.03125, 75.27734375, 78.5234375, 81.76953125, 85.015625, 88.26171875, 91.5078125, 94.75390625, 98.0]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 12.0, 39.0, 127.0, 343.0, 313.0, 119.0, 33.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1218.513916015625, -1142.3702392578125, -1066.2266845703125, -990.0830078125, -913.939453125, -837.7957763671875, -761.6521606445312, -685.508544921875, -609.3649291992188, -533.2213134765625, -457.07769775390625, -380.9340515136719, -304.7904357910156, -228.64682006835938, -152.503173828125, -76.35955810546875, -0.2159423828125, 75.92768096923828, 152.07130432128906, 228.21493530273438, 304.3585510253906, 380.5021667480469, 456.64581298828125, 532.7894287109375, 608.9330444335938, 685.07666015625, 761.2202758789062, 837.3638916015625, 913.507568359375, 989.651123046875, 1065.7947998046875, 1141.9384765625, 1218.08203125, 1294.2257080078125, 1370.3692626953125, 1446.512939453125, 1522.656494140625, 1598.8001708984375, 1674.94384765625, 1751.08740234375, 1827.23095703125, 1903.3746337890625, 1979.5181884765625, 2055.661865234375, 2131.805419921875, 2207.948974609375, 2284.0927734375, 2360.236328125, 2436.3798828125, 2512.5234375, 2588.667236328125, 2664.810791015625, 2740.954345703125, 2817.097900390625, 2893.24169921875, 2969.38525390625, 3045.529052734375, 3121.672607421875, 3197.81640625, 3273.9599609375, 3350.103515625, 3426.2470703125, 3502.390869140625, 3578.534423828125, 3654.677978515625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 7.0, 4.0, 8.0, 12.0, 12.0, 14.0, 14.0, 21.0, 36.0, 18.0, 35.0, 39.0, 35.0, 51.0, 54.0, 62.0, 62.0, 69.0, 46.0, 60.0, 37.0, 56.0, 40.0, 29.0, 33.0, 26.0, 18.0, 24.0, 16.0, 11.0, 16.0, 5.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-765.71240234375, -741.8490600585938, -717.9856567382812, -694.122314453125, -670.2589111328125, -646.3955688476562, -622.5322265625, -598.6688232421875, -574.805419921875, -550.9420776367188, -527.0786743164062, -503.21533203125, -479.3519287109375, -455.48858642578125, -431.6252136230469, -407.7618408203125, -383.89849853515625, -360.0351257324219, -336.1717529296875, -312.30841064453125, -288.44500732421875, -264.5816650390625, -240.71829223632812, -216.85491943359375, -192.99154663085938, -169.128173828125, -145.26480102539062, -121.40144348144531, -97.53807067871094, -73.67469787597656, -49.81134033203125, -25.947967529296875, -2.08465576171875, 21.77871322631836, 45.64208221435547, 69.50544738769531, 93.36882019042969, 117.23219299316406, 141.09555053710938, 164.95892333984375, 188.82229614257812, 212.6856689453125, 236.54904174804688, 260.41241455078125, 284.2757568359375, 308.13916015625, 332.00250244140625, 355.8658752441406, 379.729248046875, 403.5926208496094, 427.45599365234375, 451.3193359375, 475.1827392578125, 499.04608154296875, 522.909423828125, 546.7728271484375, 570.63623046875, 594.4995727539062, 618.3629760742188, 642.226318359375, 666.0897216796875, 689.9530639648438, 713.81640625, 737.6798095703125, 761.5431518554688]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 8.0, 10.0, 10.0, 14.0, 17.0, 35.0, 55.0, 58.0, 98.0, 162.0, 282.0, 483.0, 1002.0, 2408.0, 7244.0, 32457.0, 577502.0, 3475254.0, 76796.0, 13405.0, 3927.0, 1484.0, 696.0, 333.0, 194.0, 110.0, 58.0, 64.0, 32.0, 24.0, 18.0, 7.0, 12.0, 6.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.5, -92.3388671875, -89.177734375, -86.0166015625, -82.85546875, -79.6943359375, -76.533203125, -73.3720703125, -70.2109375, -67.0498046875, -63.888671875, -60.7275390625, -57.56640625, -54.4052734375, -51.244140625, -48.0830078125, -44.921875, -41.7607421875, -38.599609375, -35.4384765625, -32.27734375, -29.1162109375, -25.955078125, -22.7939453125, -19.6328125, -16.4716796875, -13.310546875, -10.1494140625, -6.98828125, -3.8271484375, -0.666015625, 2.4951171875, 5.65625, 8.8173828125, 11.978515625, 15.1396484375, 18.30078125, 21.4619140625, 24.623046875, 27.7841796875, 30.9453125, 34.1064453125, 37.267578125, 40.4287109375, 43.58984375, 46.7509765625, 49.912109375, 53.0732421875, 56.234375, 59.3955078125, 62.556640625, 65.7177734375, 68.87890625, 72.0400390625, 75.201171875, 78.3623046875, 81.5234375, 84.6845703125, 87.845703125, 91.0068359375, 94.16796875, 97.3291015625, 100.490234375, 103.6513671875, 106.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 4.0, 9.0, 13.0, 28.0, 31.0, 40.0, 60.0, 64.0, 71.0, 91.0, 84.0, 91.0, 62.0, 66.0, 59.0, 55.0, 38.0, 40.0, 24.0, 20.0, 19.0, 5.0, 9.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.125, -60.3525390625, -58.580078125, -56.8076171875, -55.03515625, -53.2626953125, -51.490234375, -49.7177734375, -47.9453125, -46.1728515625, -44.400390625, -42.6279296875, -40.85546875, -39.0830078125, -37.310546875, -35.5380859375, -33.765625, -31.9931640625, -30.220703125, -28.4482421875, -26.67578125, -24.9033203125, -23.130859375, -21.3583984375, -19.5859375, -17.8134765625, -16.041015625, -14.2685546875, -12.49609375, -10.7236328125, -8.951171875, -7.1787109375, -5.40625, -3.6337890625, -1.861328125, -0.0888671875, 1.68359375, 3.4560546875, 5.228515625, 7.0009765625, 8.7734375, 10.5458984375, 12.318359375, 14.0908203125, 15.86328125, 17.6357421875, 19.408203125, 21.1806640625, 22.953125, 24.7255859375, 26.498046875, 28.2705078125, 30.04296875, 31.8154296875, 33.587890625, 35.3603515625, 37.1328125, 38.9052734375, 40.677734375, 42.4501953125, 44.22265625, 45.9951171875, 47.767578125, 49.5400390625, 51.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 15.0, 17.0, 28.0, 48.0, 96.0, 138.0, 297.0, 924.0, 3580.0, 20039.0, 304146.0, 3771930.0, 79422.0, 10385.0, 2173.0, 599.0, 202.0, 92.0, 55.0, 29.0, 30.0, 15.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.1875, -110.6337890625, -106.080078125, -101.5263671875, -96.97265625, -92.4189453125, -87.865234375, -83.3115234375, -78.7578125, -74.2041015625, -69.650390625, -65.0966796875, -60.54296875, -55.9892578125, -51.435546875, -46.8818359375, -42.328125, -37.7744140625, -33.220703125, -28.6669921875, -24.11328125, -19.5595703125, -15.005859375, -10.4521484375, -5.8984375, -1.3447265625, 3.208984375, 7.7626953125, 12.31640625, 16.8701171875, 21.423828125, 25.9775390625, 30.53125, 35.0849609375, 39.638671875, 44.1923828125, 48.74609375, 53.2998046875, 57.853515625, 62.4072265625, 66.9609375, 71.5146484375, 76.068359375, 80.6220703125, 85.17578125, 89.7294921875, 94.283203125, 98.8369140625, 103.390625, 107.9443359375, 112.498046875, 117.0517578125, 121.60546875, 126.1591796875, 130.712890625, 135.2666015625, 139.8203125, 144.3740234375, 148.927734375, 153.4814453125, 158.03515625, 162.5888671875, 167.142578125, 171.6962890625, 176.25]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 2.0, 9.0, 12.0, 15.0, 39.0, 57.0, 121.0, 344.0, 1092.0, 1504.0, 491.0, 154.0, 85.0, 52.0, 31.0, 23.0, 15.0, 9.0, 4.0, 5.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-175.25, -171.0908203125, -166.931640625, -162.7724609375, -158.61328125, -154.4541015625, -150.294921875, -146.1357421875, -141.9765625, -137.8173828125, -133.658203125, -129.4990234375, -125.33984375, -121.1806640625, -117.021484375, -112.8623046875, -108.703125, -104.5439453125, -100.384765625, -96.2255859375, -92.06640625, -87.9072265625, -83.748046875, -79.5888671875, -75.4296875, -71.2705078125, -67.111328125, -62.9521484375, -58.79296875, -54.6337890625, -50.474609375, -46.3154296875, -42.15625, -37.9970703125, -33.837890625, -29.6787109375, -25.51953125, -21.3603515625, -17.201171875, -13.0419921875, -8.8828125, -4.7236328125, -0.564453125, 3.5947265625, 7.75390625, 11.9130859375, 16.072265625, 20.2314453125, 24.390625, 28.5498046875, 32.708984375, 36.8681640625, 41.02734375, 45.1865234375, 49.345703125, 53.5048828125, 57.6640625, 61.8232421875, 65.982421875, 70.1416015625, 74.30078125, 78.4599609375, 82.619140625, 86.7783203125, 90.9375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 9.0, 17.0, 29.0, 56.0, 107.0, 163.0, 196.0, 155.0, 124.0, 51.0, 25.0, 21.0, 5.0, 10.0, 5.0, 4.0, 0.0, 0.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-666.39501953125, -644.3047485351562, -622.2144165039062, -600.1241455078125, -578.0338134765625, -555.9435424804688, -533.853271484375, -511.762939453125, -489.6726379394531, -467.58233642578125, -445.4920349121094, -423.4017333984375, -401.31146240234375, -379.22113037109375, -357.130859375, -335.0405578613281, -312.95025634765625, -290.8599548339844, -268.7696533203125, -246.6793670654297, -224.5890655517578, -202.49876403808594, -180.40847778320312, -158.31817626953125, -136.22787475585938, -114.1375732421875, -92.04727935791016, -69.95698547363281, -47.86668395996094, -25.776382446289062, -3.68609619140625, 18.404205322265625, 40.4945068359375, 62.58480453491211, 84.67510223388672, 106.76539611816406, 128.85569763183594, 150.9459991455078, 173.03628540039062, 195.1265869140625, 217.21688842773438, 239.30718994140625, 261.3974914550781, 283.48779296875, 305.57806396484375, 327.66839599609375, 349.7586669921875, 371.8489685058594, 393.93927001953125, 416.0295715332031, 438.119873046875, 460.21014404296875, 482.30047607421875, 504.3907470703125, 526.4810791015625, 548.5713500976562, 570.66162109375, 592.7518920898438, 614.8422241210938, 636.9324951171875, 659.0228271484375, 681.1130981445312, 703.203369140625, 725.293701171875, 747.384033203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 10.0, 7.0, 15.0, 17.0, 12.0, 15.0, 30.0, 30.0, 35.0, 37.0, 35.0, 41.0, 49.0, 43.0, 40.0, 46.0, 50.0, 43.0, 52.0, 45.0, 41.0, 37.0, 47.0, 41.0, 32.0, 28.0, 20.0, 13.0, 18.0, 19.0, 9.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-409.6883850097656, -398.821044921875, -387.9537353515625, -377.0863952636719, -366.21905517578125, -355.35174560546875, -344.4844055175781, -333.6170654296875, -322.749755859375, -311.8824157714844, -301.0151062011719, -290.14776611328125, -279.2804260253906, -268.4130859375, -257.5457763671875, -246.67843627929688, -235.81109619140625, -224.9437713623047, -214.07643127441406, -203.2091064453125, -192.34176635742188, -181.4744415283203, -170.60711669921875, -159.73977661132812, -148.87245178222656, -138.005126953125, -127.13778686523438, -116.27046203613281, -105.40312957763672, -94.53579711914062, -83.66847229003906, -72.80113983154297, -61.93377685546875, -51.066444396972656, -40.19911575317383, -29.331787109375, -18.464454650878906, -7.5971221923828125, 3.27020263671875, 14.137535095214844, 25.004867553710938, 35.87220001220703, 46.73952865600586, 57.60685729980469, 68.47418975830078, 79.34152221679688, 90.20884704589844, 101.07617950439453, 111.94351196289062, 122.81084442138672, 133.6781768798828, 144.54550170898438, 155.412841796875, 166.28016662597656, 177.14749145507812, 188.01483154296875, 198.8821563720703, 209.74948120117188, 220.6168212890625, 231.48414611816406, 242.35147094726562, 253.21881103515625, 264.08612060546875, 274.9534606933594, 285.82080078125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 6.0, 9.0, 3.0, 12.0, 11.0, 13.0, 23.0, 29.0, 25.0, 39.0, 70.0, 78.0, 130.0, 196.0, 316.0, 512.0, 925.0, 1889.0, 3750.0, 8413.0, 20089.0, 52341.0, 148511.0, 373817.0, 278684.0, 97312.0, 35154.0, 14009.0, 6062.0, 2714.0, 1389.0, 698.0, 402.0, 296.0, 181.0, 124.0, 100.0, 50.0, 47.0, 40.0, 22.0, 15.0, 14.0, 11.0, 8.0, 4.0, 4.0, 5.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.75, -69.5625, -67.375, -65.1875, -63.0, -60.8125, -58.625, -56.4375, -54.25, -52.0625, -49.875, -47.6875, -45.5, -43.3125, -41.125, -38.9375, -36.75, -34.5625, -32.375, -30.1875, -28.0, -25.8125, -23.625, -21.4375, -19.25, -17.0625, -14.875, -12.6875, -10.5, -8.3125, -6.125, -3.9375, -1.75, 0.4375, 2.625, 4.8125, 7.0, 9.1875, 11.375, 13.5625, 15.75, 17.9375, 20.125, 22.3125, 24.5, 26.6875, 28.875, 31.0625, 33.25, 35.4375, 37.625, 39.8125, 42.0, 44.1875, 46.375, 48.5625, 50.75, 52.9375, 55.125, 57.3125, 59.5, 61.6875, 63.875, 66.0625, 68.25]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 7.0, 17.0, 15.0, 39.0, 29.0, 48.0, 60.0, 63.0, 74.0, 75.0, 75.0, 65.0, 83.0, 73.0, 45.0, 53.0, 36.0, 26.0, 22.0, 27.0, 21.0, 15.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.28125, -52.63134765625, -50.9814453125, -49.33154296875, -47.681640625, -46.03173828125, -44.3818359375, -42.73193359375, -41.08203125, -39.43212890625, -37.7822265625, -36.13232421875, -34.482421875, -32.83251953125, -31.1826171875, -29.53271484375, -27.8828125, -26.23291015625, -24.5830078125, -22.93310546875, -21.283203125, -19.63330078125, -17.9833984375, -16.33349609375, -14.68359375, -13.03369140625, -11.3837890625, -9.73388671875, -8.083984375, -6.43408203125, -4.7841796875, -3.13427734375, -1.484375, 0.16552734375, 1.8154296875, 3.46533203125, 5.115234375, 6.76513671875, 8.4150390625, 10.06494140625, 11.71484375, 13.36474609375, 15.0146484375, 16.66455078125, 18.314453125, 19.96435546875, 21.6142578125, 23.26416015625, 24.9140625, 26.56396484375, 28.2138671875, 29.86376953125, 31.513671875, 33.16357421875, 34.8134765625, 36.46337890625, 38.11328125, 39.76318359375, 41.4130859375, 43.06298828125, 44.712890625, 46.36279296875, 48.0126953125, 49.66259765625, 51.3125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 15.0, 13.0, 21.0, 34.0, 55.0, 86.0, 129.0, 239.0, 443.0, 899.0, 2372.0, 8759.0, 67491.0, 799276.0, 148815.0, 14216.0, 3275.0, 1171.0, 518.0, 272.0, 154.0, 94.0, 54.0, 38.0, 32.0, 21.0, 6.0, 9.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-224.375, -218.080078125, -211.78515625, -205.490234375, -199.1953125, -192.900390625, -186.60546875, -180.310546875, -174.015625, -167.720703125, -161.42578125, -155.130859375, -148.8359375, -142.541015625, -136.24609375, -129.951171875, -123.65625, -117.361328125, -111.06640625, -104.771484375, -98.4765625, -92.181640625, -85.88671875, -79.591796875, -73.296875, -67.001953125, -60.70703125, -54.412109375, -48.1171875, -41.822265625, -35.52734375, -29.232421875, -22.9375, -16.642578125, -10.34765625, -4.052734375, 2.2421875, 8.537109375, 14.83203125, 21.126953125, 27.421875, 33.716796875, 40.01171875, 46.306640625, 52.6015625, 58.896484375, 65.19140625, 71.486328125, 77.78125, 84.076171875, 90.37109375, 96.666015625, 102.9609375, 109.255859375, 115.55078125, 121.845703125, 128.140625, 134.435546875, 140.73046875, 147.025390625, 153.3203125, 159.615234375, 165.91015625, 172.205078125, 178.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 4.0, 7.0, 9.0, 14.0, 24.0, 18.0, 21.0, 38.0, 40.0, 39.0, 40.0, 65.0, 55.0, 60.0, 64.0, 60.0, 59.0, 47.0, 43.0, 64.0, 42.0, 46.0, 30.0, 22.0, 20.0, 18.0, 10.0, 8.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.125, -185.3203125, -179.515625, -173.7109375, -167.90625, -162.1015625, -156.296875, -150.4921875, -144.6875, -138.8828125, -133.078125, -127.2734375, -121.46875, -115.6640625, -109.859375, -104.0546875, -98.25, -92.4453125, -86.640625, -80.8359375, -75.03125, -69.2265625, -63.421875, -57.6171875, -51.8125, -46.0078125, -40.203125, -34.3984375, -28.59375, -22.7890625, -16.984375, -11.1796875, -5.375, 0.4296875, 6.234375, 12.0390625, 17.84375, 23.6484375, 29.453125, 35.2578125, 41.0625, 46.8671875, 52.671875, 58.4765625, 64.28125, 70.0859375, 75.890625, 81.6953125, 87.5, 93.3046875, 99.109375, 104.9140625, 110.71875, 116.5234375, 122.328125, 128.1328125, 133.9375, 139.7421875, 145.546875, 151.3515625, 157.15625, 162.9609375, 168.765625, 174.5703125, 180.375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 9.0, 15.0, 29.0, 39.0, 101.0, 202.0, 478.0, 1563.0, 8282.0, 174766.0, 831401.0, 27173.0, 3100.0, 840.0, 277.0, 137.0, 61.0, 32.0, 18.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.125, -72.26171875, -69.3984375, -66.53515625, -63.671875, -60.80859375, -57.9453125, -55.08203125, -52.21875, -49.35546875, -46.4921875, -43.62890625, -40.765625, -37.90234375, -35.0390625, -32.17578125, -29.3125, -26.44921875, -23.5859375, -20.72265625, -17.859375, -14.99609375, -12.1328125, -9.26953125, -6.40625, -3.54296875, -0.6796875, 2.18359375, 5.046875, 7.91015625, 10.7734375, 13.63671875, 16.5, 19.36328125, 22.2265625, 25.08984375, 27.953125, 30.81640625, 33.6796875, 36.54296875, 39.40625, 42.26953125, 45.1328125, 47.99609375, 50.859375, 53.72265625, 56.5859375, 59.44921875, 62.3125, 65.17578125, 68.0390625, 70.90234375, 73.765625, 76.62890625, 79.4921875, 82.35546875, 85.21875, 88.08203125, 90.9453125, 93.80859375, 96.671875, 99.53515625, 102.3984375, 105.26171875, 108.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 9.0, 14.0, 20.0, 10.0, 26.0, 28.0, 33.0, 64.0, 75.0, 106.0, 108.0, 85.0, 86.0, 61.0, 53.0, 50.0, 30.0, 25.0, 25.0, 12.0, 11.0, 11.0, 5.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008575439453125, -0.00830686092376709, -0.00803828239440918, -0.0077697038650512695, -0.007501125335693359, -0.007232546806335449, -0.006963968276977539, -0.006695389747619629, -0.006426811218261719, -0.006158232688903809, -0.0058896541595458984, -0.005621075630187988, -0.005352497100830078, -0.005083918571472168, -0.004815340042114258, -0.004546761512756348, -0.0042781829833984375, -0.004009604454040527, -0.003741025924682617, -0.003472447395324707, -0.003203868865966797, -0.0029352903366088867, -0.0026667118072509766, -0.0023981332778930664, -0.0021295547485351562, -0.001860976219177246, -0.001592397689819336, -0.0013238191604614258, -0.0010552406311035156, -0.0007866621017456055, -0.0005180835723876953, -0.00024950504302978516, 1.9073486328125e-05, 0.00028765201568603516, 0.0005562305450439453, 0.0008248090744018555, 0.0010933876037597656, 0.0013619661331176758, 0.001630544662475586, 0.001899123191833496, 0.0021677017211914062, 0.0024362802505493164, 0.0027048587799072266, 0.0029734373092651367, 0.003242015838623047, 0.003510594367980957, 0.003779172897338867, 0.004047751426696777, 0.0043163299560546875, 0.004584908485412598, 0.004853487014770508, 0.005122065544128418, 0.005390644073486328, 0.005659222602844238, 0.0059278011322021484, 0.006196379661560059, 0.006464958190917969, 0.006733536720275879, 0.007002115249633789, 0.007270693778991699, 0.007539272308349609, 0.0078078508377075195, 0.00807642936706543, 0.00834500789642334, 0.00861358642578125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 12.0, 12.0, 15.0, 19.0, 31.0, 38.0, 60.0, 97.0, 171.0, 270.0, 512.0, 852.0, 1955.0, 4532.0, 14900.0, 101154.0, 783036.0, 116047.0, 15813.0, 4863.0, 1918.0, 944.0, 506.0, 312.0, 158.0, 90.0, 73.0, 41.0, 40.0, 23.0, 18.0, 7.0, 6.0, 7.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.125, -59.18603515625, -57.2470703125, -55.30810546875, -53.369140625, -51.43017578125, -49.4912109375, -47.55224609375, -45.61328125, -43.67431640625, -41.7353515625, -39.79638671875, -37.857421875, -35.91845703125, -33.9794921875, -32.04052734375, -30.1015625, -28.16259765625, -26.2236328125, -24.28466796875, -22.345703125, -20.40673828125, -18.4677734375, -16.52880859375, -14.58984375, -12.65087890625, -10.7119140625, -8.77294921875, -6.833984375, -4.89501953125, -2.9560546875, -1.01708984375, 0.921875, 2.86083984375, 4.7998046875, 6.73876953125, 8.677734375, 10.61669921875, 12.5556640625, 14.49462890625, 16.43359375, 18.37255859375, 20.3115234375, 22.25048828125, 24.189453125, 26.12841796875, 28.0673828125, 30.00634765625, 31.9453125, 33.88427734375, 35.8232421875, 37.76220703125, 39.701171875, 41.64013671875, 43.5791015625, 45.51806640625, 47.45703125, 49.39599609375, 51.3349609375, 53.27392578125, 55.212890625, 57.15185546875, 59.0908203125, 61.02978515625, 62.96875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 13.0, 18.0, 23.0, 34.0, 39.0, 65.0, 79.0, 84.0, 102.0, 126.0, 102.0, 100.0, 62.0, 36.0, 31.0, 24.0, 16.0, 7.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.125, -54.181640625, -52.23828125, -50.294921875, -48.3515625, -46.408203125, -44.46484375, -42.521484375, -40.578125, -38.634765625, -36.69140625, -34.748046875, -32.8046875, -30.861328125, -28.91796875, -26.974609375, -25.03125, -23.087890625, -21.14453125, -19.201171875, -17.2578125, -15.314453125, -13.37109375, -11.427734375, -9.484375, -7.541015625, -5.59765625, -3.654296875, -1.7109375, 0.232421875, 2.17578125, 4.119140625, 6.0625, 8.005859375, 9.94921875, 11.892578125, 13.8359375, 15.779296875, 17.72265625, 19.666015625, 21.609375, 23.552734375, 25.49609375, 27.439453125, 29.3828125, 31.326171875, 33.26953125, 35.212890625, 37.15625, 39.099609375, 41.04296875, 42.986328125, 44.9296875, 46.873046875, 48.81640625, 50.759765625, 52.703125, 54.646484375, 56.58984375, 58.533203125, 60.4765625, 62.419921875, 64.36328125, 66.306640625, 68.25]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 8.0, 5.0, 26.0, 60.0, 127.0, 204.0, 251.0, 165.0, 68.0, 34.0, 21.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1095.5286865234375, -1055.3272705078125, -1015.1258544921875, -974.9244384765625, -934.7230224609375, -894.5216064453125, -854.3201904296875, -814.1187744140625, -773.9173583984375, -733.7159423828125, -693.5145263671875, -653.3131103515625, -613.1116943359375, -572.9102783203125, -532.7088623046875, -492.5074768066406, -452.30609130859375, -412.10467529296875, -371.90325927734375, -331.70184326171875, -291.50042724609375, -251.2990264892578, -211.09762573242188, -170.89620971679688, -130.69479370117188, -90.49337768554688, -50.291969299316406, -10.090560913085938, 30.110855102539062, 70.31227111816406, 110.513671875, 150.715087890625, 190.91650390625, 231.117919921875, 271.3193359375, 311.520751953125, 351.72216796875, 391.923583984375, 432.1249694824219, 472.3263854980469, 512.52783203125, 552.729248046875, 592.9306640625, 633.132080078125, 673.33349609375, 713.534912109375, 753.736328125, 793.937744140625, 834.1390991210938, 874.3405151367188, 914.5419311523438, 954.7433471679688, 994.9447631835938, 1035.1461181640625, 1075.3475341796875, 1115.5489501953125, 1155.7503662109375, 1195.9517822265625, 1236.1531982421875, 1276.3546142578125, 1316.5560302734375, 1356.7574462890625, 1396.9588623046875, 1437.1602783203125, 1477.3616943359375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 2.0, 15.0, 14.0, 14.0, 22.0, 22.0, 25.0, 26.0, 46.0, 17.0, 29.0, 49.0, 42.0, 43.0, 58.0, 67.0, 78.0, 44.0, 55.0, 40.0, 42.0, 37.0, 34.0, 25.0, 30.0, 20.0, 18.0, 12.0, 17.0, 5.0, 9.0, 13.0, 3.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-673.5874633789062, -652.2804565429688, -630.9734497070312, -609.66650390625, -588.3594970703125, -567.052490234375, -545.7454833984375, -524.4384765625, -503.1315002441406, -481.8244934082031, -460.51751708984375, -439.21051025390625, -417.90350341796875, -396.5965270996094, -375.2895202636719, -353.9825439453125, -332.675537109375, -311.3685302734375, -290.0615539550781, -268.7545471191406, -247.4475555419922, -226.14056396484375, -204.83355712890625, -183.5265655517578, -162.21957397460938, -140.91258239746094, -119.60558319091797, -98.298583984375, -76.99159240722656, -55.684600830078125, -34.377601623535156, -13.070602416992188, 8.23638916015625, 29.543384552001953, 50.850379943847656, 72.15737915039062, 93.46437072753906, 114.7713623046875, 136.078369140625, 157.38536071777344, 178.69235229492188, 199.9993438720703, 221.30633544921875, 242.61334228515625, 263.92034912109375, 285.2273254394531, 306.5343322753906, 327.84130859375, 349.1483154296875, 370.455322265625, 391.7622985839844, 413.0693054199219, 434.37628173828125, 455.68328857421875, 476.99029541015625, 498.29730224609375, 519.604248046875, 540.9112548828125, 562.21826171875, 583.5252075195312, 604.8322143554688, 626.1392211914062, 647.4462280273438, 668.7532348632812, 690.0602416992188]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 19.0, 11.0, 25.0, 28.0, 40.0, 47.0, 77.0, 109.0, 213.0, 392.0, 842.0, 2333.0, 9306.0, 61095.0, 1785306.0, 2249464.0, 69632.0, 10738.0, 2668.0, 888.0, 372.0, 197.0, 134.0, 88.0, 57.0, 33.0, 35.0, 34.0, 22.0, 17.0, 16.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.0625, -95.763671875, -92.46484375, -89.166015625, -85.8671875, -82.568359375, -79.26953125, -75.970703125, -72.671875, -69.373046875, -66.07421875, -62.775390625, -59.4765625, -56.177734375, -52.87890625, -49.580078125, -46.28125, -42.982421875, -39.68359375, -36.384765625, -33.0859375, -29.787109375, -26.48828125, -23.189453125, -19.890625, -16.591796875, -13.29296875, -9.994140625, -6.6953125, -3.396484375, -0.09765625, 3.201171875, 6.5, 9.798828125, 13.09765625, 16.396484375, 19.6953125, 22.994140625, 26.29296875, 29.591796875, 32.890625, 36.189453125, 39.48828125, 42.787109375, 46.0859375, 49.384765625, 52.68359375, 55.982421875, 59.28125, 62.580078125, 65.87890625, 69.177734375, 72.4765625, 75.775390625, 79.07421875, 82.373046875, 85.671875, 88.970703125, 92.26953125, 95.568359375, 98.8671875, 102.166015625, 105.46484375, 108.763671875, 112.0625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 11.0, 16.0, 23.0, 31.0, 40.0, 57.0, 60.0, 77.0, 103.0, 100.0, 101.0, 83.0, 62.0, 60.0, 45.0, 37.0, 25.0, 23.0, 15.0, 14.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-78.6875, -76.8515625, -75.015625, -73.1796875, -71.34375, -69.5078125, -67.671875, -65.8359375, -64.0, -62.1640625, -60.328125, -58.4921875, -56.65625, -54.8203125, -52.984375, -51.1484375, -49.3125, -47.4765625, -45.640625, -43.8046875, -41.96875, -40.1328125, -38.296875, -36.4609375, -34.625, -32.7890625, -30.953125, -29.1171875, -27.28125, -25.4453125, -23.609375, -21.7734375, -19.9375, -18.1015625, -16.265625, -14.4296875, -12.59375, -10.7578125, -8.921875, -7.0859375, -5.25, -3.4140625, -1.578125, 0.2578125, 2.09375, 3.9296875, 5.765625, 7.6015625, 9.4375, 11.2734375, 13.109375, 14.9453125, 16.78125, 18.6171875, 20.453125, 22.2890625, 24.125, 25.9609375, 27.796875, 29.6328125, 31.46875, 33.3046875, 35.140625, 36.9765625, 38.8125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 14.0, 20.0, 37.0, 57.0, 102.0, 172.0, 336.0, 753.0, 1925.0, 6151.0, 26757.0, 200115.0, 3445967.0, 455405.0, 43443.0, 8677.0, 2524.0, 936.0, 394.0, 184.0, 102.0, 77.0, 37.0, 23.0, 17.0, 18.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.375, -82.287109375, -79.19921875, -76.111328125, -73.0234375, -69.935546875, -66.84765625, -63.759765625, -60.671875, -57.583984375, -54.49609375, -51.408203125, -48.3203125, -45.232421875, -42.14453125, -39.056640625, -35.96875, -32.880859375, -29.79296875, -26.705078125, -23.6171875, -20.529296875, -17.44140625, -14.353515625, -11.265625, -8.177734375, -5.08984375, -2.001953125, 1.0859375, 4.173828125, 7.26171875, 10.349609375, 13.4375, 16.525390625, 19.61328125, 22.701171875, 25.7890625, 28.876953125, 31.96484375, 35.052734375, 38.140625, 41.228515625, 44.31640625, 47.404296875, 50.4921875, 53.580078125, 56.66796875, 59.755859375, 62.84375, 65.931640625, 69.01953125, 72.107421875, 75.1953125, 78.283203125, 81.37109375, 84.458984375, 87.546875, 90.634765625, 93.72265625, 96.810546875, 99.8984375, 102.986328125, 106.07421875, 109.162109375, 112.25]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 8.0, 10.0, 12.0, 16.0, 21.0, 25.0, 41.0, 55.0, 65.0, 100.0, 183.0, 267.0, 516.0, 768.0, 788.0, 497.0, 278.0, 124.0, 77.0, 63.0, 40.0, 32.0, 24.0, 13.0, 7.0, 12.0, 7.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.75, -94.8671875, -91.984375, -89.1015625, -86.21875, -83.3359375, -80.453125, -77.5703125, -74.6875, -71.8046875, -68.921875, -66.0390625, -63.15625, -60.2734375, -57.390625, -54.5078125, -51.625, -48.7421875, -45.859375, -42.9765625, -40.09375, -37.2109375, -34.328125, -31.4453125, -28.5625, -25.6796875, -22.796875, -19.9140625, -17.03125, -14.1484375, -11.265625, -8.3828125, -5.5, -2.6171875, 0.265625, 3.1484375, 6.03125, 8.9140625, 11.796875, 14.6796875, 17.5625, 20.4453125, 23.328125, 26.2109375, 29.09375, 31.9765625, 34.859375, 37.7421875, 40.625, 43.5078125, 46.390625, 49.2734375, 52.15625, 55.0390625, 57.921875, 60.8046875, 63.6875, 66.5703125, 69.453125, 72.3359375, 75.21875, 78.1015625, 80.984375, 83.8671875, 86.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 7.0, 8.0, 5.0, 22.0, 88.0, 265.0, 350.0, 180.0, 50.0, 14.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2868.54833984375, -2815.765869140625, -2762.9833984375, -2710.20068359375, -2657.418212890625, -2604.6357421875, -2551.853271484375, -2499.07080078125, -2446.2880859375, -2393.505615234375, -2340.72314453125, -2287.9404296875, -2235.157958984375, -2182.37548828125, -2129.593017578125, -2076.810546875, -2024.0279541015625, -1971.2454833984375, -1918.462890625, -1865.680419921875, -1812.8978271484375, -1760.1153564453125, -1707.332763671875, -1654.55029296875, -1601.767822265625, -1548.9853515625, -1496.2027587890625, -1443.4202880859375, -1390.6376953125, -1337.855224609375, -1285.07275390625, -1232.2901611328125, -1179.507568359375, -1126.72509765625, -1073.9425048828125, -1021.1600341796875, -968.37744140625, -915.594970703125, -862.8124389648438, -810.0299072265625, -757.247314453125, -704.4647827148438, -651.6822509765625, -598.8997802734375, -546.1171875, -493.3346862792969, -440.55218505859375, -387.7696533203125, -334.98712158203125, -282.20458984375, -229.4220733642578, -176.63955688476562, -123.85702514648438, -71.07449340820312, -18.2919921875, 34.49053955078125, 87.2730712890625, 140.05560302734375, 192.83811950683594, 245.62063598632812, 298.4031677246094, 351.1856994628906, 403.96820068359375, 456.750732421875, 509.53326416015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 4.0, 7.0, 15.0, 21.0, 15.0, 16.0, 27.0, 25.0, 26.0, 37.0, 36.0, 43.0, 55.0, 41.0, 52.0, 54.0, 55.0, 45.0, 58.0, 45.0, 41.0, 45.0, 35.0, 27.0, 16.0, 26.0, 20.0, 18.0, 12.0, 10.0, 8.0, 10.0, 10.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-407.34918212890625, -394.2499084472656, -381.150634765625, -368.0513610839844, -354.95208740234375, -341.852783203125, -328.7535095214844, -315.65423583984375, -302.5549621582031, -289.4556884765625, -276.3564147949219, -263.25714111328125, -250.15785217285156, -237.05857849121094, -223.95928955078125, -210.86001586914062, -197.7607421875, -184.66146850585938, -171.56219482421875, -158.46290588378906, -145.36363220214844, -132.2643585205078, -119.16507720947266, -106.0657958984375, -92.96652221679688, -79.86724853515625, -66.7679672241211, -53.6686897277832, -40.56941223144531, -27.470138549804688, -14.370857238769531, -1.271575927734375, 11.82769775390625, 24.92697525024414, 38.02625274658203, 51.12553024291992, 64.22480773925781, 77.32408142089844, 90.4233627319336, 103.52264404296875, 116.62191772460938, 129.72119140625, 142.82046508789062, 155.9197540283203, 169.01902770996094, 182.11830139160156, 195.21759033203125, 208.31686401367188, 221.4161376953125, 234.51541137695312, 247.61468505859375, 260.7139587402344, 273.813232421875, 286.91253662109375, 300.0118103027344, 313.111083984375, 326.2103576660156, 339.30963134765625, 352.4089050292969, 365.5081787109375, 378.60748291015625, 391.70672607421875, 404.8060302734375, 417.9053039550781, 431.00457763671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 7.0, 6.0, 13.0, 21.0, 26.0, 41.0, 43.0, 67.0, 114.0, 206.0, 280.0, 563.0, 1088.0, 2389.0, 7048.0, 25335.0, 98292.0, 372347.0, 393738.0, 107093.0, 27172.0, 7500.0, 2647.0, 1016.0, 607.0, 313.0, 191.0, 106.0, 98.0, 53.0, 34.0, 31.0, 20.0, 10.0, 8.0, 11.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.3125, -91.45703125, -88.6015625, -85.74609375, -82.890625, -80.03515625, -77.1796875, -74.32421875, -71.46875, -68.61328125, -65.7578125, -62.90234375, -60.046875, -57.19140625, -54.3359375, -51.48046875, -48.625, -45.76953125, -42.9140625, -40.05859375, -37.203125, -34.34765625, -31.4921875, -28.63671875, -25.78125, -22.92578125, -20.0703125, -17.21484375, -14.359375, -11.50390625, -8.6484375, -5.79296875, -2.9375, -0.08203125, 2.7734375, 5.62890625, 8.484375, 11.33984375, 14.1953125, 17.05078125, 19.90625, 22.76171875, 25.6171875, 28.47265625, 31.328125, 34.18359375, 37.0390625, 39.89453125, 42.75, 45.60546875, 48.4609375, 51.31640625, 54.171875, 57.02734375, 59.8828125, 62.73828125, 65.59375, 68.44921875, 71.3046875, 74.16015625, 77.015625, 79.87109375, 82.7265625, 85.58203125, 88.4375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 10.0, 14.0, 17.0, 30.0, 37.0, 43.0, 52.0, 69.0, 83.0, 92.0, 103.0, 96.0, 79.0, 66.0, 61.0, 48.0, 33.0, 21.0, 18.0, 15.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-78.25, -76.4560546875, -74.662109375, -72.8681640625, -71.07421875, -69.2802734375, -67.486328125, -65.6923828125, -63.8984375, -62.1044921875, -60.310546875, -58.5166015625, -56.72265625, -54.9287109375, -53.134765625, -51.3408203125, -49.546875, -47.7529296875, -45.958984375, -44.1650390625, -42.37109375, -40.5771484375, -38.783203125, -36.9892578125, -35.1953125, -33.4013671875, -31.607421875, -29.8134765625, -28.01953125, -26.2255859375, -24.431640625, -22.6376953125, -20.84375, -19.0498046875, -17.255859375, -15.4619140625, -13.66796875, -11.8740234375, -10.080078125, -8.2861328125, -6.4921875, -4.6982421875, -2.904296875, -1.1103515625, 0.68359375, 2.4775390625, 4.271484375, 6.0654296875, 7.859375, 9.6533203125, 11.447265625, 13.2412109375, 15.03515625, 16.8291015625, 18.623046875, 20.4169921875, 22.2109375, 24.0048828125, 25.798828125, 27.5927734375, 29.38671875, 31.1806640625, 32.974609375, 34.7685546875, 36.5625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 4.0, 11.0, 6.0, 16.0, 23.0, 37.0, 41.0, 71.0, 123.0, 169.0, 262.0, 448.0, 695.0, 1273.0, 2694.0, 8189.0, 55712.0, 741081.0, 210282.0, 18602.0, 4527.0, 1806.0, 932.0, 566.0, 361.0, 198.0, 135.0, 85.0, 66.0, 32.0, 38.0, 11.0, 14.0, 8.0, 12.0, 4.0, 10.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-146.0, -140.921875, -135.84375, -130.765625, -125.6875, -120.609375, -115.53125, -110.453125, -105.375, -100.296875, -95.21875, -90.140625, -85.0625, -79.984375, -74.90625, -69.828125, -64.75, -59.671875, -54.59375, -49.515625, -44.4375, -39.359375, -34.28125, -29.203125, -24.125, -19.046875, -13.96875, -8.890625, -3.8125, 1.265625, 6.34375, 11.421875, 16.5, 21.578125, 26.65625, 31.734375, 36.8125, 41.890625, 46.96875, 52.046875, 57.125, 62.203125, 67.28125, 72.359375, 77.4375, 82.515625, 87.59375, 92.671875, 97.75, 102.828125, 107.90625, 112.984375, 118.0625, 123.140625, 128.21875, 133.296875, 138.375, 143.453125, 148.53125, 153.609375, 158.6875, 163.765625, 168.84375, 173.921875, 179.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 10.0, 4.0, 9.0, 13.0, 8.0, 16.0, 23.0, 30.0, 33.0, 34.0, 43.0, 56.0, 67.0, 54.0, 60.0, 63.0, 54.0, 57.0, 51.0, 55.0, 48.0, 33.0, 31.0, 27.0, 20.0, 13.0, 20.0, 12.0, 14.0, 9.0, 6.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-162.625, -157.50390625, -152.3828125, -147.26171875, -142.140625, -137.01953125, -131.8984375, -126.77734375, -121.65625, -116.53515625, -111.4140625, -106.29296875, -101.171875, -96.05078125, -90.9296875, -85.80859375, -80.6875, -75.56640625, -70.4453125, -65.32421875, -60.203125, -55.08203125, -49.9609375, -44.83984375, -39.71875, -34.59765625, -29.4765625, -24.35546875, -19.234375, -14.11328125, -8.9921875, -3.87109375, 1.25, 6.37109375, 11.4921875, 16.61328125, 21.734375, 26.85546875, 31.9765625, 37.09765625, 42.21875, 47.33984375, 52.4609375, 57.58203125, 62.703125, 67.82421875, 72.9453125, 78.06640625, 83.1875, 88.30859375, 93.4296875, 98.55078125, 103.671875, 108.79296875, 113.9140625, 119.03515625, 124.15625, 129.27734375, 134.3984375, 139.51953125, 144.640625, 149.76171875, 154.8828125, 160.00390625, 165.125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 7.0, 10.0, 16.0, 14.0, 34.0, 28.0, 30.0, 41.0, 70.0, 90.0, 156.0, 254.0, 713.0, 2500.0, 16453.0, 830380.0, 186802.0, 8211.0, 1601.0, 430.0, 183.0, 150.0, 93.0, 62.0, 37.0, 25.0, 22.0, 20.0, 12.0, 13.0, 17.0, 10.0, 11.0, 4.0, 10.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-86.6875, -83.96484375, -81.2421875, -78.51953125, -75.796875, -73.07421875, -70.3515625, -67.62890625, -64.90625, -62.18359375, -59.4609375, -56.73828125, -54.015625, -51.29296875, -48.5703125, -45.84765625, -43.125, -40.40234375, -37.6796875, -34.95703125, -32.234375, -29.51171875, -26.7890625, -24.06640625, -21.34375, -18.62109375, -15.8984375, -13.17578125, -10.453125, -7.73046875, -5.0078125, -2.28515625, 0.4375, 3.16015625, 5.8828125, 8.60546875, 11.328125, 14.05078125, 16.7734375, 19.49609375, 22.21875, 24.94140625, 27.6640625, 30.38671875, 33.109375, 35.83203125, 38.5546875, 41.27734375, 44.0, 46.72265625, 49.4453125, 52.16796875, 54.890625, 57.61328125, 60.3359375, 63.05859375, 65.78125, 68.50390625, 71.2265625, 73.94921875, 76.671875, 79.39453125, 82.1171875, 84.83984375, 87.5625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 1.0, 8.0, 9.0, 10.0, 20.0, 19.0, 32.0, 41.0, 51.0, 73.0, 104.0, 158.0, 121.0, 99.0, 72.0, 41.0, 34.0, 26.0, 24.0, 11.0, 8.0, 9.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01403045654296875, -0.013669848442077637, -0.013309240341186523, -0.01294863224029541, -0.012588024139404297, -0.012227416038513184, -0.01186680793762207, -0.011506199836730957, -0.011145591735839844, -0.01078498363494873, -0.010424375534057617, -0.010063767433166504, -0.00970315933227539, -0.009342551231384277, -0.008981943130493164, -0.00862133502960205, -0.008260726928710938, -0.007900118827819824, -0.007539510726928711, -0.007178902626037598, -0.006818294525146484, -0.006457686424255371, -0.006097078323364258, -0.0057364702224731445, -0.005375862121582031, -0.005015254020690918, -0.004654645919799805, -0.004294037818908691, -0.003933429718017578, -0.003572821617126465, -0.0032122135162353516, -0.0028516054153442383, -0.002490997314453125, -0.0021303892135620117, -0.0017697811126708984, -0.0014091730117797852, -0.0010485649108886719, -0.0006879568099975586, -0.0003273487091064453, 3.325939178466797e-05, 0.00039386749267578125, 0.0007544755935668945, 0.0011150836944580078, 0.001475691795349121, 0.0018362998962402344, 0.0021969079971313477, 0.002557516098022461, 0.0029181241989135742, 0.0032787322998046875, 0.0036393404006958008, 0.003999948501586914, 0.004360556602478027, 0.004721164703369141, 0.005081772804260254, 0.005442380905151367, 0.0058029890060424805, 0.006163597106933594, 0.006524205207824707, 0.00688481330871582, 0.007245421409606934, 0.007606029510498047, 0.00796663761138916, 0.008327245712280273, 0.008687853813171387, 0.0090484619140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 2.0, 13.0, 8.0, 14.0, 19.0, 28.0, 40.0, 84.0, 106.0, 224.0, 500.0, 1215.0, 4067.0, 23006.0, 929454.0, 79430.0, 7054.0, 1898.0, 665.0, 295.0, 145.0, 95.0, 57.0, 34.0, 30.0, 22.0, 11.0, 14.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-90.75, -87.5869140625, -84.423828125, -81.2607421875, -78.09765625, -74.9345703125, -71.771484375, -68.6083984375, -65.4453125, -62.2822265625, -59.119140625, -55.9560546875, -52.79296875, -49.6298828125, -46.466796875, -43.3037109375, -40.140625, -36.9775390625, -33.814453125, -30.6513671875, -27.48828125, -24.3251953125, -21.162109375, -17.9990234375, -14.8359375, -11.6728515625, -8.509765625, -5.3466796875, -2.18359375, 0.9794921875, 4.142578125, 7.3056640625, 10.46875, 13.6318359375, 16.794921875, 19.9580078125, 23.12109375, 26.2841796875, 29.447265625, 32.6103515625, 35.7734375, 38.9365234375, 42.099609375, 45.2626953125, 48.42578125, 51.5888671875, 54.751953125, 57.9150390625, 61.078125, 64.2412109375, 67.404296875, 70.5673828125, 73.73046875, 76.8935546875, 80.056640625, 83.2197265625, 86.3828125, 89.5458984375, 92.708984375, 95.8720703125, 99.03515625, 102.1982421875, 105.361328125, 108.5244140625, 111.6875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 7.0, 19.0, 49.0, 107.0, 223.0, 243.0, 182.0, 73.0, 38.0, 18.0, 12.0, 3.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5, -70.193359375, -66.88671875, -63.580078125, -60.2734375, -56.966796875, -53.66015625, -50.353515625, -47.046875, -43.740234375, -40.43359375, -37.126953125, -33.8203125, -30.513671875, -27.20703125, -23.900390625, -20.59375, -17.287109375, -13.98046875, -10.673828125, -7.3671875, -4.060546875, -0.75390625, 2.552734375, 5.859375, 9.166015625, 12.47265625, 15.779296875, 19.0859375, 22.392578125, 25.69921875, 29.005859375, 32.3125, 35.619140625, 38.92578125, 42.232421875, 45.5390625, 48.845703125, 52.15234375, 55.458984375, 58.765625, 62.072265625, 65.37890625, 68.685546875, 71.9921875, 75.298828125, 78.60546875, 81.912109375, 85.21875, 88.525390625, 91.83203125, 95.138671875, 98.4453125, 101.751953125, 105.05859375, 108.365234375, 111.671875, 114.978515625, 118.28515625, 121.591796875, 124.8984375, 128.205078125, 131.51171875, 134.818359375, 138.125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 18.0, 18.0, 49.0, 119.0, 190.0, 296.0, 155.0, 67.0, 37.0, 16.0, 11.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1079.8812255859375, -1046.6134033203125, -1013.345703125, -980.0779418945312, -946.8101806640625, -913.5423583984375, -880.2745971679688, -847.0068359375, -813.7390747070312, -780.4713134765625, -747.2035522460938, -713.935791015625, -680.66796875, -647.4002685546875, -614.1324462890625, -580.8646850585938, -547.596923828125, -514.3291625976562, -481.0614013671875, -447.7936096191406, -414.5258483886719, -381.2580871582031, -347.99029541015625, -314.7225341796875, -281.45477294921875, -248.18701171875, -214.9192352294922, -181.65145874023438, -148.38369750976562, -115.11593627929688, -81.84815979003906, -48.58038330078125, -15.312744140625, 17.95502471923828, 51.22279357910156, 84.49056243896484, 117.75833129882812, 151.02609252929688, 184.2938690185547, 217.5616455078125, 250.82940673828125, 284.09716796875, 317.36492919921875, 350.6327209472656, 383.9004821777344, 417.1682434082031, 450.43603515625, 483.70379638671875, 516.9715576171875, 550.2393188476562, 583.507080078125, 616.7748413085938, 650.0426025390625, 683.3104248046875, 716.5781860351562, 749.845947265625, 783.1137084960938, 816.3814697265625, 849.6492309570312, 882.9169921875, 916.184814453125, 949.4525146484375, 982.7203369140625, 1015.9880981445312, 1049.255859375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 16.0, 22.0, 29.0, 31.0, 38.0, 41.0, 52.0, 65.0, 85.0, 98.0, 112.0, 76.0, 46.0, 58.0, 65.0, 26.0, 23.0, 26.0, 20.0, 19.0, 11.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-686.9322509765625, -661.5528564453125, -636.1734619140625, -610.7941284179688, -585.4147338867188, -560.0353393554688, -534.6559448242188, -509.2765808105469, -483.897216796875, -458.517822265625, -433.1384582519531, -407.7590637207031, -382.37969970703125, -357.00030517578125, -331.62091064453125, -306.2415466308594, -280.8621520996094, -255.48277282714844, -230.1033935546875, -204.7239990234375, -179.34463500976562, -153.96524047851562, -128.5858612060547, -103.20648193359375, -77.82710266113281, -52.447723388671875, -27.068340301513672, -1.6889572143554688, 23.69042205810547, 49.069801330566406, 74.44918823242188, 99.82856750488281, 125.20794677734375, 150.5873260498047, 175.96670532226562, 201.34609985351562, 226.7254638671875, 252.1048583984375, 277.4842529296875, 302.8636169433594, 328.24298095703125, 353.62237548828125, 379.0017395019531, 404.3811340332031, 429.760498046875, 455.139892578125, 480.519287109375, 505.8986511230469, 531.278076171875, 556.657470703125, 582.036865234375, 607.4161987304688, 632.7955932617188, 658.1749877929688, 683.5543823242188, 708.9337158203125, 734.3131103515625, 759.6925048828125, 785.0718994140625, 810.4512329101562, 835.8306274414062, 861.2100219726562, 886.5894165039062, 911.96875, 937.34814453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 16.0, 19.0, 40.0, 48.0, 62.0, 126.0, 221.0, 491.0, 1612.0, 9873.0, 393830.0, 3739358.0, 43076.0, 3724.0, 838.0, 347.0, 225.0, 118.0, 85.0, 47.0, 37.0, 21.0, 17.0, 13.0, 3.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.5625, -106.3525390625, -102.142578125, -97.9326171875, -93.72265625, -89.5126953125, -85.302734375, -81.0927734375, -76.8828125, -72.6728515625, -68.462890625, -64.2529296875, -60.04296875, -55.8330078125, -51.623046875, -47.4130859375, -43.203125, -38.9931640625, -34.783203125, -30.5732421875, -26.36328125, -22.1533203125, -17.943359375, -13.7333984375, -9.5234375, -5.3134765625, -1.103515625, 3.1064453125, 7.31640625, 11.5263671875, 15.736328125, 19.9462890625, 24.15625, 28.3662109375, 32.576171875, 36.7861328125, 40.99609375, 45.2060546875, 49.416015625, 53.6259765625, 57.8359375, 62.0458984375, 66.255859375, 70.4658203125, 74.67578125, 78.8857421875, 83.095703125, 87.3056640625, 91.515625, 95.7255859375, 99.935546875, 104.1455078125, 108.35546875, 112.5654296875, 116.775390625, 120.9853515625, 125.1953125, 129.4052734375, 133.615234375, 137.8251953125, 142.03515625, 146.2451171875, 150.455078125, 154.6650390625, 158.875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 5.0, 5.0, 10.0, 17.0, 14.0, 11.0, 15.0, 21.0, 29.0, 41.0, 33.0, 28.0, 48.0, 60.0, 35.0, 53.0, 56.0, 58.0, 29.0, 52.0, 43.0, 45.0, 53.0, 37.0, 26.0, 36.0, 31.0, 19.0, 24.0, 17.0, 13.0, 9.0, 6.0, 8.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.021240234375, -24.99560546875, -23.969970703125, -22.9443359375, -21.918701171875, -20.89306640625, -19.867431640625, -18.841796875, -17.816162109375, -16.79052734375, -15.764892578125, -14.7392578125, -13.713623046875, -12.68798828125, -11.662353515625, -10.63671875, -9.611083984375, -8.58544921875, -7.559814453125, -6.5341796875, -5.508544921875, -4.48291015625, -3.457275390625, -2.431640625, -1.406005859375, -0.38037109375, 0.645263671875, 1.6708984375, 2.696533203125, 3.72216796875, 4.747802734375, 5.7734375, 6.799072265625, 7.82470703125, 8.850341796875, 9.8759765625, 10.901611328125, 11.92724609375, 12.952880859375, 13.978515625, 15.004150390625, 16.02978515625, 17.055419921875, 18.0810546875, 19.106689453125, 20.13232421875, 21.157958984375, 22.18359375, 23.209228515625, 24.23486328125, 25.260498046875, 26.2861328125, 27.311767578125, 28.33740234375, 29.363037109375, 30.388671875, 31.414306640625, 32.43994140625, 33.465576171875, 34.4912109375, 35.516845703125, 36.54248046875, 37.568115234375, 38.59375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 15.0, 17.0, 23.0, 34.0, 58.0, 106.0, 214.0, 445.0, 1173.0, 3358.0, 12758.0, 77189.0, 1986288.0, 2010719.0, 80964.0, 14048.0, 4073.0, 1461.0, 666.0, 322.0, 136.0, 76.0, 51.0, 35.0, 10.0, 16.0, 10.0, 4.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.6875, -82.041015625, -79.39453125, -76.748046875, -74.1015625, -71.455078125, -68.80859375, -66.162109375, -63.515625, -60.869140625, -58.22265625, -55.576171875, -52.9296875, -50.283203125, -47.63671875, -44.990234375, -42.34375, -39.697265625, -37.05078125, -34.404296875, -31.7578125, -29.111328125, -26.46484375, -23.818359375, -21.171875, -18.525390625, -15.87890625, -13.232421875, -10.5859375, -7.939453125, -5.29296875, -2.646484375, 0.0, 2.646484375, 5.29296875, 7.939453125, 10.5859375, 13.232421875, 15.87890625, 18.525390625, 21.171875, 23.818359375, 26.46484375, 29.111328125, 31.7578125, 34.404296875, 37.05078125, 39.697265625, 42.34375, 44.990234375, 47.63671875, 50.283203125, 52.9296875, 55.576171875, 58.22265625, 60.869140625, 63.515625, 66.162109375, 68.80859375, 71.455078125, 74.1015625, 76.748046875, 79.39453125, 82.041015625, 84.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 18.0, 22.0, 29.0, 47.0, 78.0, 118.0, 202.0, 340.0, 694.0, 877.0, 635.0, 386.0, 232.0, 132.0, 66.0, 39.0, 39.0, 27.0, 20.0, 12.0, 7.0, 5.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.125, -66.515625, -63.90625, -61.296875, -58.6875, -56.078125, -53.46875, -50.859375, -48.25, -45.640625, -43.03125, -40.421875, -37.8125, -35.203125, -32.59375, -29.984375, -27.375, -24.765625, -22.15625, -19.546875, -16.9375, -14.328125, -11.71875, -9.109375, -6.5, -3.890625, -1.28125, 1.328125, 3.9375, 6.546875, 9.15625, 11.765625, 14.375, 16.984375, 19.59375, 22.203125, 24.8125, 27.421875, 30.03125, 32.640625, 35.25, 37.859375, 40.46875, 43.078125, 45.6875, 48.296875, 50.90625, 53.515625, 56.125, 58.734375, 61.34375, 63.953125, 66.5625, 69.171875, 71.78125, 74.390625, 77.0, 79.609375, 82.21875, 84.828125, 87.4375, 90.046875, 92.65625, 95.265625, 97.875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 3.0, 8.0, 15.0, 23.0, 57.0, 127.0, 224.0, 270.0, 156.0, 60.0, 25.0, 13.0, 9.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-657.460205078125, -627.7137451171875, -597.9672241210938, -568.2207641601562, -538.4743041992188, -508.7278137207031, -478.9813232421875, -449.23486328125, -419.4883728027344, -389.74188232421875, -359.99542236328125, -330.2489318847656, -300.50244140625, -270.7559814453125, -241.00949096679688, -211.2630157470703, -181.51654052734375, -151.7700653076172, -122.0235824584961, -92.277099609375, -62.53062438964844, -32.784149169921875, -3.03765869140625, 26.708816528320312, 56.455291748046875, 86.20176696777344, 115.94824981689453, 145.69473266601562, 175.4412078857422, 205.18768310546875, 234.93417358398438, 264.6806640625, 294.4271240234375, 324.1736145019531, 353.9200744628906, 383.66656494140625, 413.41302490234375, 443.1595153808594, 472.906005859375, 502.6524658203125, 532.39892578125, 562.1453857421875, 591.8919067382812, 621.6383666992188, 651.3848266601562, 681.13134765625, 710.8778076171875, 740.624267578125, 770.3707885742188, 800.1172485351562, 829.86376953125, 859.6102294921875, 889.356689453125, 919.1031494140625, 948.8496704101562, 978.5961303710938, 1008.3426513671875, 1038.089111328125, 1067.8355712890625, 1097.58203125, 1127.32861328125, 1157.0750732421875, 1186.821533203125, 1216.5679931640625, 1246.314453125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 11.0, 11.0, 7.0, 14.0, 9.0, 15.0, 35.0, 22.0, 26.0, 48.0, 49.0, 55.0, 67.0, 63.0, 50.0, 53.0, 49.0, 57.0, 49.0, 38.0, 44.0, 39.0, 34.0, 28.0, 26.0, 23.0, 14.0, 11.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-426.2154541015625, -414.5389709472656, -402.86248779296875, -391.18597412109375, -379.5094909667969, -367.8330078125, -356.1565246582031, -344.48004150390625, -332.80352783203125, -321.1270446777344, -309.4505615234375, -297.7740478515625, -286.0975646972656, -274.42108154296875, -262.7445983886719, -251.06809997558594, -239.39161682128906, -227.7151336669922, -216.03863525390625, -204.36215209960938, -192.68565368652344, -181.00917053222656, -169.33267211914062, -157.65618896484375, -145.97970581054688, -134.30322265625, -122.62672424316406, -110.95024108886719, -99.27374267578125, -87.59725952148438, -75.92076873779297, -64.24427795410156, -52.567779541015625, -40.89128875732422, -29.214799880981445, -17.538311004638672, -5.861820220947266, 5.814670562744141, 17.49115753173828, 29.167648315429688, 40.844139099121094, 52.5206298828125, 64.1971206665039, 75.87361145019531, 87.55009460449219, 99.22659301757812, 110.903076171875, 122.5795669555664, 134.2560577392578, 145.9325408935547, 157.60903930664062, 169.2855224609375, 180.96202087402344, 192.6385040283203, 204.31500244140625, 215.99148559570312, 227.66796875, 239.34445190429688, 251.0209503173828, 262.69744873046875, 274.3739318847656, 286.0504150390625, 297.7268981933594, 309.40338134765625, 321.07989501953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 4.0, 8.0, 9.0, 25.0, 25.0, 31.0, 31.0, 63.0, 90.0, 127.0, 183.0, 313.0, 544.0, 1058.0, 2075.0, 4609.0, 11896.0, 34788.0, 117439.0, 402453.0, 334228.0, 92629.0, 28231.0, 9622.0, 3861.0, 1847.0, 954.0, 486.0, 309.0, 185.0, 108.0, 85.0, 50.0, 33.0, 40.0, 23.0, 18.0, 17.0, 10.0, 12.0, 9.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-74.1875, -71.8623046875, -69.537109375, -67.2119140625, -64.88671875, -62.5615234375, -60.236328125, -57.9111328125, -55.5859375, -53.2607421875, -50.935546875, -48.6103515625, -46.28515625, -43.9599609375, -41.634765625, -39.3095703125, -36.984375, -34.6591796875, -32.333984375, -30.0087890625, -27.68359375, -25.3583984375, -23.033203125, -20.7080078125, -18.3828125, -16.0576171875, -13.732421875, -11.4072265625, -9.08203125, -6.7568359375, -4.431640625, -2.1064453125, 0.21875, 2.5439453125, 4.869140625, 7.1943359375, 9.51953125, 11.8447265625, 14.169921875, 16.4951171875, 18.8203125, 21.1455078125, 23.470703125, 25.7958984375, 28.12109375, 30.4462890625, 32.771484375, 35.0966796875, 37.421875, 39.7470703125, 42.072265625, 44.3974609375, 46.72265625, 49.0478515625, 51.373046875, 53.6982421875, 56.0234375, 58.3486328125, 60.673828125, 62.9990234375, 65.32421875, 67.6494140625, 69.974609375, 72.2998046875, 74.625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 6.0, 7.0, 7.0, 13.0, 14.0, 14.0, 23.0, 24.0, 24.0, 27.0, 41.0, 43.0, 52.0, 51.0, 58.0, 51.0, 56.0, 41.0, 39.0, 55.0, 44.0, 48.0, 40.0, 27.0, 41.0, 33.0, 23.0, 20.0, 19.0, 19.0, 6.0, 9.0, 11.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.109375, -29.073974609375, -28.03857421875, -27.003173828125, -25.9677734375, -24.932373046875, -23.89697265625, -22.861572265625, -21.826171875, -20.790771484375, -19.75537109375, -18.719970703125, -17.6845703125, -16.649169921875, -15.61376953125, -14.578369140625, -13.54296875, -12.507568359375, -11.47216796875, -10.436767578125, -9.4013671875, -8.365966796875, -7.33056640625, -6.295166015625, -5.259765625, -4.224365234375, -3.18896484375, -2.153564453125, -1.1181640625, -0.082763671875, 0.95263671875, 1.988037109375, 3.0234375, 4.058837890625, 5.09423828125, 6.129638671875, 7.1650390625, 8.200439453125, 9.23583984375, 10.271240234375, 11.306640625, 12.342041015625, 13.37744140625, 14.412841796875, 15.4482421875, 16.483642578125, 17.51904296875, 18.554443359375, 19.58984375, 20.625244140625, 21.66064453125, 22.696044921875, 23.7314453125, 24.766845703125, 25.80224609375, 26.837646484375, 27.873046875, 28.908447265625, 29.94384765625, 30.979248046875, 32.0146484375, 33.050048828125, 34.08544921875, 35.120849609375, 36.15625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 15.0, 17.0, 18.0, 30.0, 60.0, 93.0, 150.0, 237.0, 406.0, 777.0, 1676.0, 5004.0, 35318.0, 794701.0, 191909.0, 12793.0, 2882.0, 1129.0, 530.0, 307.0, 181.0, 103.0, 63.0, 47.0, 32.0, 21.0, 8.0, 12.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-243.625, -237.5, -231.375, -225.25, -219.125, -213.0, -206.875, -200.75, -194.625, -188.5, -182.375, -176.25, -170.125, -164.0, -157.875, -151.75, -145.625, -139.5, -133.375, -127.25, -121.125, -115.0, -108.875, -102.75, -96.625, -90.5, -84.375, -78.25, -72.125, -66.0, -59.875, -53.75, -47.625, -41.5, -35.375, -29.25, -23.125, -17.0, -10.875, -4.75, 1.375, 7.5, 13.625, 19.75, 25.875, 32.0, 38.125, 44.25, 50.375, 56.5, 62.625, 68.75, 74.875, 81.0, 87.125, 93.25, 99.375, 105.5, 111.625, 117.75, 123.875, 130.0, 136.125, 142.25, 148.375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 12.0, 8.0, 13.0, 9.0, 16.0, 18.0, 21.0, 30.0, 30.0, 26.0, 24.0, 36.0, 42.0, 31.0, 48.0, 47.0, 57.0, 60.0, 30.0, 45.0, 53.0, 53.0, 37.0, 36.0, 30.0, 30.0, 31.0, 17.0, 16.0, 19.0, 14.0, 6.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.25, -109.62109375, -105.9921875, -102.36328125, -98.734375, -95.10546875, -91.4765625, -87.84765625, -84.21875, -80.58984375, -76.9609375, -73.33203125, -69.703125, -66.07421875, -62.4453125, -58.81640625, -55.1875, -51.55859375, -47.9296875, -44.30078125, -40.671875, -37.04296875, -33.4140625, -29.78515625, -26.15625, -22.52734375, -18.8984375, -15.26953125, -11.640625, -8.01171875, -4.3828125, -0.75390625, 2.875, 6.50390625, 10.1328125, 13.76171875, 17.390625, 21.01953125, 24.6484375, 28.27734375, 31.90625, 35.53515625, 39.1640625, 42.79296875, 46.421875, 50.05078125, 53.6796875, 57.30859375, 60.9375, 64.56640625, 68.1953125, 71.82421875, 75.453125, 79.08203125, 82.7109375, 86.33984375, 89.96875, 93.59765625, 97.2265625, 100.85546875, 104.484375, 108.11328125, 111.7421875, 115.37109375, 119.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 9.0, 8.0, 5.0, 18.0, 17.0, 30.0, 37.0, 59.0, 85.0, 132.0, 217.0, 434.0, 1016.0, 3454.0, 20627.0, 663979.0, 337987.0, 15566.0, 2965.0, 889.0, 412.0, 207.0, 136.0, 83.0, 37.0, 44.0, 28.0, 25.0, 14.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-70.875, -68.90283203125, -66.9306640625, -64.95849609375, -62.986328125, -61.01416015625, -59.0419921875, -57.06982421875, -55.09765625, -53.12548828125, -51.1533203125, -49.18115234375, -47.208984375, -45.23681640625, -43.2646484375, -41.29248046875, -39.3203125, -37.34814453125, -35.3759765625, -33.40380859375, -31.431640625, -29.45947265625, -27.4873046875, -25.51513671875, -23.54296875, -21.57080078125, -19.5986328125, -17.62646484375, -15.654296875, -13.68212890625, -11.7099609375, -9.73779296875, -7.765625, -5.79345703125, -3.8212890625, -1.84912109375, 0.123046875, 2.09521484375, 4.0673828125, 6.03955078125, 8.01171875, 9.98388671875, 11.9560546875, 13.92822265625, 15.900390625, 17.87255859375, 19.8447265625, 21.81689453125, 23.7890625, 25.76123046875, 27.7333984375, 29.70556640625, 31.677734375, 33.64990234375, 35.6220703125, 37.59423828125, 39.56640625, 41.53857421875, 43.5107421875, 45.48291015625, 47.455078125, 49.42724609375, 51.3994140625, 53.37158203125, 55.34375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 4.0, 7.0, 8.0, 7.0, 5.0, 12.0, 13.0, 16.0, 17.0, 38.0, 41.0, 67.0, 60.0, 93.0, 112.0, 106.0, 84.0, 69.0, 44.0, 36.0, 33.0, 24.0, 18.0, 13.0, 18.0, 9.0, 9.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00897216796875, -0.008716464042663574, -0.008460760116577148, -0.008205056190490723, -0.007949352264404297, -0.007693648338317871, -0.007437944412231445, -0.0071822404861450195, -0.006926536560058594, -0.006670832633972168, -0.006415128707885742, -0.006159424781799316, -0.005903720855712891, -0.005648016929626465, -0.005392313003540039, -0.005136609077453613, -0.0048809051513671875, -0.004625201225280762, -0.004369497299194336, -0.00411379337310791, -0.0038580894470214844, -0.0036023855209350586, -0.003346681594848633, -0.003090977668762207, -0.0028352737426757812, -0.0025795698165893555, -0.0023238658905029297, -0.002068161964416504, -0.0018124580383300781, -0.0015567541122436523, -0.0013010501861572266, -0.0010453462600708008, -0.000789642333984375, -0.0005339384078979492, -0.00027823448181152344, -2.2530555725097656e-05, 0.00023317337036132812, 0.0004888772964477539, 0.0007445812225341797, 0.0010002851486206055, 0.0012559890747070312, 0.001511693000793457, 0.0017673969268798828, 0.0020231008529663086, 0.0022788047790527344, 0.00253450870513916, 0.002790212631225586, 0.0030459165573120117, 0.0033016204833984375, 0.0035573244094848633, 0.003813028335571289, 0.004068732261657715, 0.004324436187744141, 0.004580140113830566, 0.004835844039916992, 0.005091547966003418, 0.005347251892089844, 0.0056029558181762695, 0.005858659744262695, 0.006114363670349121, 0.006370067596435547, 0.006625771522521973, 0.0068814754486083984, 0.007137179374694824, 0.00739288330078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 2.0, 14.0, 16.0, 15.0, 27.0, 46.0, 73.0, 89.0, 143.0, 256.0, 437.0, 974.0, 2334.0, 7015.0, 34978.0, 663351.0, 306183.0, 23443.0, 5341.0, 1953.0, 805.0, 397.0, 234.0, 124.0, 84.0, 56.0, 42.0, 32.0, 15.0, 13.0, 8.0, 16.0, 3.0, 3.0, 11.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.96875, -35.48388671875, -33.9990234375, -32.51416015625, -31.029296875, -29.54443359375, -28.0595703125, -26.57470703125, -25.08984375, -23.60498046875, -22.1201171875, -20.63525390625, -19.150390625, -17.66552734375, -16.1806640625, -14.69580078125, -13.2109375, -11.72607421875, -10.2412109375, -8.75634765625, -7.271484375, -5.78662109375, -4.3017578125, -2.81689453125, -1.33203125, 0.15283203125, 1.6376953125, 3.12255859375, 4.607421875, 6.09228515625, 7.5771484375, 9.06201171875, 10.546875, 12.03173828125, 13.5166015625, 15.00146484375, 16.486328125, 17.97119140625, 19.4560546875, 20.94091796875, 22.42578125, 23.91064453125, 25.3955078125, 26.88037109375, 28.365234375, 29.85009765625, 31.3349609375, 32.81982421875, 34.3046875, 35.78955078125, 37.2744140625, 38.75927734375, 40.244140625, 41.72900390625, 43.2138671875, 44.69873046875, 46.18359375, 47.66845703125, 49.1533203125, 50.63818359375, 52.123046875, 53.60791015625, 55.0927734375, 56.57763671875, 58.0625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 3.0, 11.0, 14.0, 18.0, 41.0, 57.0, 86.0, 131.0, 160.0, 149.0, 125.0, 69.0, 43.0, 25.0, 16.0, 8.0, 5.0, 6.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.3125, -51.6318359375, -49.951171875, -48.2705078125, -46.58984375, -44.9091796875, -43.228515625, -41.5478515625, -39.8671875, -38.1865234375, -36.505859375, -34.8251953125, -33.14453125, -31.4638671875, -29.783203125, -28.1025390625, -26.421875, -24.7412109375, -23.060546875, -21.3798828125, -19.69921875, -18.0185546875, -16.337890625, -14.6572265625, -12.9765625, -11.2958984375, -9.615234375, -7.9345703125, -6.25390625, -4.5732421875, -2.892578125, -1.2119140625, 0.46875, 2.1494140625, 3.830078125, 5.5107421875, 7.19140625, 8.8720703125, 10.552734375, 12.2333984375, 13.9140625, 15.5947265625, 17.275390625, 18.9560546875, 20.63671875, 22.3173828125, 23.998046875, 25.6787109375, 27.359375, 29.0400390625, 30.720703125, 32.4013671875, 34.08203125, 35.7626953125, 37.443359375, 39.1240234375, 40.8046875, 42.4853515625, 44.166015625, 45.8466796875, 47.52734375, 49.2080078125, 50.888671875, 52.5693359375, 54.25]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 10.0, 46.0, 185.0, 430.0, 209.0, 65.0, 19.0, 8.0, 5.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1132.900390625, -1082.6402587890625, -1032.380126953125, -982.1199340820312, -931.8598022460938, -881.5996704101562, -831.3394775390625, -781.079345703125, -730.8192138671875, -680.55908203125, -630.2989501953125, -580.0387573242188, -529.7786254882812, -479.51849365234375, -429.2583312988281, -378.9981689453125, -328.738037109375, -278.4779052734375, -228.21774291992188, -177.9575958251953, -127.69744873046875, -77.43730163574219, -27.177154541015625, 23.0830078125, 73.3431396484375, 123.60328674316406, 173.86343383789062, 224.1235809326172, 274.38372802734375, 324.64385986328125, 374.9040222167969, 425.1641845703125, 475.42431640625, 525.6844482421875, 575.944580078125, 626.2047729492188, 676.4649047851562, 726.7250366210938, 776.9852294921875, 827.245361328125, 877.5054931640625, 927.765625, 978.0257568359375, 1028.285888671875, 1078.546142578125, 1128.8062744140625, 1179.06640625, 1229.3265380859375, 1279.586669921875, 1329.8468017578125, 1380.10693359375, 1430.3670654296875, 1480.627197265625, 1530.887451171875, 1581.1475830078125, 1631.40771484375, 1681.6678466796875, 1731.927978515625, 1782.1881103515625, 1832.4482421875, 1882.70849609375, 1932.9686279296875, 1983.228759765625, 2033.4888916015625, 2083.7490234375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 9.0, 4.0, 10.0, 21.0, 16.0, 17.0, 25.0, 34.0, 24.0, 22.0, 31.0, 37.0, 34.0, 45.0, 59.0, 71.0, 69.0, 70.0, 40.0, 42.0, 41.0, 27.0, 31.0, 22.0, 35.0, 20.0, 15.0, 13.0, 14.0, 18.0, 14.0, 16.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-459.073486328125, -444.3462829589844, -429.61907958984375, -414.891845703125, -400.1646423339844, -385.43743896484375, -370.710205078125, -355.9830017089844, -341.25579833984375, -326.5285949707031, -311.8013916015625, -297.07415771484375, -282.3469543457031, -267.6197509765625, -252.8925323486328, -238.16531372070312, -223.4381103515625, -208.71090698242188, -193.9836883544922, -179.2564697265625, -164.52926635742188, -149.80206298828125, -135.07484436035156, -120.3476333618164, -105.62042236328125, -90.8932113647461, -76.16600036621094, -61.43878936767578, -46.711578369140625, -31.98436737060547, -17.257156372070312, -2.5299453735351562, 12.197265625, 26.924476623535156, 41.65168762207031, 56.37889862060547, 71.10610961914062, 85.83332061767578, 100.56053161621094, 115.2877426147461, 130.01495361328125, 144.74215698242188, 159.46937561035156, 174.19659423828125, 188.92379760742188, 203.6510009765625, 218.3782196044922, 233.10543823242188, 247.8326416015625, 262.5598449707031, 277.28704833984375, 292.0142822265625, 306.7414855957031, 321.46868896484375, 336.1959228515625, 350.9231262207031, 365.65032958984375, 380.3775329589844, 395.104736328125, 409.83197021484375, 424.5591735839844, 439.286376953125, 454.01361083984375, 468.7408142089844, 483.468017578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 11.0, 10.0, 15.0, 34.0, 60.0, 112.0, 235.0, 483.0, 1364.0, 7247.0, 135502.0, 3964843.0, 76888.0, 5287.0, 1259.0, 440.0, 199.0, 114.0, 68.0, 23.0, 29.0, 15.0, 11.0, 5.0, 9.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.9375, -100.0068359375, -96.076171875, -92.1455078125, -88.21484375, -84.2841796875, -80.353515625, -76.4228515625, -72.4921875, -68.5615234375, -64.630859375, -60.7001953125, -56.76953125, -52.8388671875, -48.908203125, -44.9775390625, -41.046875, -37.1162109375, -33.185546875, -29.2548828125, -25.32421875, -21.3935546875, -17.462890625, -13.5322265625, -9.6015625, -5.6708984375, -1.740234375, 2.1904296875, 6.12109375, 10.0517578125, 13.982421875, 17.9130859375, 21.84375, 25.7744140625, 29.705078125, 33.6357421875, 37.56640625, 41.4970703125, 45.427734375, 49.3583984375, 53.2890625, 57.2197265625, 61.150390625, 65.0810546875, 69.01171875, 72.9423828125, 76.873046875, 80.8037109375, 84.734375, 88.6650390625, 92.595703125, 96.5263671875, 100.45703125, 104.3876953125, 108.318359375, 112.2490234375, 116.1796875, 120.1103515625, 124.041015625, 127.9716796875, 131.90234375, 135.8330078125, 139.763671875, 143.6943359375, 147.625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 13.0, 7.0, 23.0, 24.0, 37.0, 35.0, 46.0, 47.0, 64.0, 51.0, 77.0, 70.0, 63.0, 66.0, 62.0, 52.0, 44.0, 45.0, 37.0, 31.0, 23.0, 16.0, 18.0, 12.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.3125, -32.041015625, -30.76953125, -29.498046875, -28.2265625, -26.955078125, -25.68359375, -24.412109375, -23.140625, -21.869140625, -20.59765625, -19.326171875, -18.0546875, -16.783203125, -15.51171875, -14.240234375, -12.96875, -11.697265625, -10.42578125, -9.154296875, -7.8828125, -6.611328125, -5.33984375, -4.068359375, -2.796875, -1.525390625, -0.25390625, 1.017578125, 2.2890625, 3.560546875, 4.83203125, 6.103515625, 7.375, 8.646484375, 9.91796875, 11.189453125, 12.4609375, 13.732421875, 15.00390625, 16.275390625, 17.546875, 18.818359375, 20.08984375, 21.361328125, 22.6328125, 23.904296875, 25.17578125, 26.447265625, 27.71875, 28.990234375, 30.26171875, 31.533203125, 32.8046875, 34.076171875, 35.34765625, 36.619140625, 37.890625, 39.162109375, 40.43359375, 41.705078125, 42.9765625, 44.248046875, 45.51953125, 46.791015625, 48.0625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 11.0, 13.0, 24.0, 32.0, 53.0, 94.0, 153.0, 320.0, 595.0, 1358.0, 3441.0, 11791.0, 86355.0, 3630226.0, 426624.0, 23876.0, 5138.0, 1907.0, 1008.0, 547.0, 296.0, 169.0, 86.0, 53.0, 38.0, 20.0, 10.0, 6.0, 12.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.125, -105.0107421875, -101.896484375, -98.7822265625, -95.66796875, -92.5537109375, -89.439453125, -86.3251953125, -83.2109375, -80.0966796875, -76.982421875, -73.8681640625, -70.75390625, -67.6396484375, -64.525390625, -61.4111328125, -58.296875, -55.1826171875, -52.068359375, -48.9541015625, -45.83984375, -42.7255859375, -39.611328125, -36.4970703125, -33.3828125, -30.2685546875, -27.154296875, -24.0400390625, -20.92578125, -17.8115234375, -14.697265625, -11.5830078125, -8.46875, -5.3544921875, -2.240234375, 0.8740234375, 3.98828125, 7.1025390625, 10.216796875, 13.3310546875, 16.4453125, 19.5595703125, 22.673828125, 25.7880859375, 28.90234375, 32.0166015625, 35.130859375, 38.2451171875, 41.359375, 44.4736328125, 47.587890625, 50.7021484375, 53.81640625, 56.9306640625, 60.044921875, 63.1591796875, 66.2734375, 69.3876953125, 72.501953125, 75.6162109375, 78.73046875, 81.8447265625, 84.958984375, 88.0732421875, 91.1875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 14.0, 14.0, 18.0, 53.0, 108.0, 226.0, 598.0, 1466.0, 965.0, 335.0, 131.0, 61.0, 22.0, 21.0, 11.0, 9.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.875, -93.904296875, -89.93359375, -85.962890625, -81.9921875, -78.021484375, -74.05078125, -70.080078125, -66.109375, -62.138671875, -58.16796875, -54.197265625, -50.2265625, -46.255859375, -42.28515625, -38.314453125, -34.34375, -30.373046875, -26.40234375, -22.431640625, -18.4609375, -14.490234375, -10.51953125, -6.548828125, -2.578125, 1.392578125, 5.36328125, 9.333984375, 13.3046875, 17.275390625, 21.24609375, 25.216796875, 29.1875, 33.158203125, 37.12890625, 41.099609375, 45.0703125, 49.041015625, 53.01171875, 56.982421875, 60.953125, 64.923828125, 68.89453125, 72.865234375, 76.8359375, 80.806640625, 84.77734375, 88.748046875, 92.71875, 96.689453125, 100.66015625, 104.630859375, 108.6015625, 112.572265625, 116.54296875, 120.513671875, 124.484375, 128.455078125, 132.42578125, 136.396484375, 140.3671875, 144.337890625, 148.30859375, 152.279296875, 156.25]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 8.0, 15.0, 33.0, 118.0, 266.0, 315.0, 147.0, 43.0, 23.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-700.1126708984375, -666.9328002929688, -633.7528686523438, -600.572998046875, -567.39306640625, -534.2131958007812, -501.0333251953125, -467.8534240722656, -434.67352294921875, -401.4936218261719, -368.313720703125, -335.13385009765625, -301.9539489746094, -268.7740478515625, -235.5941619873047, -202.41427612304688, -169.234375, -136.05447387695312, -102.87458801269531, -69.69469451904297, -36.514801025390625, -3.33489990234375, 29.844985961914062, 63.024871826171875, 96.20477294921875, 129.38467407226562, 162.56455993652344, 195.74444580078125, 228.92434692382812, 262.104248046875, 295.28411865234375, 328.4640197753906, 361.64404296875, 394.8239440917969, 428.00384521484375, 461.1837158203125, 494.3636169433594, 527.5435180664062, 560.723388671875, 593.9033203125, 627.0831909179688, 660.2630615234375, 693.4429931640625, 726.6228637695312, 759.802734375, 792.982666015625, 826.1625366210938, 859.3424072265625, 892.5223388671875, 925.7022094726562, 958.8821411132812, 992.06201171875, 1025.241943359375, 1058.421875, 1091.6016845703125, 1124.7816162109375, 1157.96142578125, 1191.141357421875, 1224.3211669921875, 1257.5010986328125, 1290.6810302734375, 1323.86083984375, 1357.040771484375, 1390.220703125, 1423.400634765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 14.0, 16.0, 20.0, 22.0, 26.0, 33.0, 55.0, 48.0, 55.0, 50.0, 65.0, 68.0, 68.0, 68.0, 66.0, 72.0, 47.0, 32.0, 39.0, 25.0, 27.0, 19.0, 13.0, 12.0, 7.0, 5.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-532.0860595703125, -518.8864135742188, -505.6867370605469, -492.4870910644531, -479.28741455078125, -466.0877685546875, -452.88812255859375, -439.6884765625, -426.4888000488281, -413.2891540527344, -400.0894775390625, -386.88983154296875, -373.690185546875, -360.4905090332031, -347.2908630371094, -334.0911865234375, -320.89154052734375, -307.69189453125, -294.4922180175781, -281.2925720214844, -268.0928955078125, -254.89324951171875, -241.693603515625, -228.4939422607422, -215.29428100585938, -202.09461975097656, -188.89495849609375, -175.6953125, -162.4956512451172, -149.29598999023438, -136.09634399414062, -122.89668273925781, -109.697021484375, -96.49736022949219, -83.2977066040039, -70.09805297851562, -56.89839172363281, -43.69873046875, -30.49907684326172, -17.299423217773438, -4.099761962890625, 9.099895477294922, 22.29955291748047, 35.499210357666016, 48.69886779785156, 61.898529052734375, 75.09818267822266, 88.29783630371094, 101.49749755859375, 114.69715881347656, 127.89681243896484, 141.09646606445312, 154.29612731933594, 167.49578857421875, 180.6954345703125, 193.8950958251953, 207.09475708007812, 220.29441833496094, 233.49407958984375, 246.6937255859375, 259.89337158203125, 273.0930480957031, 286.2926940917969, 299.49237060546875, 312.6920166015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 18.0, 24.0, 28.0, 45.0, 58.0, 81.0, 166.0, 254.0, 444.0, 866.0, 1882.0, 4664.0, 13965.0, 50298.0, 206771.0, 479600.0, 213899.0, 52109.0, 14473.0, 4902.0, 1928.0, 910.0, 447.0, 253.0, 133.0, 93.0, 58.0, 40.0, 28.0, 25.0, 20.0, 11.0, 7.0, 9.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.15625, -57.15185546875, -55.1474609375, -53.14306640625, -51.138671875, -49.13427734375, -47.1298828125, -45.12548828125, -43.12109375, -41.11669921875, -39.1123046875, -37.10791015625, -35.103515625, -33.09912109375, -31.0947265625, -29.09033203125, -27.0859375, -25.08154296875, -23.0771484375, -21.07275390625, -19.068359375, -17.06396484375, -15.0595703125, -13.05517578125, -11.05078125, -9.04638671875, -7.0419921875, -5.03759765625, -3.033203125, -1.02880859375, 0.9755859375, 2.97998046875, 4.984375, 6.98876953125, 8.9931640625, 10.99755859375, 13.001953125, 15.00634765625, 17.0107421875, 19.01513671875, 21.01953125, 23.02392578125, 25.0283203125, 27.03271484375, 29.037109375, 31.04150390625, 33.0458984375, 35.05029296875, 37.0546875, 39.05908203125, 41.0634765625, 43.06787109375, 45.072265625, 47.07666015625, 49.0810546875, 51.08544921875, 53.08984375, 55.09423828125, 57.0986328125, 59.10302734375, 61.107421875, 63.11181640625, 65.1162109375, 67.12060546875, 69.125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3.0, 9.0, 19.0, 20.0, 29.0, 36.0, 52.0, 60.0, 69.0, 62.0, 79.0, 77.0, 96.0, 92.0, 64.0, 67.0, 37.0, 36.0, 22.0, 17.0, 15.0, 14.0, 10.0, 4.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.375, -40.84033203125, -39.3056640625, -37.77099609375, -36.236328125, -34.70166015625, -33.1669921875, -31.63232421875, -30.09765625, -28.56298828125, -27.0283203125, -25.49365234375, -23.958984375, -22.42431640625, -20.8896484375, -19.35498046875, -17.8203125, -16.28564453125, -14.7509765625, -13.21630859375, -11.681640625, -10.14697265625, -8.6123046875, -7.07763671875, -5.54296875, -4.00830078125, -2.4736328125, -0.93896484375, 0.595703125, 2.13037109375, 3.6650390625, 5.19970703125, 6.734375, 8.26904296875, 9.8037109375, 11.33837890625, 12.873046875, 14.40771484375, 15.9423828125, 17.47705078125, 19.01171875, 20.54638671875, 22.0810546875, 23.61572265625, 25.150390625, 26.68505859375, 28.2197265625, 29.75439453125, 31.2890625, 32.82373046875, 34.3583984375, 35.89306640625, 37.427734375, 38.96240234375, 40.4970703125, 42.03173828125, 43.56640625, 45.10107421875, 46.6357421875, 48.17041015625, 49.705078125, 51.23974609375, 52.7744140625, 54.30908203125, 55.84375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 10.0, 8.0, 6.0, 13.0, 13.0, 27.0, 26.0, 46.0, 59.0, 88.0, 133.0, 207.0, 349.0, 759.0, 1789.0, 5760.0, 23274.0, 130440.0, 653404.0, 187969.0, 32460.0, 7520.0, 2236.0, 855.0, 418.0, 211.0, 133.0, 95.0, 70.0, 49.0, 33.0, 29.0, 13.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-76.9375, -74.5029296875, -72.068359375, -69.6337890625, -67.19921875, -64.7646484375, -62.330078125, -59.8955078125, -57.4609375, -55.0263671875, -52.591796875, -50.1572265625, -47.72265625, -45.2880859375, -42.853515625, -40.4189453125, -37.984375, -35.5498046875, -33.115234375, -30.6806640625, -28.24609375, -25.8115234375, -23.376953125, -20.9423828125, -18.5078125, -16.0732421875, -13.638671875, -11.2041015625, -8.76953125, -6.3349609375, -3.900390625, -1.4658203125, 0.96875, 3.4033203125, 5.837890625, 8.2724609375, 10.70703125, 13.1416015625, 15.576171875, 18.0107421875, 20.4453125, 22.8798828125, 25.314453125, 27.7490234375, 30.18359375, 32.6181640625, 35.052734375, 37.4873046875, 39.921875, 42.3564453125, 44.791015625, 47.2255859375, 49.66015625, 52.0947265625, 54.529296875, 56.9638671875, 59.3984375, 61.8330078125, 64.267578125, 66.7021484375, 69.13671875, 71.5712890625, 74.005859375, 76.4404296875, 78.875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 5.0, 6.0, 8.0, 15.0, 14.0, 14.0, 14.0, 17.0, 20.0, 24.0, 28.0, 28.0, 35.0, 39.0, 36.0, 39.0, 48.0, 32.0, 35.0, 53.0, 43.0, 42.0, 35.0, 43.0, 37.0, 37.0, 33.0, 24.0, 20.0, 18.0, 30.0, 16.0, 16.0, 11.0, 9.0, 12.0, 10.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0], "bins": [-93.25, -90.46875, -87.6875, -84.90625, -82.125, -79.34375, -76.5625, -73.78125, -71.0, -68.21875, -65.4375, -62.65625, -59.875, -57.09375, -54.3125, -51.53125, -48.75, -45.96875, -43.1875, -40.40625, -37.625, -34.84375, -32.0625, -29.28125, -26.5, -23.71875, -20.9375, -18.15625, -15.375, -12.59375, -9.8125, -7.03125, -4.25, -1.46875, 1.3125, 4.09375, 6.875, 9.65625, 12.4375, 15.21875, 18.0, 20.78125, 23.5625, 26.34375, 29.125, 31.90625, 34.6875, 37.46875, 40.25, 43.03125, 45.8125, 48.59375, 51.375, 54.15625, 56.9375, 59.71875, 62.5, 65.28125, 68.0625, 70.84375, 73.625, 76.40625, 79.1875, 81.96875, 84.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 11.0, 12.0, 15.0, 23.0, 28.0, 29.0, 67.0, 122.0, 197.0, 345.0, 790.0, 1988.0, 5586.0, 18254.0, 71599.0, 322242.0, 515648.0, 80988.0, 20570.0, 6174.0, 2107.0, 858.0, 390.0, 193.0, 107.0, 68.0, 37.0, 34.0, 14.0, 15.0, 18.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.0625, -19.47314453125, -18.8837890625, -18.29443359375, -17.705078125, -17.11572265625, -16.5263671875, -15.93701171875, -15.34765625, -14.75830078125, -14.1689453125, -13.57958984375, -12.990234375, -12.40087890625, -11.8115234375, -11.22216796875, -10.6328125, -10.04345703125, -9.4541015625, -8.86474609375, -8.275390625, -7.68603515625, -7.0966796875, -6.50732421875, -5.91796875, -5.32861328125, -4.7392578125, -4.14990234375, -3.560546875, -2.97119140625, -2.3818359375, -1.79248046875, -1.203125, -0.61376953125, -0.0244140625, 0.56494140625, 1.154296875, 1.74365234375, 2.3330078125, 2.92236328125, 3.51171875, 4.10107421875, 4.6904296875, 5.27978515625, 5.869140625, 6.45849609375, 7.0478515625, 7.63720703125, 8.2265625, 8.81591796875, 9.4052734375, 9.99462890625, 10.583984375, 11.17333984375, 11.7626953125, 12.35205078125, 12.94140625, 13.53076171875, 14.1201171875, 14.70947265625, 15.298828125, 15.88818359375, 16.4775390625, 17.06689453125, 17.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 9.0, 8.0, 17.0, 17.0, 21.0, 22.0, 20.0, 31.0, 46.0, 63.0, 57.0, 57.0, 74.0, 73.0, 76.0, 80.0, 63.0, 45.0, 36.0, 37.0, 20.0, 19.0, 25.0, 13.0, 7.0, 9.0, 13.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0054931640625, -0.005337417125701904, -0.005181670188903809, -0.005025923252105713, -0.004870176315307617, -0.0047144293785095215, -0.004558682441711426, -0.00440293550491333, -0.004247188568115234, -0.004091441631317139, -0.003935694694519043, -0.0037799477577209473, -0.0036242008209228516, -0.003468453884124756, -0.00331270694732666, -0.0031569600105285645, -0.0030012130737304688, -0.002845466136932373, -0.0026897192001342773, -0.0025339722633361816, -0.002378225326538086, -0.0022224783897399902, -0.0020667314529418945, -0.0019109845161437988, -0.0017552375793457031, -0.0015994906425476074, -0.0014437437057495117, -0.001287996768951416, -0.0011322498321533203, -0.0009765028953552246, -0.0008207559585571289, -0.0006650090217590332, -0.0005092620849609375, -0.0003535151481628418, -0.0001977682113647461, -4.202127456665039e-05, 0.00011372566223144531, 0.000269472599029541, 0.0004252195358276367, 0.0005809664726257324, 0.0007367134094238281, 0.0008924603462219238, 0.0010482072830200195, 0.0012039542198181152, 0.001359701156616211, 0.0015154480934143066, 0.0016711950302124023, 0.001826941967010498, 0.0019826889038085938, 0.0021384358406066895, 0.002294182777404785, 0.002449929714202881, 0.0026056766510009766, 0.0027614235877990723, 0.002917170524597168, 0.0030729174613952637, 0.0032286643981933594, 0.003384411334991455, 0.0035401582717895508, 0.0036959052085876465, 0.003851652145385742, 0.004007399082183838, 0.004163146018981934, 0.004318892955780029, 0.004474639892578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 9.0, 16.0, 20.0, 33.0, 49.0, 80.0, 143.0, 287.0, 531.0, 1180.0, 2959.0, 9164.0, 37150.0, 195331.0, 644081.0, 122053.0, 24757.0, 6579.0, 2265.0, 900.0, 418.0, 204.0, 113.0, 81.0, 40.0, 34.0, 24.0, 19.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.0819091796875, -13.390380859375, -12.6988525390625, -12.00732421875, -11.3157958984375, -10.624267578125, -9.9327392578125, -9.2412109375, -8.5496826171875, -7.858154296875, -7.1666259765625, -6.47509765625, -5.7835693359375, -5.092041015625, -4.4005126953125, -3.708984375, -3.0174560546875, -2.325927734375, -1.6343994140625, -0.94287109375, -0.2513427734375, 0.440185546875, 1.1317138671875, 1.8232421875, 2.5147705078125, 3.206298828125, 3.8978271484375, 4.58935546875, 5.2808837890625, 5.972412109375, 6.6639404296875, 7.35546875, 8.0469970703125, 8.738525390625, 9.4300537109375, 10.12158203125, 10.8131103515625, 11.504638671875, 12.1961669921875, 12.8876953125, 13.5792236328125, 14.270751953125, 14.9622802734375, 15.65380859375, 16.3453369140625, 17.036865234375, 17.7283935546875, 18.419921875, 19.1114501953125, 19.802978515625, 20.4945068359375, 21.18603515625, 21.8775634765625, 22.569091796875, 23.2606201171875, 23.9521484375, 24.6436767578125, 25.335205078125, 26.0267333984375, 26.71826171875, 27.4097900390625, 28.101318359375, 28.7928466796875, 29.484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 11.0, 10.0, 18.0, 16.0, 24.0, 37.0, 42.0, 60.0, 85.0, 91.0, 85.0, 92.0, 82.0, 88.0, 63.0, 46.0, 36.0, 34.0, 13.0, 19.0, 15.0, 9.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.603759765625, -15.81689453125, -15.030029296875, -14.2431640625, -13.456298828125, -12.66943359375, -11.882568359375, -11.095703125, -10.308837890625, -9.52197265625, -8.735107421875, -7.9482421875, -7.161376953125, -6.37451171875, -5.587646484375, -4.80078125, -4.013916015625, -3.22705078125, -2.440185546875, -1.6533203125, -0.866455078125, -0.07958984375, 0.707275390625, 1.494140625, 2.281005859375, 3.06787109375, 3.854736328125, 4.6416015625, 5.428466796875, 6.21533203125, 7.002197265625, 7.7890625, 8.575927734375, 9.36279296875, 10.149658203125, 10.9365234375, 11.723388671875, 12.51025390625, 13.297119140625, 14.083984375, 14.870849609375, 15.65771484375, 16.444580078125, 17.2314453125, 18.018310546875, 18.80517578125, 19.592041015625, 20.37890625, 21.165771484375, 21.95263671875, 22.739501953125, 23.5263671875, 24.313232421875, 25.10009765625, 25.886962890625, 26.673828125, 27.460693359375, 28.24755859375, 29.034423828125, 29.8212890625, 30.608154296875, 31.39501953125, 32.181884765625, 32.96875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 18.0, 47.0, 186.0, 448.0, 197.0, 55.0, 20.0, 12.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-725.009033203125, -687.73828125, -650.467529296875, -613.19677734375, -575.926025390625, -538.6552734375, -501.38458251953125, -464.11383056640625, -426.84307861328125, -389.57232666015625, -352.30157470703125, -315.0308532714844, -277.7601013183594, -240.48934936523438, -203.21861267089844, -165.9478759765625, -128.6771240234375, -91.40637969970703, -54.13563537597656, -16.864891052246094, 20.405853271484375, 57.676605224609375, 94.94734191894531, 132.21807861328125, 169.48883056640625, 206.75958251953125, 244.0303192138672, 281.3010559082031, 318.5718078613281, 355.8425598144531, 393.11328125, 430.384033203125, 467.6546630859375, 504.9254150390625, 542.1961669921875, 579.4669189453125, 616.7376708984375, 654.0084228515625, 691.2791137695312, 728.5498657226562, 765.8206176757812, 803.0913696289062, 840.3621215820312, 877.6328735351562, 914.903564453125, 952.17431640625, 989.445068359375, 1026.7158203125, 1063.986572265625, 1101.25732421875, 1138.528076171875, 1175.798828125, 1213.069580078125, 1250.34033203125, 1287.611083984375, 1324.8818359375, 1362.152587890625, 1399.42333984375, 1436.694091796875, 1473.96484375, 1511.235595703125, 1548.50634765625, 1585.777099609375, 1623.0478515625, 1660.3184814453125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 4.0, 8.0, 11.0, 18.0, 14.0, 14.0, 26.0, 16.0, 27.0, 26.0, 25.0, 33.0, 56.0, 45.0, 84.0, 98.0, 96.0, 59.0, 47.0, 23.0, 23.0, 43.0, 19.0, 28.0, 18.0, 22.0, 28.0, 20.0, 10.0, 5.0, 8.0, 6.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-422.7027893066406, -410.2447814941406, -397.7867736816406, -385.3287658691406, -372.8707580566406, -360.4127502441406, -347.9547424316406, -335.4967346191406, -323.0387268066406, -310.5807189941406, -298.1227111816406, -285.6647033691406, -273.2066955566406, -260.7486877441406, -248.29067993164062, -235.83267211914062, -223.3746795654297, -210.9166717529297, -198.4586639404297, -186.0006561279297, -173.5426483154297, -161.0846405029297, -148.62664794921875, -136.16864013671875, -123.71062469482422, -111.25261688232422, -98.79460906982422, -86.33660888671875, -73.87860107421875, -61.420589447021484, -48.96258544921875, -36.50457763671875, -24.04656982421875, -11.588562965393066, 0.8694438934326172, 13.327449798583984, 25.785457611083984, 38.243465423583984, 50.70146942138672, 63.15947723388672, 75.61748504638672, 88.07549285888672, 100.53350067138672, 112.99150085449219, 125.44950866699219, 137.9075164794922, 150.3655242919922, 162.8235321044922, 175.2815399169922, 187.7395477294922, 200.1975555419922, 212.6555633544922, 225.1135711669922, 237.5715789794922, 250.02957153320312, 262.4875793457031, 274.9455871582031, 287.4035949707031, 299.8616027832031, 312.3196105957031, 324.7776184082031, 337.2356262207031, 349.6936340332031, 362.1516418457031, 374.6096496582031]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 7.0, 17.0, 15.0, 27.0, 32.0, 66.0, 89.0, 186.0, 433.0, 1006.0, 3503.0, 19732.0, 482022.0, 3561855.0, 112405.0, 9255.0, 2134.0, 733.0, 311.0, 161.0, 104.0, 47.0, 31.0, 29.0, 13.0, 14.0, 16.0, 7.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.9375, -62.470703125, -60.00390625, -57.537109375, -55.0703125, -52.603515625, -50.13671875, -47.669921875, -45.203125, -42.736328125, -40.26953125, -37.802734375, -35.3359375, -32.869140625, -30.40234375, -27.935546875, -25.46875, -23.001953125, -20.53515625, -18.068359375, -15.6015625, -13.134765625, -10.66796875, -8.201171875, -5.734375, -3.267578125, -0.80078125, 1.666015625, 4.1328125, 6.599609375, 9.06640625, 11.533203125, 14.0, 16.466796875, 18.93359375, 21.400390625, 23.8671875, 26.333984375, 28.80078125, 31.267578125, 33.734375, 36.201171875, 38.66796875, 41.134765625, 43.6015625, 46.068359375, 48.53515625, 51.001953125, 53.46875, 55.935546875, 58.40234375, 60.869140625, 63.3359375, 65.802734375, 68.26953125, 70.736328125, 73.203125, 75.669921875, 78.13671875, 80.603515625, 83.0703125, 85.537109375, 88.00390625, 90.470703125, 92.9375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 8.0, 12.0, 15.0, 21.0, 24.0, 28.0, 35.0, 46.0, 41.0, 62.0, 67.0, 50.0, 67.0, 65.0, 73.0, 64.0, 67.0, 56.0, 50.0, 29.0, 30.0, 16.0, 13.0, 13.0, 12.0, 10.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.40625, -32.21142578125, -31.0166015625, -29.82177734375, -28.626953125, -27.43212890625, -26.2373046875, -25.04248046875, -23.84765625, -22.65283203125, -21.4580078125, -20.26318359375, -19.068359375, -17.87353515625, -16.6787109375, -15.48388671875, -14.2890625, -13.09423828125, -11.8994140625, -10.70458984375, -9.509765625, -8.31494140625, -7.1201171875, -5.92529296875, -4.73046875, -3.53564453125, -2.3408203125, -1.14599609375, 0.048828125, 1.24365234375, 2.4384765625, 3.63330078125, 4.828125, 6.02294921875, 7.2177734375, 8.41259765625, 9.607421875, 10.80224609375, 11.9970703125, 13.19189453125, 14.38671875, 15.58154296875, 16.7763671875, 17.97119140625, 19.166015625, 20.36083984375, 21.5556640625, 22.75048828125, 23.9453125, 25.14013671875, 26.3349609375, 27.52978515625, 28.724609375, 29.91943359375, 31.1142578125, 32.30908203125, 33.50390625, 34.69873046875, 35.8935546875, 37.08837890625, 38.283203125, 39.47802734375, 40.6728515625, 41.86767578125, 43.0625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 3.0, 12.0, 8.0, 15.0, 16.0, 23.0, 35.0, 48.0, 96.0, 161.0, 370.0, 793.0, 2026.0, 5929.0, 22771.0, 148028.0, 2976504.0, 954356.0, 63681.0, 12875.0, 3908.0, 1398.0, 573.0, 253.0, 147.0, 67.0, 60.0, 33.0, 27.0, 18.0, 12.0, 13.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-59.0, -57.25439453125, -55.5087890625, -53.76318359375, -52.017578125, -50.27197265625, -48.5263671875, -46.78076171875, -45.03515625, -43.28955078125, -41.5439453125, -39.79833984375, -38.052734375, -36.30712890625, -34.5615234375, -32.81591796875, -31.0703125, -29.32470703125, -27.5791015625, -25.83349609375, -24.087890625, -22.34228515625, -20.5966796875, -18.85107421875, -17.10546875, -15.35986328125, -13.6142578125, -11.86865234375, -10.123046875, -8.37744140625, -6.6318359375, -4.88623046875, -3.140625, -1.39501953125, 0.3505859375, 2.09619140625, 3.841796875, 5.58740234375, 7.3330078125, 9.07861328125, 10.82421875, 12.56982421875, 14.3154296875, 16.06103515625, 17.806640625, 19.55224609375, 21.2978515625, 23.04345703125, 24.7890625, 26.53466796875, 28.2802734375, 30.02587890625, 31.771484375, 33.51708984375, 35.2626953125, 37.00830078125, 38.75390625, 40.49951171875, 42.2451171875, 43.99072265625, 45.736328125, 47.48193359375, 49.2275390625, 50.97314453125, 52.71875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 11.0, 12.0, 12.0, 13.0, 18.0, 28.0, 40.0, 55.0, 102.0, 140.0, 150.0, 243.0, 377.0, 567.0, 595.0, 505.0, 380.0, 217.0, 186.0, 107.0, 71.0, 61.0, 35.0, 32.0, 22.0, 18.0, 14.0, 6.0, 11.0, 10.0, 6.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-45.71875, -44.34423828125, -42.9697265625, -41.59521484375, -40.220703125, -38.84619140625, -37.4716796875, -36.09716796875, -34.72265625, -33.34814453125, -31.9736328125, -30.59912109375, -29.224609375, -27.85009765625, -26.4755859375, -25.10107421875, -23.7265625, -22.35205078125, -20.9775390625, -19.60302734375, -18.228515625, -16.85400390625, -15.4794921875, -14.10498046875, -12.73046875, -11.35595703125, -9.9814453125, -8.60693359375, -7.232421875, -5.85791015625, -4.4833984375, -3.10888671875, -1.734375, -0.35986328125, 1.0146484375, 2.38916015625, 3.763671875, 5.13818359375, 6.5126953125, 7.88720703125, 9.26171875, 10.63623046875, 12.0107421875, 13.38525390625, 14.759765625, 16.13427734375, 17.5087890625, 18.88330078125, 20.2578125, 21.63232421875, 23.0068359375, 24.38134765625, 25.755859375, 27.13037109375, 28.5048828125, 29.87939453125, 31.25390625, 32.62841796875, 34.0029296875, 35.37744140625, 36.751953125, 38.12646484375, 39.5009765625, 40.87548828125, 42.25]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 14.0, 19.0, 44.0, 92.0, 153.0, 191.0, 184.0, 133.0, 84.0, 29.0, 16.0, 8.0, 2.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-402.8458251953125, -385.7581787109375, -368.6705322265625, -351.5828857421875, -334.4952392578125, -317.4075927734375, -300.3199462890625, -283.2322998046875, -266.1446533203125, -249.0570068359375, -231.9693603515625, -214.8817138671875, -197.7940673828125, -180.7064208984375, -163.61878967285156, -146.53114318847656, -129.44351196289062, -112.35586547851562, -95.26821899414062, -78.18058013916016, -61.092933654785156, -44.005287170410156, -26.917648315429688, -9.830001831054688, 7.2576446533203125, 24.34528923034668, 41.43293380737305, 58.52057647705078, 75.60822296142578, 92.69586944580078, 109.78350830078125, 126.87115478515625, 143.95880126953125, 161.04644775390625, 178.13409423828125, 195.22174072265625, 212.30938720703125, 229.39703369140625, 246.4846649169922, 263.57232666015625, 280.65997314453125, 297.74761962890625, 314.83526611328125, 331.92291259765625, 349.01055908203125, 366.09820556640625, 383.18585205078125, 400.27349853515625, 417.3611145019531, 434.4487609863281, 451.5364074707031, 468.6240539550781, 485.7117004394531, 502.7993469238281, 519.886962890625, 536.974609375, 554.062255859375, 571.14990234375, 588.237548828125, 605.3251953125, 622.412841796875, 639.50048828125, 656.588134765625, 673.67578125, 690.763427734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 9.0, 8.0, 5.0, 10.0, 14.0, 18.0, 18.0, 32.0, 30.0, 31.0, 32.0, 32.0, 40.0, 42.0, 50.0, 32.0, 48.0, 39.0, 35.0, 52.0, 35.0, 37.0, 47.0, 29.0, 23.0, 49.0, 33.0, 27.0, 33.0, 27.0, 17.0, 18.0, 16.0, 11.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-288.9852600097656, -281.2853698730469, -273.58544921875, -265.88555908203125, -258.1856689453125, -250.48577880859375, -242.78587341308594, -235.08596801757812, -227.38607788085938, -219.68618774414062, -211.9862823486328, -204.286376953125, -196.58648681640625, -188.8865966796875, -181.1866912841797, -173.48678588867188, -165.78689575195312, -158.08700561523438, -150.38710021972656, -142.68719482421875, -134.9873046875, -127.28740692138672, -119.58750915527344, -111.88761138916016, -104.18771362304688, -96.4878158569336, -88.78791809082031, -81.08802032470703, -73.38812255859375, -65.68822479248047, -57.98832702636719, -50.288429260253906, -42.58854675292969, -34.888648986816406, -27.188751220703125, -19.488853454589844, -11.788955688476562, -4.089057922363281, 3.61083984375, 11.310737609863281, 19.010635375976562, 26.710533142089844, 34.410430908203125, 42.110328674316406, 49.81022644042969, 57.51012420654297, 65.21002197265625, 72.90991973876953, 80.60981750488281, 88.3097152709961, 96.00961303710938, 103.70951080322266, 111.40940856933594, 119.10930633544922, 126.8092041015625, 134.50909423828125, 142.20899963378906, 149.90890502929688, 157.60879516601562, 165.30868530273438, 173.0085906982422, 180.70849609375, 188.40838623046875, 196.1082763671875, 203.8081817626953]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 14.0, 14.0, 16.0, 31.0, 41.0, 78.0, 108.0, 193.0, 383.0, 799.0, 1842.0, 5409.0, 18370.0, 75790.0, 336399.0, 453142.0, 116650.0, 27262.0, 7418.0, 2547.0, 973.0, 469.0, 229.0, 133.0, 70.0, 71.0, 35.0, 19.0, 15.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-72.0, -70.0615234375, -68.123046875, -66.1845703125, -64.24609375, -62.3076171875, -60.369140625, -58.4306640625, -56.4921875, -54.5537109375, -52.615234375, -50.6767578125, -48.73828125, -46.7998046875, -44.861328125, -42.9228515625, -40.984375, -39.0458984375, -37.107421875, -35.1689453125, -33.23046875, -31.2919921875, -29.353515625, -27.4150390625, -25.4765625, -23.5380859375, -21.599609375, -19.6611328125, -17.72265625, -15.7841796875, -13.845703125, -11.9072265625, -9.96875, -8.0302734375, -6.091796875, -4.1533203125, -2.21484375, -0.2763671875, 1.662109375, 3.6005859375, 5.5390625, 7.4775390625, 9.416015625, 11.3544921875, 13.29296875, 15.2314453125, 17.169921875, 19.1083984375, 21.046875, 22.9853515625, 24.923828125, 26.8623046875, 28.80078125, 30.7392578125, 32.677734375, 34.6162109375, 36.5546875, 38.4931640625, 40.431640625, 42.3701171875, 44.30859375, 46.2470703125, 48.185546875, 50.1240234375, 52.0625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 11.0, 12.0, 15.0, 25.0, 30.0, 34.0, 35.0, 45.0, 56.0, 68.0, 60.0, 67.0, 63.0, 70.0, 54.0, 69.0, 48.0, 47.0, 38.0, 32.0, 23.0, 26.0, 17.0, 10.0, 13.0, 5.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28125, -33.07470703125, -31.8681640625, -30.66162109375, -29.455078125, -28.24853515625, -27.0419921875, -25.83544921875, -24.62890625, -23.42236328125, -22.2158203125, -21.00927734375, -19.802734375, -18.59619140625, -17.3896484375, -16.18310546875, -14.9765625, -13.77001953125, -12.5634765625, -11.35693359375, -10.150390625, -8.94384765625, -7.7373046875, -6.53076171875, -5.32421875, -4.11767578125, -2.9111328125, -1.70458984375, -0.498046875, 0.70849609375, 1.9150390625, 3.12158203125, 4.328125, 5.53466796875, 6.7412109375, 7.94775390625, 9.154296875, 10.36083984375, 11.5673828125, 12.77392578125, 13.98046875, 15.18701171875, 16.3935546875, 17.60009765625, 18.806640625, 20.01318359375, 21.2197265625, 22.42626953125, 23.6328125, 24.83935546875, 26.0458984375, 27.25244140625, 28.458984375, 29.66552734375, 30.8720703125, 32.07861328125, 33.28515625, 34.49169921875, 35.6982421875, 36.90478515625, 38.111328125, 39.31787109375, 40.5244140625, 41.73095703125, 42.9375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 12.0, 20.0, 33.0, 57.0, 78.0, 84.0, 186.0, 262.0, 461.0, 929.0, 2567.0, 12376.0, 139136.0, 812446.0, 68484.0, 7733.0, 1811.0, 783.0, 397.0, 252.0, 128.0, 101.0, 61.0, 39.0, 23.0, 16.0, 13.0, 16.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.1875, -111.8359375, -108.484375, -105.1328125, -101.78125, -98.4296875, -95.078125, -91.7265625, -88.375, -85.0234375, -81.671875, -78.3203125, -74.96875, -71.6171875, -68.265625, -64.9140625, -61.5625, -58.2109375, -54.859375, -51.5078125, -48.15625, -44.8046875, -41.453125, -38.1015625, -34.75, -31.3984375, -28.046875, -24.6953125, -21.34375, -17.9921875, -14.640625, -11.2890625, -7.9375, -4.5859375, -1.234375, 2.1171875, 5.46875, 8.8203125, 12.171875, 15.5234375, 18.875, 22.2265625, 25.578125, 28.9296875, 32.28125, 35.6328125, 38.984375, 42.3359375, 45.6875, 49.0390625, 52.390625, 55.7421875, 59.09375, 62.4453125, 65.796875, 69.1484375, 72.5, 75.8515625, 79.203125, 82.5546875, 85.90625, 89.2578125, 92.609375, 95.9609375, 99.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 5.0, 3.0, 12.0, 10.0, 12.0, 15.0, 22.0, 19.0, 21.0, 35.0, 41.0, 36.0, 46.0, 52.0, 60.0, 49.0, 59.0, 50.0, 64.0, 47.0, 52.0, 42.0, 42.0, 39.0, 36.0, 28.0, 18.0, 13.0, 20.0, 7.0, 6.0, 3.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.4375, -100.8896484375, -97.341796875, -93.7939453125, -90.24609375, -86.6982421875, -83.150390625, -79.6025390625, -76.0546875, -72.5068359375, -68.958984375, -65.4111328125, -61.86328125, -58.3154296875, -54.767578125, -51.2197265625, -47.671875, -44.1240234375, -40.576171875, -37.0283203125, -33.48046875, -29.9326171875, -26.384765625, -22.8369140625, -19.2890625, -15.7412109375, -12.193359375, -8.6455078125, -5.09765625, -1.5498046875, 1.998046875, 5.5458984375, 9.09375, 12.6416015625, 16.189453125, 19.7373046875, 23.28515625, 26.8330078125, 30.380859375, 33.9287109375, 37.4765625, 41.0244140625, 44.572265625, 48.1201171875, 51.66796875, 55.2158203125, 58.763671875, 62.3115234375, 65.859375, 69.4072265625, 72.955078125, 76.5029296875, 80.05078125, 83.5986328125, 87.146484375, 90.6943359375, 94.2421875, 97.7900390625, 101.337890625, 104.8857421875, 108.43359375, 111.9814453125, 115.529296875, 119.0771484375, 122.625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 7.0, 8.0, 9.0, 10.0, 10.0, 14.0, 14.0, 19.0, 33.0, 51.0, 65.0, 113.0, 205.0, 399.0, 908.0, 2731.0, 11236.0, 72302.0, 793535.0, 141911.0, 18691.0, 3921.0, 1155.0, 526.0, 256.0, 132.0, 78.0, 61.0, 36.0, 30.0, 31.0, 11.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -27.13037109375, -26.2451171875, -25.35986328125, -24.474609375, -23.58935546875, -22.7041015625, -21.81884765625, -20.93359375, -20.04833984375, -19.1630859375, -18.27783203125, -17.392578125, -16.50732421875, -15.6220703125, -14.73681640625, -13.8515625, -12.96630859375, -12.0810546875, -11.19580078125, -10.310546875, -9.42529296875, -8.5400390625, -7.65478515625, -6.76953125, -5.88427734375, -4.9990234375, -4.11376953125, -3.228515625, -2.34326171875, -1.4580078125, -0.57275390625, 0.3125, 1.19775390625, 2.0830078125, 2.96826171875, 3.853515625, 4.73876953125, 5.6240234375, 6.50927734375, 7.39453125, 8.27978515625, 9.1650390625, 10.05029296875, 10.935546875, 11.82080078125, 12.7060546875, 13.59130859375, 14.4765625, 15.36181640625, 16.2470703125, 17.13232421875, 18.017578125, 18.90283203125, 19.7880859375, 20.67333984375, 21.55859375, 22.44384765625, 23.3291015625, 24.21435546875, 25.099609375, 25.98486328125, 26.8701171875, 27.75537109375, 28.640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 2.0, 5.0, 7.0, 8.0, 9.0, 10.0, 10.0, 12.0, 12.0, 25.0, 21.0, 43.0, 42.0, 48.0, 72.0, 93.0, 111.0, 101.0, 73.0, 56.0, 45.0, 42.0, 25.0, 23.0, 19.0, 17.0, 12.0, 15.0, 7.0, 11.0, 5.0, 2.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004932403564453125, -0.0047754645347595215, -0.004618525505065918, -0.0044615864753723145, -0.004304647445678711, -0.004147708415985107, -0.003990769386291504, -0.0038338303565979004, -0.003676891326904297, -0.0035199522972106934, -0.00336301326751709, -0.0032060742378234863, -0.003049135208129883, -0.0028921961784362793, -0.0027352571487426758, -0.0025783181190490723, -0.0024213790893554688, -0.0022644400596618652, -0.0021075010299682617, -0.0019505620002746582, -0.0017936229705810547, -0.0016366839408874512, -0.0014797449111938477, -0.0013228058815002441, -0.0011658668518066406, -0.0010089278221130371, -0.0008519887924194336, -0.0006950497627258301, -0.0005381107330322266, -0.00038117170333862305, -0.00022423267364501953, -6.729364395141602e-05, 8.96453857421875e-05, 0.000246584415435791, 0.00040352344512939453, 0.000560462474822998, 0.0007174015045166016, 0.0008743405342102051, 0.0010312795639038086, 0.0011882185935974121, 0.0013451576232910156, 0.0015020966529846191, 0.0016590356826782227, 0.0018159747123718262, 0.0019729137420654297, 0.002129852771759033, 0.0022867918014526367, 0.0024437308311462402, 0.0026006698608398438, 0.0027576088905334473, 0.0029145479202270508, 0.0030714869499206543, 0.003228425979614258, 0.0033853650093078613, 0.003542304039001465, 0.0036992430686950684, 0.003856182098388672, 0.004013121128082275, 0.004170060157775879, 0.004326999187469482, 0.004483938217163086, 0.0046408772468566895, 0.004797816276550293, 0.0049547553062438965, 0.0051116943359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 6.0, 3.0, 5.0, 7.0, 5.0, 6.0, 9.0, 17.0, 20.0, 34.0, 42.0, 73.0, 94.0, 151.0, 236.0, 390.0, 652.0, 1435.0, 3172.0, 9067.0, 32412.0, 165598.0, 696407.0, 103860.0, 22696.0, 6808.0, 2586.0, 1177.0, 606.0, 347.0, 202.0, 138.0, 90.0, 58.0, 48.0, 33.0, 20.0, 18.0, 10.0, 9.0, 4.0, 7.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.734375, -18.13720703125, -17.5400390625, -16.94287109375, -16.345703125, -15.74853515625, -15.1513671875, -14.55419921875, -13.95703125, -13.35986328125, -12.7626953125, -12.16552734375, -11.568359375, -10.97119140625, -10.3740234375, -9.77685546875, -9.1796875, -8.58251953125, -7.9853515625, -7.38818359375, -6.791015625, -6.19384765625, -5.5966796875, -4.99951171875, -4.40234375, -3.80517578125, -3.2080078125, -2.61083984375, -2.013671875, -1.41650390625, -0.8193359375, -0.22216796875, 0.375, 0.97216796875, 1.5693359375, 2.16650390625, 2.763671875, 3.36083984375, 3.9580078125, 4.55517578125, 5.15234375, 5.74951171875, 6.3466796875, 6.94384765625, 7.541015625, 8.13818359375, 8.7353515625, 9.33251953125, 9.9296875, 10.52685546875, 11.1240234375, 11.72119140625, 12.318359375, 12.91552734375, 13.5126953125, 14.10986328125, 14.70703125, 15.30419921875, 15.9013671875, 16.49853515625, 17.095703125, 17.69287109375, 18.2900390625, 18.88720703125, 19.484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 12.0, 6.0, 11.0, 18.0, 20.0, 28.0, 44.0, 49.0, 68.0, 88.0, 105.0, 134.0, 97.0, 77.0, 69.0, 35.0, 27.0, 38.0, 21.0, 13.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.265625, -22.492919921875, -21.72021484375, -20.947509765625, -20.1748046875, -19.402099609375, -18.62939453125, -17.856689453125, -17.083984375, -16.311279296875, -15.53857421875, -14.765869140625, -13.9931640625, -13.220458984375, -12.44775390625, -11.675048828125, -10.90234375, -10.129638671875, -9.35693359375, -8.584228515625, -7.8115234375, -7.038818359375, -6.26611328125, -5.493408203125, -4.720703125, -3.947998046875, -3.17529296875, -2.402587890625, -1.6298828125, -0.857177734375, -0.08447265625, 0.688232421875, 1.4609375, 2.233642578125, 3.00634765625, 3.779052734375, 4.5517578125, 5.324462890625, 6.09716796875, 6.869873046875, 7.642578125, 8.415283203125, 9.18798828125, 9.960693359375, 10.7333984375, 11.506103515625, 12.27880859375, 13.051513671875, 13.82421875, 14.596923828125, 15.36962890625, 16.142333984375, 16.9150390625, 17.687744140625, 18.46044921875, 19.233154296875, 20.005859375, 20.778564453125, 21.55126953125, 22.323974609375, 23.0966796875, 23.869384765625, 24.64208984375, 25.414794921875, 26.1875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 11.0, 16.0, 31.0, 39.0, 98.0, 174.0, 302.0, 157.0, 76.0, 38.0, 25.0, 11.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-782.902587890625, -764.0009155273438, -745.0992431640625, -726.1976318359375, -707.2959594726562, -688.394287109375, -669.4926147460938, -650.5909423828125, -631.6893310546875, -612.7876586914062, -593.885986328125, -574.984375, -556.0827026367188, -537.1810302734375, -518.2793579101562, -499.377685546875, -480.47601318359375, -461.5743408203125, -442.6726989746094, -423.7710266113281, -404.869384765625, -385.96771240234375, -367.0660400390625, -348.16436767578125, -329.2627258300781, -310.3610534667969, -291.45941162109375, -272.5577392578125, -253.6560821533203, -234.75442504882812, -215.85275268554688, -196.9510955810547, -178.0494384765625, -159.1477813720703, -140.24612426757812, -121.34445190429688, -102.44279479980469, -83.5411376953125, -64.63947296142578, -45.73780822753906, -26.836151123046875, -7.934490203857422, 10.967170715332031, 29.868831634521484, 48.77049255371094, 67.67214965820312, 86.57381439208984, 105.47547912597656, 124.37713623046875, 143.27879333496094, 162.18045043945312, 181.08212280273438, 199.98377990722656, 218.88543701171875, 237.787109375, 256.68878173828125, 275.5904235839844, 294.4920959472656, 313.39373779296875, 332.29541015625, 351.19708251953125, 370.0987243652344, 389.0003967285156, 407.90203857421875, 426.8037109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 2.0, 3.0, 9.0, 6.0, 10.0, 8.0, 13.0, 15.0, 15.0, 26.0, 27.0, 30.0, 26.0, 31.0, 32.0, 34.0, 47.0, 67.0, 104.0, 97.0, 53.0, 46.0, 37.0, 30.0, 28.0, 28.0, 26.0, 20.0, 22.0, 16.0, 17.0, 13.0, 13.0, 12.0, 7.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.5806884765625, -352.6942138671875, -340.8077392578125, -328.9212646484375, -317.0347900390625, -305.1483459472656, -293.2618713378906, -281.3753967285156, -269.4889221191406, -257.6024475097656, -245.71597290039062, -233.8295135498047, -221.9430389404297, -210.0565643310547, -198.17010498046875, -186.28363037109375, -174.39715576171875, -162.51068115234375, -150.62420654296875, -138.7377471923828, -126.85127258300781, -114.96479797363281, -103.07833099365234, -91.19186401367188, -79.30538940429688, -67.41891479492188, -55.532447814941406, -43.64597702026367, -31.759506225585938, -19.873035430908203, -7.986564636230469, 3.89990234375, 15.786376953125, 27.672847747802734, 39.55931854248047, 51.4457893371582, 63.33226013183594, 75.21873474121094, 87.1052017211914, 98.99166870117188, 110.87814331054688, 122.76461791992188, 134.65109252929688, 146.5375518798828, 158.4240264892578, 170.3105010986328, 182.19696044921875, 194.08343505859375, 205.96990966796875, 217.85638427734375, 229.74285888671875, 241.6293182373047, 253.5157928466797, 265.4022521972656, 277.2887268066406, 289.1752014160156, 301.0616760253906, 312.9481506347656, 324.8346252441406, 336.7210998535156, 348.6075439453125, 360.4940185546875, 372.3804931640625, 384.2669677734375, 396.1534423828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 12.0, 10.0, 16.0, 14.0, 33.0, 25.0, 49.0, 73.0, 132.0, 178.0, 357.0, 778.0, 2397.0, 10229.0, 89069.0, 2551905.0, 1480152.0, 48028.0, 7332.0, 1868.0, 676.0, 320.0, 193.0, 138.0, 74.0, 63.0, 36.0, 17.0, 24.0, 26.0, 11.0, 11.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-65.375, -63.1884765625, -61.001953125, -58.8154296875, -56.62890625, -54.4423828125, -52.255859375, -50.0693359375, -47.8828125, -45.6962890625, -43.509765625, -41.3232421875, -39.13671875, -36.9501953125, -34.763671875, -32.5771484375, -30.390625, -28.2041015625, -26.017578125, -23.8310546875, -21.64453125, -19.4580078125, -17.271484375, -15.0849609375, -12.8984375, -10.7119140625, -8.525390625, -6.3388671875, -4.15234375, -1.9658203125, 0.220703125, 2.4072265625, 4.59375, 6.7802734375, 8.966796875, 11.1533203125, 13.33984375, 15.5263671875, 17.712890625, 19.8994140625, 22.0859375, 24.2724609375, 26.458984375, 28.6455078125, 30.83203125, 33.0185546875, 35.205078125, 37.3916015625, 39.578125, 41.7646484375, 43.951171875, 46.1376953125, 48.32421875, 50.5107421875, 52.697265625, 54.8837890625, 57.0703125, 59.2568359375, 61.443359375, 63.6298828125, 65.81640625, 68.0029296875, 70.189453125, 72.3759765625, 74.5625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 7.0, 5.0, 7.0, 12.0, 6.0, 10.0, 13.0, 16.0, 18.0, 30.0, 30.0, 45.0, 44.0, 41.0, 42.0, 57.0, 46.0, 53.0, 52.0, 36.0, 45.0, 48.0, 46.0, 37.0, 28.0, 37.0, 25.0, 23.0, 25.0, 16.0, 21.0, 19.0, 12.0, 12.0, 11.0, 5.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.265625, -24.356689453125, -23.44775390625, -22.538818359375, -21.6298828125, -20.720947265625, -19.81201171875, -18.903076171875, -17.994140625, -17.085205078125, -16.17626953125, -15.267333984375, -14.3583984375, -13.449462890625, -12.54052734375, -11.631591796875, -10.72265625, -9.813720703125, -8.90478515625, -7.995849609375, -7.0869140625, -6.177978515625, -5.26904296875, -4.360107421875, -3.451171875, -2.542236328125, -1.63330078125, -0.724365234375, 0.1845703125, 1.093505859375, 2.00244140625, 2.911376953125, 3.8203125, 4.729248046875, 5.63818359375, 6.547119140625, 7.4560546875, 8.364990234375, 9.27392578125, 10.182861328125, 11.091796875, 12.000732421875, 12.90966796875, 13.818603515625, 14.7275390625, 15.636474609375, 16.54541015625, 17.454345703125, 18.36328125, 19.272216796875, 20.18115234375, 21.090087890625, 21.9990234375, 22.907958984375, 23.81689453125, 24.725830078125, 25.634765625, 26.543701171875, 27.45263671875, 28.361572265625, 29.2705078125, 30.179443359375, 31.08837890625, 31.997314453125, 32.90625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 5.0, 9.0, 22.0, 25.0, 40.0, 55.0, 89.0, 154.0, 347.0, 1021.0, 3590.0, 20414.0, 359800.0, 3670385.0, 123828.0, 11000.0, 2263.0, 641.0, 254.0, 138.0, 61.0, 55.0, 20.0, 16.0, 5.0, 10.0, 8.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -67.8330078125, -65.353515625, -62.8740234375, -60.39453125, -57.9150390625, -55.435546875, -52.9560546875, -50.4765625, -47.9970703125, -45.517578125, -43.0380859375, -40.55859375, -38.0791015625, -35.599609375, -33.1201171875, -30.640625, -28.1611328125, -25.681640625, -23.2021484375, -20.72265625, -18.2431640625, -15.763671875, -13.2841796875, -10.8046875, -8.3251953125, -5.845703125, -3.3662109375, -0.88671875, 1.5927734375, 4.072265625, 6.5517578125, 9.03125, 11.5107421875, 13.990234375, 16.4697265625, 18.94921875, 21.4287109375, 23.908203125, 26.3876953125, 28.8671875, 31.3466796875, 33.826171875, 36.3056640625, 38.78515625, 41.2646484375, 43.744140625, 46.2236328125, 48.703125, 51.1826171875, 53.662109375, 56.1416015625, 58.62109375, 61.1005859375, 63.580078125, 66.0595703125, 68.5390625, 71.0185546875, 73.498046875, 75.9775390625, 78.45703125, 80.9365234375, 83.416015625, 85.8955078125, 88.375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 14.0, 16.0, 18.0, 28.0, 36.0, 43.0, 75.0, 118.0, 185.0, 276.0, 472.0, 582.0, 718.0, 574.0, 306.0, 232.0, 135.0, 73.0, 50.0, 25.0, 18.0, 14.0, 17.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4375, -58.55419921875, -56.6708984375, -54.78759765625, -52.904296875, -51.02099609375, -49.1376953125, -47.25439453125, -45.37109375, -43.48779296875, -41.6044921875, -39.72119140625, -37.837890625, -35.95458984375, -34.0712890625, -32.18798828125, -30.3046875, -28.42138671875, -26.5380859375, -24.65478515625, -22.771484375, -20.88818359375, -19.0048828125, -17.12158203125, -15.23828125, -13.35498046875, -11.4716796875, -9.58837890625, -7.705078125, -5.82177734375, -3.9384765625, -2.05517578125, -0.171875, 1.71142578125, 3.5947265625, 5.47802734375, 7.361328125, 9.24462890625, 11.1279296875, 13.01123046875, 14.89453125, 16.77783203125, 18.6611328125, 20.54443359375, 22.427734375, 24.31103515625, 26.1943359375, 28.07763671875, 29.9609375, 31.84423828125, 33.7275390625, 35.61083984375, 37.494140625, 39.37744140625, 41.2607421875, 43.14404296875, 45.02734375, 46.91064453125, 48.7939453125, 50.67724609375, 52.560546875, 54.44384765625, 56.3271484375, 58.21044921875, 60.09375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 14.0, 27.0, 51.0, 122.0, 231.0, 242.0, 187.0, 79.0, 20.0, 12.0, 6.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1182.080810546875, -1160.336669921875, -1138.5926513671875, -1116.8485107421875, -1095.1043701171875, -1073.3603515625, -1051.6162109375, -1029.8720703125, -1008.1279907226562, -986.3839111328125, -964.6397705078125, -942.8956909179688, -921.151611328125, -899.407470703125, -877.6633911132812, -855.9193115234375, -834.1751708984375, -812.4310913085938, -790.6869506835938, -768.94287109375, -747.19873046875, -725.4546508789062, -703.7105712890625, -681.9664306640625, -660.2223510742188, -638.478271484375, -616.734130859375, -594.9900512695312, -573.2459716796875, -551.5018310546875, -529.7577514648438, -508.0136413574219, -486.2695617675781, -464.52545166015625, -442.7813720703125, -421.0372619628906, -399.29315185546875, -377.5490417480469, -355.804931640625, -334.06085205078125, -312.3167419433594, -290.5726318359375, -268.82855224609375, -247.08444213867188, -225.34033203125, -203.59622192382812, -181.8521270751953, -160.1080322265625, -138.36392211914062, -116.61981964111328, -94.87571716308594, -73.1316146850586, -51.38751220703125, -29.643409729003906, -7.8993072509765625, 13.84478759765625, 35.588897705078125, 57.33300018310547, 79.07710266113281, 100.82120513916016, 122.5653076171875, 144.30941772460938, 166.0535125732422, 187.797607421875, 209.54171752929688]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 5.0, 5.0, 16.0, 9.0, 15.0, 8.0, 20.0, 26.0, 20.0, 34.0, 26.0, 33.0, 38.0, 42.0, 34.0, 49.0, 54.0, 45.0, 45.0, 43.0, 36.0, 27.0, 38.0, 42.0, 32.0, 27.0, 29.0, 24.0, 28.0, 20.0, 9.0, 17.0, 18.0, 15.0, 11.0, 8.0, 5.0, 5.0, 7.0, 3.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-232.91329956054688, -225.816162109375, -218.71902465820312, -211.62188720703125, -204.52474975585938, -197.4276123046875, -190.33047485351562, -183.23333740234375, -176.13619995117188, -169.0390625, -161.94192504882812, -154.84478759765625, -147.74765014648438, -140.6505126953125, -133.55337524414062, -126.45623779296875, -119.35910034179688, -112.261962890625, -105.16482543945312, -98.06768798828125, -90.97055053710938, -83.8734130859375, -76.77627563476562, -69.67913818359375, -62.582000732421875, -55.48486328125, -48.387725830078125, -41.29058837890625, -34.193450927734375, -27.0963134765625, -19.999176025390625, -12.90203857421875, -5.8048858642578125, 1.2922515869140625, 8.389389038085938, 15.486526489257812, 22.583663940429688, 29.680801391601562, 36.77793884277344, 43.87507629394531, 50.97221374511719, 58.06935119628906, 65.16648864746094, 72.26362609863281, 79.36076354980469, 86.45790100097656, 93.55503845214844, 100.65217590332031, 107.74931335449219, 114.84645080566406, 121.94358825683594, 129.0407257080078, 136.1378631591797, 143.23500061035156, 150.33213806152344, 157.4292755126953, 164.5264129638672, 171.62355041503906, 178.72068786621094, 185.8178253173828, 192.9149627685547, 200.01210021972656, 207.10923767089844, 214.2063751220703, 221.3035125732422]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 10.0, 9.0, 11.0, 24.0, 39.0, 81.0, 155.0, 415.0, 1197.0, 3683.0, 13863.0, 66688.0, 442617.0, 435309.0, 65014.0, 13792.0, 3723.0, 1143.0, 407.0, 159.0, 93.0, 49.0, 20.0, 22.0, 8.0, 0.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.75, -82.015625, -79.28125, -76.546875, -73.8125, -71.078125, -68.34375, -65.609375, -62.875, -60.140625, -57.40625, -54.671875, -51.9375, -49.203125, -46.46875, -43.734375, -41.0, -38.265625, -35.53125, -32.796875, -30.0625, -27.328125, -24.59375, -21.859375, -19.125, -16.390625, -13.65625, -10.921875, -8.1875, -5.453125, -2.71875, 0.015625, 2.75, 5.484375, 8.21875, 10.953125, 13.6875, 16.421875, 19.15625, 21.890625, 24.625, 27.359375, 30.09375, 32.828125, 35.5625, 38.296875, 41.03125, 43.765625, 46.5, 49.234375, 51.96875, 54.703125, 57.4375, 60.171875, 62.90625, 65.640625, 68.375, 71.109375, 73.84375, 76.578125, 79.3125, 82.046875, 84.78125, 87.515625, 90.25]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 7.0, 6.0, 12.0, 15.0, 16.0, 18.0, 22.0, 15.0, 26.0, 29.0, 40.0, 47.0, 53.0, 39.0, 49.0, 42.0, 46.0, 56.0, 35.0, 51.0, 49.0, 43.0, 37.0, 37.0, 25.0, 28.0, 26.0, 28.0, 16.0, 18.0, 12.0, 14.0, 6.0, 5.0, 5.0, 9.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.953125, -25.034423828125, -24.11572265625, -23.197021484375, -22.2783203125, -21.359619140625, -20.44091796875, -19.522216796875, -18.603515625, -17.684814453125, -16.76611328125, -15.847412109375, -14.9287109375, -14.010009765625, -13.09130859375, -12.172607421875, -11.25390625, -10.335205078125, -9.41650390625, -8.497802734375, -7.5791015625, -6.660400390625, -5.74169921875, -4.822998046875, -3.904296875, -2.985595703125, -2.06689453125, -1.148193359375, -0.2294921875, 0.689208984375, 1.60791015625, 2.526611328125, 3.4453125, 4.364013671875, 5.28271484375, 6.201416015625, 7.1201171875, 8.038818359375, 8.95751953125, 9.876220703125, 10.794921875, 11.713623046875, 12.63232421875, 13.551025390625, 14.4697265625, 15.388427734375, 16.30712890625, 17.225830078125, 18.14453125, 19.063232421875, 19.98193359375, 20.900634765625, 21.8193359375, 22.738037109375, 23.65673828125, 24.575439453125, 25.494140625, 26.412841796875, 27.33154296875, 28.250244140625, 29.1689453125, 30.087646484375, 31.00634765625, 31.925048828125, 32.84375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 1.0, 5.0, 12.0, 9.0, 22.0, 29.0, 33.0, 43.0, 89.0, 117.0, 150.0, 248.0, 398.0, 584.0, 1115.0, 2407.0, 8985.0, 79718.0, 860347.0, 80090.0, 8934.0, 2371.0, 1092.0, 598.0, 388.0, 235.0, 157.0, 112.0, 73.0, 56.0, 45.0, 25.0, 16.0, 10.0, 11.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-101.8125, -98.361328125, -94.91015625, -91.458984375, -88.0078125, -84.556640625, -81.10546875, -77.654296875, -74.203125, -70.751953125, -67.30078125, -63.849609375, -60.3984375, -56.947265625, -53.49609375, -50.044921875, -46.59375, -43.142578125, -39.69140625, -36.240234375, -32.7890625, -29.337890625, -25.88671875, -22.435546875, -18.984375, -15.533203125, -12.08203125, -8.630859375, -5.1796875, -1.728515625, 1.72265625, 5.173828125, 8.625, 12.076171875, 15.52734375, 18.978515625, 22.4296875, 25.880859375, 29.33203125, 32.783203125, 36.234375, 39.685546875, 43.13671875, 46.587890625, 50.0390625, 53.490234375, 56.94140625, 60.392578125, 63.84375, 67.294921875, 70.74609375, 74.197265625, 77.6484375, 81.099609375, 84.55078125, 88.001953125, 91.453125, 94.904296875, 98.35546875, 101.806640625, 105.2578125, 108.708984375, 112.16015625, 115.611328125, 119.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 3.0, 7.0, 4.0, 10.0, 11.0, 20.0, 16.0, 20.0, 26.0, 37.0, 28.0, 44.0, 57.0, 53.0, 49.0, 79.0, 60.0, 60.0, 61.0, 61.0, 43.0, 41.0, 30.0, 28.0, 29.0, 15.0, 21.0, 18.0, 15.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.625, -117.646484375, -113.66796875, -109.689453125, -105.7109375, -101.732421875, -97.75390625, -93.775390625, -89.796875, -85.818359375, -81.83984375, -77.861328125, -73.8828125, -69.904296875, -65.92578125, -61.947265625, -57.96875, -53.990234375, -50.01171875, -46.033203125, -42.0546875, -38.076171875, -34.09765625, -30.119140625, -26.140625, -22.162109375, -18.18359375, -14.205078125, -10.2265625, -6.248046875, -2.26953125, 1.708984375, 5.6875, 9.666015625, 13.64453125, 17.623046875, 21.6015625, 25.580078125, 29.55859375, 33.537109375, 37.515625, 41.494140625, 45.47265625, 49.451171875, 53.4296875, 57.408203125, 61.38671875, 65.365234375, 69.34375, 73.322265625, 77.30078125, 81.279296875, 85.2578125, 89.236328125, 93.21484375, 97.193359375, 101.171875, 105.150390625, 109.12890625, 113.107421875, 117.0859375, 121.064453125, 125.04296875, 129.021484375, 133.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 14.0, 12.0, 33.0, 28.0, 36.0, 79.0, 122.0, 212.0, 407.0, 782.0, 2032.0, 6478.0, 44538.0, 886047.0, 93470.0, 9554.0, 2629.0, 986.0, 447.0, 229.0, 125.0, 82.0, 50.0, 35.0, 26.0, 13.0, 17.0, 12.0, 14.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.703125, -30.633056640625, -29.56298828125, -28.492919921875, -27.4228515625, -26.352783203125, -25.28271484375, -24.212646484375, -23.142578125, -22.072509765625, -21.00244140625, -19.932373046875, -18.8623046875, -17.792236328125, -16.72216796875, -15.652099609375, -14.58203125, -13.511962890625, -12.44189453125, -11.371826171875, -10.3017578125, -9.231689453125, -8.16162109375, -7.091552734375, -6.021484375, -4.951416015625, -3.88134765625, -2.811279296875, -1.7412109375, -0.671142578125, 0.39892578125, 1.468994140625, 2.5390625, 3.609130859375, 4.67919921875, 5.749267578125, 6.8193359375, 7.889404296875, 8.95947265625, 10.029541015625, 11.099609375, 12.169677734375, 13.23974609375, 14.309814453125, 15.3798828125, 16.449951171875, 17.52001953125, 18.590087890625, 19.66015625, 20.730224609375, 21.80029296875, 22.870361328125, 23.9404296875, 25.010498046875, 26.08056640625, 27.150634765625, 28.220703125, 29.290771484375, 30.36083984375, 31.430908203125, 32.5009765625, 33.571044921875, 34.64111328125, 35.711181640625, 36.78125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 2.0, 8.0, 9.0, 13.0, 12.0, 14.0, 15.0, 35.0, 47.0, 61.0, 87.0, 144.0, 156.0, 115.0, 67.0, 52.0, 29.0, 33.0, 24.0, 14.0, 18.0, 6.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005748748779296875, -0.005529940128326416, -0.005311131477355957, -0.005092322826385498, -0.004873514175415039, -0.00465470552444458, -0.004435896873474121, -0.004217088222503662, -0.003998279571533203, -0.003779470920562744, -0.003560662269592285, -0.003341853618621826, -0.003123044967651367, -0.002904236316680908, -0.0026854276657104492, -0.0024666190147399902, -0.0022478103637695312, -0.0020290017127990723, -0.0018101930618286133, -0.0015913844108581543, -0.0013725757598876953, -0.0011537671089172363, -0.0009349584579467773, -0.0007161498069763184, -0.0004973411560058594, -0.0002785325050354004, -5.9723854064941406e-05, 0.00015908479690551758, 0.00037789344787597656, 0.0005967020988464355, 0.0008155107498168945, 0.0010343194007873535, 0.0012531280517578125, 0.0014719367027282715, 0.0016907453536987305, 0.0019095540046691895, 0.0021283626556396484, 0.0023471713066101074, 0.0025659799575805664, 0.0027847886085510254, 0.0030035972595214844, 0.0032224059104919434, 0.0034412145614624023, 0.0036600232124328613, 0.0038788318634033203, 0.004097640514373779, 0.004316449165344238, 0.004535257816314697, 0.004754066467285156, 0.004972875118255615, 0.005191683769226074, 0.005410492420196533, 0.005629301071166992, 0.005848109722137451, 0.00606691837310791, 0.006285727024078369, 0.006504535675048828, 0.006723344326019287, 0.006942152976989746, 0.007160961627960205, 0.007379770278930664, 0.007598578929901123, 0.007817387580871582, 0.008036196231842041, 0.0082550048828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 12.0, 13.0, 20.0, 11.0, 29.0, 26.0, 48.0, 60.0, 89.0, 122.0, 170.0, 240.0, 391.0, 731.0, 1300.0, 2721.0, 6852.0, 24499.0, 207295.0, 734738.0, 50904.0, 10450.0, 3749.0, 1711.0, 881.0, 491.0, 308.0, 204.0, 130.0, 86.0, 71.0, 45.0, 28.0, 33.0, 11.0, 10.0, 14.0, 14.0, 10.0, 4.0, 7.0, 3.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0], "bins": [-24.265625, -23.576171875, -22.88671875, -22.197265625, -21.5078125, -20.818359375, -20.12890625, -19.439453125, -18.75, -18.060546875, -17.37109375, -16.681640625, -15.9921875, -15.302734375, -14.61328125, -13.923828125, -13.234375, -12.544921875, -11.85546875, -11.166015625, -10.4765625, -9.787109375, -9.09765625, -8.408203125, -7.71875, -7.029296875, -6.33984375, -5.650390625, -4.9609375, -4.271484375, -3.58203125, -2.892578125, -2.203125, -1.513671875, -0.82421875, -0.134765625, 0.5546875, 1.244140625, 1.93359375, 2.623046875, 3.3125, 4.001953125, 4.69140625, 5.380859375, 6.0703125, 6.759765625, 7.44921875, 8.138671875, 8.828125, 9.517578125, 10.20703125, 10.896484375, 11.5859375, 12.275390625, 12.96484375, 13.654296875, 14.34375, 15.033203125, 15.72265625, 16.412109375, 17.1015625, 17.791015625, 18.48046875, 19.169921875, 19.859375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 13.0, 11.0, 24.0, 33.0, 28.0, 47.0, 50.0, 56.0, 79.0, 89.0, 99.0, 111.0, 73.0, 70.0, 46.0, 28.0, 38.0, 20.0, 14.0, 10.0, 8.0, 8.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.59375, -20.97998046875, -20.3662109375, -19.75244140625, -19.138671875, -18.52490234375, -17.9111328125, -17.29736328125, -16.68359375, -16.06982421875, -15.4560546875, -14.84228515625, -14.228515625, -13.61474609375, -13.0009765625, -12.38720703125, -11.7734375, -11.15966796875, -10.5458984375, -9.93212890625, -9.318359375, -8.70458984375, -8.0908203125, -7.47705078125, -6.86328125, -6.24951171875, -5.6357421875, -5.02197265625, -4.408203125, -3.79443359375, -3.1806640625, -2.56689453125, -1.953125, -1.33935546875, -0.7255859375, -0.11181640625, 0.501953125, 1.11572265625, 1.7294921875, 2.34326171875, 2.95703125, 3.57080078125, 4.1845703125, 4.79833984375, 5.412109375, 6.02587890625, 6.6396484375, 7.25341796875, 7.8671875, 8.48095703125, 9.0947265625, 9.70849609375, 10.322265625, 10.93603515625, 11.5498046875, 12.16357421875, 12.77734375, 13.39111328125, 14.0048828125, 14.61865234375, 15.232421875, 15.84619140625, 16.4599609375, 17.07373046875, 17.6875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 12.0, 19.0, 80.0, 216.0, 488.0, 123.0, 40.0, 7.0, 8.0, 0.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-560.6902465820312, -526.1357421875, -491.5812072753906, -457.02667236328125, -422.47216796875, -387.91766357421875, -353.3631286621094, -318.80859375, -284.25408935546875, -249.69956970214844, -215.14505004882812, -180.5905303955078, -146.0360107421875, -111.48149108886719, -76.92697143554688, -42.37245178222656, -7.81793212890625, 26.736587524414062, 61.291107177734375, 95.84562683105469, 130.400146484375, 164.9546661376953, 199.50918579101562, 234.06370544433594, 268.61822509765625, 303.1727294921875, 337.7272644042969, 372.28179931640625, 406.8363037109375, 441.39080810546875, 475.9453430175781, 510.4998779296875, 545.0543212890625, 579.6088256835938, 614.163330078125, 648.7178955078125, 683.2723999023438, 717.826904296875, 752.3814697265625, 786.9359741210938, 821.490478515625, 856.0449829101562, 890.5994873046875, 925.154052734375, 959.7085571289062, 994.2630615234375, 1028.817626953125, 1063.3720703125, 1097.9266357421875, 1132.481201171875, 1167.03564453125, 1201.5902099609375, 1236.144775390625, 1270.69921875, 1305.2537841796875, 1339.8082275390625, 1374.36279296875, 1408.9173583984375, 1443.4718017578125, 1478.0263671875, 1512.580810546875, 1547.1353759765625, 1581.68994140625, 1616.244384765625, 1650.7989501953125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 2.0, 7.0, 8.0, 6.0, 6.0, 12.0, 4.0, 5.0, 16.0, 12.0, 17.0, 26.0, 23.0, 19.0, 36.0, 36.0, 24.0, 39.0, 82.0, 130.0, 108.0, 65.0, 35.0, 39.0, 25.0, 25.0, 28.0, 23.0, 22.0, 28.0, 22.0, 7.0, 12.0, 10.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-390.56060791015625, -379.00103759765625, -367.4414978027344, -355.8819274902344, -344.3223876953125, -332.7628173828125, -321.2032470703125, -309.6437072753906, -298.08416748046875, -286.52459716796875, -274.9650573730469, -263.4054870605469, -251.845947265625, -240.286376953125, -228.72682189941406, -217.16726684570312, -205.60769653320312, -194.0481414794922, -182.48858642578125, -170.92901611328125, -159.36947631835938, -147.80990600585938, -136.25035095214844, -124.6907958984375, -113.13124084472656, -101.57168579101562, -90.01213073730469, -78.45256805419922, -66.89301300048828, -55.333457946777344, -43.773895263671875, -32.21434020996094, -20.654815673828125, -9.095258712768555, 2.4642982482910156, 14.023857116699219, 25.583412170410156, 37.142967224121094, 48.70252990722656, 60.2620849609375, 71.82164001464844, 83.38119506835938, 94.94075012207031, 106.50031280517578, 118.05986785888672, 129.61941528320312, 141.17898559570312, 152.73854064941406, 164.298095703125, 175.85765075683594, 187.41720581054688, 198.97677612304688, 210.53631591796875, 222.09588623046875, 233.6554412841797, 245.21499633789062, 256.7745361328125, 268.3341064453125, 279.8936462402344, 291.4532165527344, 303.01275634765625, 314.57232666015625, 326.13189697265625, 337.6914367675781, 349.2510070800781]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 14.0, 19.0, 30.0, 30.0, 47.0, 71.0, 107.0, 161.0, 280.0, 541.0, 1002.0, 2429.0, 7090.0, 33662.0, 411115.0, 2818302.0, 846221.0, 56641.0, 10053.0, 3275.0, 1404.0, 727.0, 411.0, 209.0, 140.0, 96.0, 64.0, 38.0, 21.0, 25.0, 15.0, 9.0, 5.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.25, -57.025390625, -54.80078125, -52.576171875, -50.3515625, -48.126953125, -45.90234375, -43.677734375, -41.453125, -39.228515625, -37.00390625, -34.779296875, -32.5546875, -30.330078125, -28.10546875, -25.880859375, -23.65625, -21.431640625, -19.20703125, -16.982421875, -14.7578125, -12.533203125, -10.30859375, -8.083984375, -5.859375, -3.634765625, -1.41015625, 0.814453125, 3.0390625, 5.263671875, 7.48828125, 9.712890625, 11.9375, 14.162109375, 16.38671875, 18.611328125, 20.8359375, 23.060546875, 25.28515625, 27.509765625, 29.734375, 31.958984375, 34.18359375, 36.408203125, 38.6328125, 40.857421875, 43.08203125, 45.306640625, 47.53125, 49.755859375, 51.98046875, 54.205078125, 56.4296875, 58.654296875, 60.87890625, 63.103515625, 65.328125, 67.552734375, 69.77734375, 72.001953125, 74.2265625, 76.451171875, 78.67578125, 80.900390625, 83.125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 12.0, 10.0, 16.0, 18.0, 15.0, 20.0, 15.0, 28.0, 36.0, 43.0, 44.0, 49.0, 43.0, 61.0, 67.0, 52.0, 51.0, 49.0, 47.0, 65.0, 43.0, 33.0, 24.0, 19.0, 22.0, 32.0, 19.0, 16.0, 12.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-33.5, -32.529541015625, -31.55908203125, -30.588623046875, -29.6181640625, -28.647705078125, -27.67724609375, -26.706787109375, -25.736328125, -24.765869140625, -23.79541015625, -22.824951171875, -21.8544921875, -20.884033203125, -19.91357421875, -18.943115234375, -17.97265625, -17.002197265625, -16.03173828125, -15.061279296875, -14.0908203125, -13.120361328125, -12.14990234375, -11.179443359375, -10.208984375, -9.238525390625, -8.26806640625, -7.297607421875, -6.3271484375, -5.356689453125, -4.38623046875, -3.415771484375, -2.4453125, -1.474853515625, -0.50439453125, 0.466064453125, 1.4365234375, 2.406982421875, 3.37744140625, 4.347900390625, 5.318359375, 6.288818359375, 7.25927734375, 8.229736328125, 9.2001953125, 10.170654296875, 11.14111328125, 12.111572265625, 13.08203125, 14.052490234375, 15.02294921875, 15.993408203125, 16.9638671875, 17.934326171875, 18.90478515625, 19.875244140625, 20.845703125, 21.816162109375, 22.78662109375, 23.757080078125, 24.7275390625, 25.697998046875, 26.66845703125, 27.638916015625, 28.609375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 10.0, 11.0, 24.0, 27.0, 49.0, 65.0, 129.0, 188.0, 363.0, 779.0, 2027.0, 9205.0, 436631.0, 3712477.0, 25631.0, 3968.0, 1385.0, 563.0, 299.0, 160.0, 98.0, 60.0, 31.0, 32.0, 15.0, 15.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-187.75, -182.560546875, -177.37109375, -172.181640625, -166.9921875, -161.802734375, -156.61328125, -151.423828125, -146.234375, -141.044921875, -135.85546875, -130.666015625, -125.4765625, -120.287109375, -115.09765625, -109.908203125, -104.71875, -99.529296875, -94.33984375, -89.150390625, -83.9609375, -78.771484375, -73.58203125, -68.392578125, -63.203125, -58.013671875, -52.82421875, -47.634765625, -42.4453125, -37.255859375, -32.06640625, -26.876953125, -21.6875, -16.498046875, -11.30859375, -6.119140625, -0.9296875, 4.259765625, 9.44921875, 14.638671875, 19.828125, 25.017578125, 30.20703125, 35.396484375, 40.5859375, 45.775390625, 50.96484375, 56.154296875, 61.34375, 66.533203125, 71.72265625, 76.912109375, 82.1015625, 87.291015625, 92.48046875, 97.669921875, 102.859375, 108.048828125, 113.23828125, 118.427734375, 123.6171875, 128.806640625, 133.99609375, 139.185546875, 144.375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 11.0, 18.0, 26.0, 45.0, 90.0, 145.0, 226.0, 405.0, 507.0, 665.0, 610.0, 400.0, 313.0, 181.0, 113.0, 87.0, 59.0, 46.0, 20.0, 26.0, 19.0, 16.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.5625, -92.4150390625, -89.267578125, -86.1201171875, -82.97265625, -79.8251953125, -76.677734375, -73.5302734375, -70.3828125, -67.2353515625, -64.087890625, -60.9404296875, -57.79296875, -54.6455078125, -51.498046875, -48.3505859375, -45.203125, -42.0556640625, -38.908203125, -35.7607421875, -32.61328125, -29.4658203125, -26.318359375, -23.1708984375, -20.0234375, -16.8759765625, -13.728515625, -10.5810546875, -7.43359375, -4.2861328125, -1.138671875, 2.0087890625, 5.15625, 8.3037109375, 11.451171875, 14.5986328125, 17.74609375, 20.8935546875, 24.041015625, 27.1884765625, 30.3359375, 33.4833984375, 36.630859375, 39.7783203125, 42.92578125, 46.0732421875, 49.220703125, 52.3681640625, 55.515625, 58.6630859375, 61.810546875, 64.9580078125, 68.10546875, 71.2529296875, 74.400390625, 77.5478515625, 80.6953125, 83.8427734375, 86.990234375, 90.1376953125, 93.28515625, 96.4326171875, 99.580078125, 102.7275390625, 105.875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 15.0, 24.0, 195.0, 584.0, 134.0, 33.0, 13.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2136.615234375, -2025.388427734375, -1914.16162109375, -1802.9349365234375, -1691.7081298828125, -1580.4813232421875, -1469.254638671875, -1358.02783203125, -1246.801025390625, -1135.57421875, -1024.347412109375, -913.1207275390625, -801.8939208984375, -690.6671142578125, -579.4403686523438, -468.213623046875, -356.98681640625, -245.76004028320312, -134.53326416015625, -23.306488037109375, 87.9202880859375, 199.1470947265625, 310.37384033203125, 421.6005859375, 532.827392578125, 644.05419921875, 755.2809448242188, 866.5076904296875, 977.7344970703125, 1088.9613037109375, 1200.18798828125, 1311.414794921875, 1422.6416015625, 1533.868408203125, 1645.09521484375, 1756.3218994140625, 1867.5487060546875, 1978.7755126953125, 2090.002197265625, 2201.22900390625, 2312.455810546875, 2423.6826171875, 2534.909423828125, 2646.13623046875, 2757.36279296875, 2868.58984375, 2979.81640625, 3091.043212890625, 3202.27001953125, 3313.496826171875, 3424.7236328125, 3535.950439453125, 3647.17724609375, 3758.40380859375, 3869.630615234375, 3980.857421875, 4092.084228515625, 4203.31103515625, 4314.53759765625, 4425.7646484375, 4536.9912109375, 4648.21826171875, 4759.44482421875, 4870.671875, 4981.8984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 8.0, 2.0, 6.0, 9.0, 8.0, 10.0, 15.0, 15.0, 23.0, 22.0, 31.0, 34.0, 31.0, 48.0, 49.0, 66.0, 63.0, 77.0, 77.0, 94.0, 56.0, 43.0, 50.0, 25.0, 35.0, 17.0, 21.0, 16.0, 10.0, 12.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-747.901611328125, -723.1615600585938, -698.4215698242188, -673.6815185546875, -648.9414672851562, -624.201416015625, -599.46142578125, -574.7213745117188, -549.9813232421875, -525.2412719726562, -500.5012512207031, -475.76123046875, -451.02117919921875, -426.2811584472656, -401.5411376953125, -376.80108642578125, -352.0610656738281, -327.321044921875, -302.58099365234375, -277.8409729003906, -253.10092163085938, -228.36090087890625, -203.62086486816406, -178.88082885742188, -154.1407928466797, -129.4007568359375, -104.66072082519531, -79.92069244384766, -55.18065643310547, -30.44062042236328, -5.700592041015625, 19.039443969726562, 43.77947998046875, 68.51951599121094, 93.25955200195312, 117.99958038330078, 142.7396240234375, 167.47964477539062, 192.2196807861328, 216.959716796875, 241.6997528076172, 266.4397888183594, 291.1798095703125, 315.91986083984375, 340.6598815917969, 365.3999328613281, 390.13995361328125, 414.8800048828125, 439.6200256347656, 464.36004638671875, 489.10009765625, 513.8401489257812, 538.5801391601562, 563.3201904296875, 588.0602416992188, 612.80029296875, 637.540283203125, 662.2803344726562, 687.0203247070312, 711.7603759765625, 736.5004272460938, 761.240478515625, 785.98046875, 810.7205200195312, 835.4605712890625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 10.0, 13.0, 12.0, 13.0, 18.0, 30.0, 40.0, 63.0, 101.0, 150.0, 230.0, 321.0, 592.0, 1012.0, 2227.0, 5333.0, 14673.0, 50348.0, 245975.0, 589773.0, 97276.0, 25253.0, 8208.0, 3413.0, 1493.0, 780.0, 453.0, 240.0, 153.0, 118.0, 69.0, 50.0, 32.0, 16.0, 10.0, 10.0, 10.0, 8.0, 9.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-58.15625, -56.2939453125, -54.431640625, -52.5693359375, -50.70703125, -48.8447265625, -46.982421875, -45.1201171875, -43.2578125, -41.3955078125, -39.533203125, -37.6708984375, -35.80859375, -33.9462890625, -32.083984375, -30.2216796875, -28.359375, -26.4970703125, -24.634765625, -22.7724609375, -20.91015625, -19.0478515625, -17.185546875, -15.3232421875, -13.4609375, -11.5986328125, -9.736328125, -7.8740234375, -6.01171875, -4.1494140625, -2.287109375, -0.4248046875, 1.4375, 3.2998046875, 5.162109375, 7.0244140625, 8.88671875, 10.7490234375, 12.611328125, 14.4736328125, 16.3359375, 18.1982421875, 20.060546875, 21.9228515625, 23.78515625, 25.6474609375, 27.509765625, 29.3720703125, 31.234375, 33.0966796875, 34.958984375, 36.8212890625, 38.68359375, 40.5458984375, 42.408203125, 44.2705078125, 46.1328125, 47.9951171875, 49.857421875, 51.7197265625, 53.58203125, 55.4443359375, 57.306640625, 59.1689453125, 61.03125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 17.0, 19.0, 22.0, 27.0, 33.0, 50.0, 73.0, 58.0, 88.0, 87.0, 88.0, 77.0, 83.0, 74.0, 58.0, 36.0, 29.0, 19.0, 20.0, 11.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.125, -57.2158203125, -55.306640625, -53.3974609375, -51.48828125, -49.5791015625, -47.669921875, -45.7607421875, -43.8515625, -41.9423828125, -40.033203125, -38.1240234375, -36.21484375, -34.3056640625, -32.396484375, -30.4873046875, -28.578125, -26.6689453125, -24.759765625, -22.8505859375, -20.94140625, -19.0322265625, -17.123046875, -15.2138671875, -13.3046875, -11.3955078125, -9.486328125, -7.5771484375, -5.66796875, -3.7587890625, -1.849609375, 0.0595703125, 1.96875, 3.8779296875, 5.787109375, 7.6962890625, 9.60546875, 11.5146484375, 13.423828125, 15.3330078125, 17.2421875, 19.1513671875, 21.060546875, 22.9697265625, 24.87890625, 26.7880859375, 28.697265625, 30.6064453125, 32.515625, 34.4248046875, 36.333984375, 38.2431640625, 40.15234375, 42.0615234375, 43.970703125, 45.8798828125, 47.7890625, 49.6982421875, 51.607421875, 53.5166015625, 55.42578125, 57.3349609375, 59.244140625, 61.1533203125, 63.0625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 5.0, 12.0, 30.0, 43.0, 59.0, 91.0, 148.0, 244.0, 527.0, 1061.0, 3726.0, 33186.0, 942593.0, 59119.0, 5168.0, 1308.0, 552.0, 272.0, 152.0, 86.0, 55.0, 29.0, 35.0, 15.0, 6.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.75, -110.3642578125, -106.978515625, -103.5927734375, -100.20703125, -96.8212890625, -93.435546875, -90.0498046875, -86.6640625, -83.2783203125, -79.892578125, -76.5068359375, -73.12109375, -69.7353515625, -66.349609375, -62.9638671875, -59.578125, -56.1923828125, -52.806640625, -49.4208984375, -46.03515625, -42.6494140625, -39.263671875, -35.8779296875, -32.4921875, -29.1064453125, -25.720703125, -22.3349609375, -18.94921875, -15.5634765625, -12.177734375, -8.7919921875, -5.40625, -2.0205078125, 1.365234375, 4.7509765625, 8.13671875, 11.5224609375, 14.908203125, 18.2939453125, 21.6796875, 25.0654296875, 28.451171875, 31.8369140625, 35.22265625, 38.6083984375, 41.994140625, 45.3798828125, 48.765625, 52.1513671875, 55.537109375, 58.9228515625, 62.30859375, 65.6943359375, 69.080078125, 72.4658203125, 75.8515625, 79.2373046875, 82.623046875, 86.0087890625, 89.39453125, 92.7802734375, 96.166015625, 99.5517578125, 102.9375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 13.0, 15.0, 13.0, 15.0, 26.0, 48.0, 37.0, 54.0, 59.0, 93.0, 95.0, 100.0, 108.0, 77.0, 61.0, 42.0, 27.0, 26.0, 24.0, 15.0, 9.0, 10.0, 5.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-239.75, -233.109375, -226.46875, -219.828125, -213.1875, -206.546875, -199.90625, -193.265625, -186.625, -179.984375, -173.34375, -166.703125, -160.0625, -153.421875, -146.78125, -140.140625, -133.5, -126.859375, -120.21875, -113.578125, -106.9375, -100.296875, -93.65625, -87.015625, -80.375, -73.734375, -67.09375, -60.453125, -53.8125, -47.171875, -40.53125, -33.890625, -27.25, -20.609375, -13.96875, -7.328125, -0.6875, 5.953125, 12.59375, 19.234375, 25.875, 32.515625, 39.15625, 45.796875, 52.4375, 59.078125, 65.71875, 72.359375, 79.0, 85.640625, 92.28125, 98.921875, 105.5625, 112.203125, 118.84375, 125.484375, 132.125, 138.765625, 145.40625, 152.046875, 158.6875, 165.328125, 171.96875, 178.609375, 185.25]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 12.0, 8.0, 10.0, 13.0, 11.0, 14.0, 12.0, 20.0, 21.0, 29.0, 41.0, 75.0, 127.0, 230.0, 544.0, 1549.0, 6642.0, 59734.0, 939250.0, 33294.0, 4628.0, 1236.0, 434.0, 209.0, 129.0, 63.0, 43.0, 45.0, 20.0, 18.0, 14.0, 10.0, 11.0, 9.0, 8.0, 9.0, 0.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.703125, -24.933349609375, -24.16357421875, -23.393798828125, -22.6240234375, -21.854248046875, -21.08447265625, -20.314697265625, -19.544921875, -18.775146484375, -18.00537109375, -17.235595703125, -16.4658203125, -15.696044921875, -14.92626953125, -14.156494140625, -13.38671875, -12.616943359375, -11.84716796875, -11.077392578125, -10.3076171875, -9.537841796875, -8.76806640625, -7.998291015625, -7.228515625, -6.458740234375, -5.68896484375, -4.919189453125, -4.1494140625, -3.379638671875, -2.60986328125, -1.840087890625, -1.0703125, -0.300537109375, 0.46923828125, 1.239013671875, 2.0087890625, 2.778564453125, 3.54833984375, 4.318115234375, 5.087890625, 5.857666015625, 6.62744140625, 7.397216796875, 8.1669921875, 8.936767578125, 9.70654296875, 10.476318359375, 11.24609375, 12.015869140625, 12.78564453125, 13.555419921875, 14.3251953125, 15.094970703125, 15.86474609375, 16.634521484375, 17.404296875, 18.174072265625, 18.94384765625, 19.713623046875, 20.4833984375, 21.253173828125, 22.02294921875, 22.792724609375, 23.5625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 11.0, 6.0, 14.0, 10.0, 19.0, 27.0, 30.0, 50.0, 76.0, 95.0, 139.0, 119.0, 105.0, 80.0, 42.0, 36.0, 24.0, 18.0, 17.0, 10.0, 12.0, 7.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00357818603515625, -0.0034590959548950195, -0.003340005874633789, -0.0032209157943725586, -0.003101825714111328, -0.0029827356338500977, -0.002863645553588867, -0.0027445554733276367, -0.0026254653930664062, -0.0025063753128051758, -0.0023872852325439453, -0.002268195152282715, -0.0021491050720214844, -0.002030014991760254, -0.0019109249114990234, -0.001791834831237793, -0.0016727447509765625, -0.001553654670715332, -0.0014345645904541016, -0.001315474510192871, -0.0011963844299316406, -0.0010772943496704102, -0.0009582042694091797, -0.0008391141891479492, -0.0007200241088867188, -0.0006009340286254883, -0.0004818439483642578, -0.00036275386810302734, -0.00024366378784179688, -0.0001245737075805664, -5.4836273193359375e-06, 0.00011360645294189453, 0.000232696533203125, 0.00035178661346435547, 0.00047087669372558594, 0.0005899667739868164, 0.0007090568542480469, 0.0008281469345092773, 0.0009472370147705078, 0.0010663270950317383, 0.0011854171752929688, 0.0013045072555541992, 0.0014235973358154297, 0.0015426874160766602, 0.0016617774963378906, 0.001780867576599121, 0.0018999576568603516, 0.002019047737121582, 0.0021381378173828125, 0.002257227897644043, 0.0023763179779052734, 0.002495408058166504, 0.0026144981384277344, 0.002733588218688965, 0.0028526782989501953, 0.0029717683792114258, 0.0030908584594726562, 0.0032099485397338867, 0.003329038619995117, 0.0034481287002563477, 0.003567218780517578, 0.0036863088607788086, 0.003805398941040039, 0.0039244890213012695, 0.0040435791015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 5.0, 8.0, 17.0, 23.0, 39.0, 45.0, 84.0, 185.0, 392.0, 1218.0, 5879.0, 59354.0, 943852.0, 31844.0, 4005.0, 952.0, 307.0, 159.0, 65.0, 42.0, 24.0, 13.0, 7.0, 13.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.859375, -28.162109375, -27.46484375, -26.767578125, -26.0703125, -25.373046875, -24.67578125, -23.978515625, -23.28125, -22.583984375, -21.88671875, -21.189453125, -20.4921875, -19.794921875, -19.09765625, -18.400390625, -17.703125, -17.005859375, -16.30859375, -15.611328125, -14.9140625, -14.216796875, -13.51953125, -12.822265625, -12.125, -11.427734375, -10.73046875, -10.033203125, -9.3359375, -8.638671875, -7.94140625, -7.244140625, -6.546875, -5.849609375, -5.15234375, -4.455078125, -3.7578125, -3.060546875, -2.36328125, -1.666015625, -0.96875, -0.271484375, 0.42578125, 1.123046875, 1.8203125, 2.517578125, 3.21484375, 3.912109375, 4.609375, 5.306640625, 6.00390625, 6.701171875, 7.3984375, 8.095703125, 8.79296875, 9.490234375, 10.1875, 10.884765625, 11.58203125, 12.279296875, 12.9765625, 13.673828125, 14.37109375, 15.068359375, 15.765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 7.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 12.0, 15.0, 28.0, 34.0, 63.0, 109.0, 112.0, 143.0, 114.0, 110.0, 79.0, 35.0, 30.0, 22.0, 12.0, 14.0, 8.0, 6.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.570556640625, -16.93798828125, -16.305419921875, -15.6728515625, -15.040283203125, -14.40771484375, -13.775146484375, -13.142578125, -12.510009765625, -11.87744140625, -11.244873046875, -10.6123046875, -9.979736328125, -9.34716796875, -8.714599609375, -8.08203125, -7.449462890625, -6.81689453125, -6.184326171875, -5.5517578125, -4.919189453125, -4.28662109375, -3.654052734375, -3.021484375, -2.388916015625, -1.75634765625, -1.123779296875, -0.4912109375, 0.141357421875, 0.77392578125, 1.406494140625, 2.0390625, 2.671630859375, 3.30419921875, 3.936767578125, 4.5693359375, 5.201904296875, 5.83447265625, 6.467041015625, 7.099609375, 7.732177734375, 8.36474609375, 8.997314453125, 9.6298828125, 10.262451171875, 10.89501953125, 11.527587890625, 12.16015625, 12.792724609375, 13.42529296875, 14.057861328125, 14.6904296875, 15.322998046875, 15.95556640625, 16.588134765625, 17.220703125, 17.853271484375, 18.48583984375, 19.118408203125, 19.7509765625, 20.383544921875, 21.01611328125, 21.648681640625, 22.28125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 6.0, 10.0, 13.0, 26.0, 72.0, 172.0, 558.0, 81.0, 30.0, 14.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1120.3734130859375, -1093.8857421875, -1067.3980712890625, -1040.910400390625, -1014.4226684570312, -987.9349365234375, -961.447265625, -934.9595947265625, -908.4718627929688, -881.9841918945312, -855.4964599609375, -829.0087890625, -802.5211181640625, -776.0333862304688, -749.5457153320312, -723.0579833984375, -696.5703125, -670.0826416015625, -643.5949096679688, -617.1072387695312, -590.6195678710938, -564.1318359375, -537.6441650390625, -511.1564636230469, -484.6688232421875, -458.1811218261719, -431.6934509277344, -405.20574951171875, -378.7180480957031, -352.2303466796875, -325.74267578125, -299.2549743652344, -272.76727294921875, -246.2795867919922, -219.79188537597656, -193.30419921875, -166.81649780273438, -140.3288116455078, -113.84112548828125, -87.35342407226562, -60.86573791503906, -34.37804412841797, -7.890354156494141, 18.597335815429688, 45.08502960205078, 71.57272338867188, 98.06040954589844, 124.54811096191406, 151.03579711914062, 177.5234832763672, 204.0111846923828, 230.49887084960938, 256.986572265625, 283.4742431640625, 309.9619445800781, 336.44964599609375, 362.93731689453125, 389.4250183105469, 415.9126892089844, 442.400390625, 468.8880920410156, 495.37579345703125, 521.8634643554688, 548.3511962890625, 574.8388671875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 16.0, 13.0, 25.0, 21.0, 33.0, 29.0, 45.0, 119.0, 290.0, 155.0, 49.0, 39.0, 36.0, 25.0, 22.0, 17.0, 16.0, 7.0, 7.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-667.7740478515625, -649.9910278320312, -632.2080078125, -614.4249267578125, -596.6419067382812, -578.85888671875, -561.0758056640625, -543.2927856445312, -525.509765625, -507.72674560546875, -489.9436950683594, -472.16064453125, -454.37762451171875, -436.5946044921875, -418.8115539550781, -401.02850341796875, -383.2454833984375, -365.46246337890625, -347.6794128417969, -329.8963623046875, -312.11334228515625, -294.330322265625, -276.5472717285156, -258.76422119140625, -240.981201171875, -223.1981658935547, -205.41513061523438, -187.63209533691406, -169.84906005859375, -152.06602478027344, -134.28298950195312, -116.49995422363281, -98.71685791015625, -80.93382263183594, -63.150787353515625, -45.36775207519531, -27.584716796875, -9.801681518554688, 7.981353759765625, 25.764389038085938, 43.54742431640625, 61.33045959472656, 79.11349487304688, 96.89653015136719, 114.6795654296875, 132.4626007080078, 150.24563598632812, 168.02867126464844, 185.81170654296875, 203.59474182128906, 221.37777709960938, 239.1608123779297, 256.94384765625, 274.72686767578125, 292.5099182128906, 310.29296875, 328.07598876953125, 345.8590087890625, 363.6420593261719, 381.42510986328125, 399.2081298828125, 416.99114990234375, 434.7742004394531, 452.5572509765625, 470.34027099609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 12.0, 11.0, 13.0, 15.0, 18.0, 18.0, 24.0, 45.0, 22.0, 68.0, 105.0, 267.0, 87.0, 46.0, 40.0, 29.0, 24.0, 32.0, 19.0, 28.0, 14.0, 9.0, 12.0, 10.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-48.09375, -46.904541015625, -45.71533203125, -44.526123046875, -43.3369140625, -42.147705078125, -40.95849609375, -39.769287109375, -38.580078125, -37.390869140625, -36.20166015625, -35.012451171875, -33.8232421875, -32.634033203125, -31.44482421875, -30.255615234375, -29.06640625, -27.877197265625, -26.68798828125, -25.498779296875, -24.3095703125, -23.120361328125, -21.93115234375, -20.741943359375, -19.552734375, -18.363525390625, -17.17431640625, -15.985107421875, -14.7958984375, -13.606689453125, -12.41748046875, -11.228271484375, -10.0390625, -8.849853515625, -7.66064453125, -6.471435546875, -5.2822265625, -4.093017578125, -2.90380859375, -1.714599609375, -0.525390625, 0.663818359375, 1.85302734375, 3.042236328125, 4.2314453125, 5.420654296875, 6.60986328125, 7.799072265625, 8.98828125, 10.177490234375, 11.36669921875, 12.555908203125, 13.7451171875, 14.934326171875, 16.12353515625, 17.312744140625, 18.501953125, 19.691162109375, 20.88037109375, 22.069580078125, 23.2587890625, 24.447998046875, 25.63720703125, 26.826416015625, 28.015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 7.0, 6.0, 10.0, 9.0, 21.0, 35.0, 33.0, 61.0, 204.0, 632.0, 10571.0, 8372808.0, 3418.0, 407.0, 149.0, 59.0, 29.0, 21.0, 13.0, 17.0, 14.0, 18.0, 19.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-661.8748168945312, -638.5213012695312, -615.167724609375, -591.814208984375, -568.4606323242188, -545.1071166992188, -521.7535400390625, -498.4000244140625, -475.0464782714844, -451.69293212890625, -428.3393859863281, -404.98583984375, -381.63232421875, -358.27874755859375, -334.92523193359375, -311.5716857910156, -288.2181396484375, -264.8645935058594, -241.51104736328125, -218.1575164794922, -194.80397033691406, -171.45042419433594, -148.09689331054688, -124.74334716796875, -101.38980102539062, -78.0362548828125, -54.682716369628906, -31.329177856445312, -7.9756317138671875, 15.377914428710938, 38.7314453125, 62.084991455078125, 85.4385986328125, 108.79214477539062, 132.14569091796875, 155.4992218017578, 178.85276794433594, 202.20631408691406, 225.55984497070312, 248.91339111328125, 272.2669372558594, 295.6204833984375, 318.9740295410156, 342.32757568359375, 365.68109130859375, 389.03466796875, 412.38818359375, 435.7417297363281, 459.09527587890625, 482.4488220214844, 505.8023681640625, 529.1558837890625, 552.5094604492188, 575.8629760742188, 599.216552734375, 622.570068359375, 645.923583984375, 669.277099609375, 692.6306762695312, 715.9841918945312, 739.3377685546875, 762.6912841796875, 786.0447998046875, 809.3983764648438, 832.751953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 6.0, 7.0, 11.0, 6.0, 5.0, 5.0, 6.0, 9.0, 7.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-950.4044799804688, -926.173583984375, -901.942626953125, -877.7117309570312, -853.4808349609375, -829.2498779296875, -805.0189819335938, -780.7880859375, -756.55712890625, -732.3262329101562, -708.0952758789062, -683.8643798828125, -659.6334228515625, -635.4025268554688, -611.171630859375, -586.940673828125, -562.7097778320312, -538.4788818359375, -514.2479248046875, -490.01702880859375, -465.7861022949219, -441.55517578125, -417.32427978515625, -393.0933532714844, -368.8624267578125, -344.6315002441406, -320.40057373046875, -296.169677734375, -271.9387512207031, -247.70782470703125, -223.47691345214844, -199.24600219726562, -175.0150146484375, -150.78408813476562, -126.55317687988281, -102.32225799560547, -78.09133911132812, -53.86042022705078, -29.629501342773438, -5.398590087890625, 18.83233642578125, 43.063255310058594, 67.29417419433594, 91.52509307861328, 115.75601196289062, 139.9869384765625, 164.2178497314453, 188.44876098632812, 212.6796875, 236.91061401367188, 261.14154052734375, 285.3724365234375, 309.6033630371094, 333.83428955078125, 358.065185546875, 382.2961120605469, 406.52703857421875, 430.7579650878906, 454.9888916015625, 479.21978759765625, 503.4507141113281, 527.681640625, 551.9125366210938, 576.1434326171875, 600.3743896484375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 5.0, 8.0, 9.0, 12.0, 14.0, 17.0, 18.0, 35.0, 42.0, 58.0, 82.0, 93.0, 138.0, 195.0, 324.0, 579.0, 995.0, 2204.0, 5244.0, 14364.0, 41410.0, 128561.0, 204361.0, 83145.0, 26322.0, 9231.0, 3492.0, 1463.0, 721.0, 405.0, 200.0, 121.0, 109.0, 67.0, 51.0, 41.0, 30.0, 20.0, 14.0, 15.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-241.625, -234.37109375, -227.1171875, -219.86328125, -212.609375, -205.35546875, -198.1015625, -190.84765625, -183.59375, -176.33984375, -169.0859375, -161.83203125, -154.578125, -147.32421875, -140.0703125, -132.81640625, -125.5625, -118.30859375, -111.0546875, -103.80078125, -96.546875, -89.29296875, -82.0390625, -74.78515625, -67.53125, -60.27734375, -53.0234375, -45.76953125, -38.515625, -31.26171875, -24.0078125, -16.75390625, -9.5, -2.24609375, 5.0078125, 12.26171875, 19.515625, 26.76953125, 34.0234375, 41.27734375, 48.53125, 55.78515625, 63.0390625, 70.29296875, 77.546875, 84.80078125, 92.0546875, 99.30859375, 106.5625, 113.81640625, 121.0703125, 128.32421875, 135.578125, 142.83203125, 150.0859375, 157.33984375, 164.59375, 171.84765625, 179.1015625, 186.35546875, 193.609375, 200.86328125, 208.1171875, 215.37109375, 222.625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 14.0, 21.0, 17.0, 32.0, 43.0, 36.0, 49.0, 74.0, 96.0, 91.0, 91.0, 89.0, 96.0, 70.0, 32.0, 38.0, 25.0, 19.0, 12.0, 9.0, 8.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.875, -55.96484375, -54.0546875, -52.14453125, -50.234375, -48.32421875, -46.4140625, -44.50390625, -42.59375, -40.68359375, -38.7734375, -36.86328125, -34.953125, -33.04296875, -31.1328125, -29.22265625, -27.3125, -25.40234375, -23.4921875, -21.58203125, -19.671875, -17.76171875, -15.8515625, -13.94140625, -12.03125, -10.12109375, -8.2109375, -6.30078125, -4.390625, -2.48046875, -0.5703125, 1.33984375, 3.25, 5.16015625, 7.0703125, 8.98046875, 10.890625, 12.80078125, 14.7109375, 16.62109375, 18.53125, 20.44140625, 22.3515625, 24.26171875, 26.171875, 28.08203125, 29.9921875, 31.90234375, 33.8125, 35.72265625, 37.6328125, 39.54296875, 41.453125, 43.36328125, 45.2734375, 47.18359375, 49.09375, 51.00390625, 52.9140625, 54.82421875, 56.734375, 58.64453125, 60.5546875, 62.46484375, 64.375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 5.0, 12.0, 18.0, 53.0, 128.0, 117.0, 79.0, 21.0, 19.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.38316345214844, -130.05235290527344, -116.7215576171875, -103.3907470703125, -90.05994415283203, -76.72914123535156, -63.39833068847656, -50.067527770996094, -36.736724853515625, -23.405920028686523, -10.075115203857422, 3.2556915283203125, 16.58649444580078, 29.91729736328125, 43.24810791015625, 56.57891082763672, 69.90971374511719, 83.24051666259766, 96.57131958007812, 109.90213012695312, 123.2329330444336, 136.56373596191406, 149.89454650878906, 163.225341796875, 176.55615234375, 189.886962890625, 203.21775817871094, 216.54856872558594, 229.87936401367188, 243.21017456054688, 256.5409851074219, 269.8717956542969, 283.20257568359375, 296.53338623046875, 309.86419677734375, 323.19500732421875, 336.5257873535156, 349.8565979003906, 363.1874084472656, 376.5182189941406, 389.8489990234375, 403.1798095703125, 416.5106201171875, 429.8414306640625, 443.1722106933594, 456.5030212402344, 469.8338317871094, 483.1646423339844, 496.4954528808594, 509.8262634277344, 523.1570434570312, 536.4878540039062, 549.8186645507812, 563.1494750976562, 576.4802856445312, 589.8110961914062, 603.1419067382812, 616.4727172851562, 629.8035278320312, 643.1343383789062, 656.4651489257812, 669.7958984375, 683.126708984375, 696.45751953125, 709.788330078125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 4.0, 11.0, 8.0, 13.0, 26.0, 93.0, 106.0, 118.0, 43.0, 11.0, 15.0, 7.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-477.7574157714844, -465.9818115234375, -454.2061767578125, -442.4305419921875, -430.6549377441406, -418.87933349609375, -407.10369873046875, -395.32806396484375, -383.5524597167969, -371.77685546875, -360.001220703125, -348.2255859375, -336.4499816894531, -324.67437744140625, -312.89874267578125, -301.12310791015625, -289.3475036621094, -277.5718994140625, -265.7962646484375, -254.02064514160156, -242.24502563476562, -230.4694061279297, -218.69378662109375, -206.9181671142578, -195.14254760742188, -183.36692810058594, -171.59130859375, -159.81568908691406, -148.04006958007812, -136.2644500732422, -124.48883056640625, -112.71321105957031, -100.93759155273438, -89.16197204589844, -77.3863525390625, -65.61073303222656, -53.835113525390625, -42.05949401855469, -30.28387451171875, -18.508255004882812, -6.732635498046875, 5.0429840087890625, 16.818603515625, 28.594223022460938, 40.369842529296875, 52.14546203613281, 63.92108154296875, 75.69670104980469, 87.47232055664062, 99.24794006347656, 111.0235595703125, 122.79917907714844, 134.57479858398438, 146.3504180908203, 158.12603759765625, 169.9016571044922, 181.67727661132812, 193.45289611816406, 205.228515625, 217.00413513183594, 228.77975463867188, 240.5553741455078, 252.33099365234375, 264.10662841796875, 275.8822326660156]}, "eval/loss": 6.7275872230529785, "eval/wer": 1.4950096235887056, "eval/runtime": 1512.5692, "eval/samples_per_second": 1.747, "eval/steps_per_second": 0.437} \ No newline at end of file